You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
614 lines
18 KiB
Fortran
614 lines
18 KiB
Fortran
!
|
|
! Parallel Sparse BLAS version 3.5
|
|
! (C) Copyright 2006-2018
|
|
! Salvatore Filippone
|
|
! Alfredo Buttari
|
|
!
|
|
! Redistribution and use in source and binary forms, with or without
|
|
! modification, are permitted provided that the following conditions
|
|
! are met:
|
|
! 1. Redistributions of source code must retain the above copyright
|
|
! notice, this list of conditions and the following disclaimer.
|
|
! 2. Redistributions in binary form must reproduce the above copyright
|
|
! notice, this list of conditions, and the following disclaimer in the
|
|
! documentation and/or other materials provided with the distribution.
|
|
! 3. The name of the PSBLAS group or the names of its contributors may
|
|
! not be used to endorse or promote products derived from this
|
|
! software without specific written permission.
|
|
!
|
|
! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
! ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
|
|
! TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
! PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE PSBLAS GROUP OR ITS CONTRIBUTORS
|
|
! BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
! CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
! SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
! INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
! CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
! ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
! POSSIBILITY OF SUCH DAMAGE.
|
|
!
|
|
!
|
|
!
|
|
!
|
|
module psb_hash_mod
|
|
use psb_const_mod
|
|
use psb_desc_const_mod
|
|
use psb_cbind_const_mod
|
|
!> \class psb_hash_mod
|
|
!! \brief Simple hash module for storing integer keys.
|
|
!!
|
|
!! This module implements a very simple minded hash table.
|
|
!! The hash is based on the idea of open addressing with double hashing;
|
|
!! the primary hash function h1(K) is simply the remainder modulo 2^N, while
|
|
!! the secondary hash function is 1 if H1(k) == 0, otherwise IOR((2^N-H1(k)),1)
|
|
!! (See Knuth: TAOCP, Vol. 3, sec. 6.4)
|
|
!!
|
|
!! These hash functions are not very smart; however they are very simple and fast.
|
|
!! The intended usage of this hash table is to store indices of halo points, which
|
|
!! are supposed to be few compared to the internal indices
|
|
!! (which are stored elsewhere).
|
|
!! Therefore, either the table has a very low occupancy, and this scheme will work,
|
|
!! or we have lots more to worry about in parallel performance than the efficiency
|
|
!! of this hashing scheme.
|
|
!!
|
|
!!
|
|
! For us a hash is a Nx2 table.
|
|
! Note: we are assuming that the keys are positive numbers.
|
|
! Allocatable scalars would be a nice solution...
|
|
!
|
|
type psb_hash_type
|
|
integer(psb_ipk_) :: nbits, hsize, hmask, nk
|
|
integer(psb_lpk_), allocatable :: table(:,:)
|
|
integer(psb_lpk_) :: nsrch, nacc
|
|
end type psb_hash_type
|
|
|
|
|
|
integer(psb_ipk_), parameter :: HashOK=0
|
|
integer(psb_ipk_), parameter :: HashDuplicate = 123
|
|
integer(psb_ipk_), parameter :: HashOutOfMemory=-512
|
|
integer(psb_ipk_), parameter :: HashFreeEntry = -1
|
|
integer(psb_ipk_), parameter :: HashNotFound = -256
|
|
|
|
interface psb_hashval
|
|
#if defined(IPK4)
|
|
function psb_c_hashval_32(key) bind(c) result(res)
|
|
import psb_c_ipk_
|
|
implicit none
|
|
integer(psb_c_ipk_), value :: key
|
|
integer(psb_c_ipk_) :: res
|
|
end function psb_c_hashval_32
|
|
#endif
|
|
#if defined(IPK4) && defined(LPK8)
|
|
function psb_c_hashval_64_32(key) bind(c) result(res)
|
|
import psb_c_ipk_, psb_c_lpk_
|
|
implicit none
|
|
integer(psb_c_lpk_), value :: key
|
|
integer(psb_c_ipk_) :: res
|
|
end function psb_c_hashval_64_32
|
|
#endif
|
|
#if defined(IPK8)
|
|
function psb_c_hashval_64(key) bind(c) result(res)
|
|
import psb_c_ipk_
|
|
implicit none
|
|
integer(psb_c_ipk_), value :: key
|
|
integer(psb_c_ipk_) :: res
|
|
end function psb_c_hashval_64
|
|
#endif
|
|
end interface psb_hashval
|
|
|
|
|
|
interface psb_hash_init
|
|
module procedure psb_hash_init_lv, psb_hash_init_ln
|
|
end interface psb_hash_init
|
|
|
|
interface psb_sizeof
|
|
module procedure psb_sizeof_hash_type
|
|
end interface
|
|
|
|
|
|
interface psb_hash_searchinskey
|
|
module procedure psb_hash_lsearchinskey
|
|
end interface psb_hash_searchinskey
|
|
|
|
interface psb_hash_searchkey
|
|
module procedure psb_hash_lsearchkey
|
|
end interface psb_hash_searchkey
|
|
|
|
#if defined(IPK4) && defined(LPK8)
|
|
interface psb_hash_init
|
|
module procedure psb_hash_init_v, psb_hash_init_n
|
|
end interface
|
|
|
|
interface psb_hash_searchinskey
|
|
module procedure psb_hash_isearchinskey
|
|
end interface psb_hash_searchinskey
|
|
|
|
interface psb_hash_searchkey
|
|
module procedure psb_hash_isearchkey
|
|
end interface psb_hash_searchkey
|
|
#endif
|
|
|
|
interface psb_move_alloc
|
|
module procedure HashTransfer
|
|
end interface
|
|
|
|
interface psb_hash_copy
|
|
module procedure HashCopy
|
|
end interface
|
|
|
|
interface psb_free
|
|
module procedure HashFree
|
|
end interface
|
|
|
|
|
|
contains
|
|
|
|
function psb_Sizeof_hash_type(hash) result(val)
|
|
type(psb_hash_type) :: hash
|
|
integer(psb_epk_) :: val
|
|
val = 4*psb_sizeof_ip + 2*psb_sizeof_lp
|
|
if (allocated(hash%table)) &
|
|
& val = val + psb_sizeof_lp * size(hash%table)
|
|
|
|
end function psb_Sizeof_hash_type
|
|
|
|
function psb_hash_avg_acc(hash)
|
|
type(psb_hash_type), intent(in) :: hash
|
|
real(psb_dpk_) :: psb_hash_avg_acc
|
|
|
|
psb_hash_avg_acc = dble(hash%nacc)/dble(hash%nsrch)
|
|
end function psb_hash_avg_acc
|
|
|
|
subroutine HashFree(hashin,info)
|
|
use psb_realloc_mod
|
|
type(psb_hash_type) :: hashin
|
|
integer(psb_ipk_) :: info
|
|
|
|
info = psb_success_
|
|
if (allocated(hashin%table)) then
|
|
deallocate(hashin%table,stat=info)
|
|
end if
|
|
hashin%nbits = 0
|
|
hashin%hsize = 0
|
|
hashin%hmask = 0
|
|
hashin%nk = 0
|
|
end subroutine HashFree
|
|
|
|
subroutine HashTransfer(hashin,hashout,info)
|
|
use psb_realloc_mod
|
|
type(psb_hash_type) :: hashin
|
|
type(psb_hash_type) :: hashout
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
info = HashOk
|
|
hashout%nbits = hashin%nbits
|
|
hashout%hsize = hashin%hsize
|
|
hashout%hmask = hashin%hmask
|
|
hashout%nk = hashin%nk
|
|
hashout%nsrch = hashin%nsrch
|
|
hashout%nacc = hashin%nacc
|
|
call psb_move_alloc(hashin%table, hashout%table,info)
|
|
|
|
end subroutine HashTransfer
|
|
|
|
subroutine HashCopy(hashin,hashout,info)
|
|
use psb_realloc_mod
|
|
type(psb_hash_type) :: hashin
|
|
type(psb_hash_type) :: hashout
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
info = HashOk
|
|
hashout%nbits = hashin%nbits
|
|
hashout%hsize = hashin%hsize
|
|
hashout%hmask = hashin%hmask
|
|
hashout%nk = hashin%nk
|
|
hashout%nsrch = hashin%nsrch
|
|
hashout%nacc = hashin%nacc
|
|
call psb_safe_ab_cpy(hashin%table, hashout%table,info)
|
|
|
|
end subroutine HashCopy
|
|
|
|
subroutine CloneHashTable(hashin,hashout,info)
|
|
type(psb_hash_type), pointer :: hashin
|
|
type(psb_hash_type), pointer :: hashout
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
if (associated(hashout)) then
|
|
deallocate(hashout,stat=info)
|
|
!if (info /= psb_success_) return
|
|
end if
|
|
if (associated(hashin)) then
|
|
allocate(hashout,stat=info)
|
|
if (info /= psb_success_) return
|
|
call HashCopy(hashin,hashout,info)
|
|
end if
|
|
|
|
end subroutine CloneHashTable
|
|
|
|
subroutine psb_hash_init_v(v,hash,info)
|
|
integer(psb_ipk_), intent(in) :: v(:)
|
|
type(psb_hash_type), intent(out) :: hash
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
integer(psb_ipk_) :: i,j,nbits, nv
|
|
|
|
info = psb_success_
|
|
nv = size(v)
|
|
call psb_hash_init(nv,hash,info)
|
|
if (info /= psb_success_) return
|
|
do i=1,nv
|
|
call psb_hash_searchinskey(v(i),j,i,hash,info)
|
|
if ((j /= i).or.(info /= HashOK)) then
|
|
write(psb_err_unit,*) 'Error from hash_ins',i,v(i),j,info
|
|
info = HashNotFound
|
|
return
|
|
end if
|
|
end do
|
|
end subroutine psb_hash_init_v
|
|
|
|
subroutine psb_hash_init_lv(v,hash,info)
|
|
integer(psb_lpk_), intent(in) :: v(:)
|
|
type(psb_hash_type), intent(out) :: hash
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
integer(psb_lpk_) :: i,j, nv
|
|
|
|
info = psb_success_
|
|
nv = size(v)
|
|
call psb_hash_init(nv,hash,info)
|
|
if (info /= psb_success_) return
|
|
do i=1,nv
|
|
call psb_hash_searchinskey(v(i),j,i,hash,info)
|
|
if ((j /= i).or.(info /= HashOK)) then
|
|
write(psb_err_unit,*) 'Error from hash_ins',i,v(i),j,info
|
|
info = HashNotFound
|
|
return
|
|
end if
|
|
end do
|
|
end subroutine psb_hash_init_lv
|
|
|
|
subroutine psb_hash_init_n(nv,hash,info)
|
|
integer(psb_ipk_), intent(in) :: nv
|
|
type(psb_hash_type), intent(out) :: hash
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
integer(psb_ipk_) :: hsize,nbits
|
|
|
|
info = psb_success_
|
|
nbits = psb_hash_bits
|
|
hsize = 2**nbits
|
|
!
|
|
! Figure out the smallest power of 2 bigger than NV
|
|
! Note: in our intended usage NV will be the size of the
|
|
! local index space, NOT the global index space.
|
|
!
|
|
do
|
|
if (hsize < 0) then
|
|
write(psb_err_unit,*) 'Error: hash size overflow ',hsize,nbits
|
|
info = -2
|
|
return
|
|
end if
|
|
if (hsize > nv) exit
|
|
nbits = nbits + 1
|
|
hsize = hsize * 2
|
|
end do
|
|
hash%nbits = nbits
|
|
hash%hsize = hsize
|
|
hash%hmask = hsize-1
|
|
hash%nsrch = 0
|
|
hash%nacc = 0
|
|
allocate(hash%table(0:hsize-1,2),stat=info)
|
|
if (info /= psb_success_) then
|
|
write(psb_err_unit,*) 'Error: memory allocation failure ',hsize
|
|
info = HashOutOfMemory
|
|
return
|
|
end if
|
|
hash%table = HashFreeEntry
|
|
hash%nk = 0
|
|
end subroutine psb_hash_init_n
|
|
|
|
subroutine psb_hash_init_ln(nv,hash,info)
|
|
integer(psb_lpk_), intent(in) :: nv
|
|
type(psb_hash_type), intent(out) :: hash
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
integer(psb_ipk_) :: hsize,nbits
|
|
|
|
info = psb_success_
|
|
nbits = psb_hash_bits
|
|
hsize = 2**nbits
|
|
!
|
|
! Figure out the smallest power of 2 bigger than NV
|
|
! Note: in our intended usage NV will be the size of the
|
|
! local index space, NOT the global index space.
|
|
!
|
|
do
|
|
if (hsize < 0) then
|
|
write(psb_err_unit,*) 'Error: hash size overflow ',hsize,nbits
|
|
info = -2
|
|
return
|
|
end if
|
|
if (hsize > nv) exit
|
|
nbits = nbits + 1
|
|
hsize = hsize * 2
|
|
end do
|
|
hash%nbits = nbits
|
|
hash%hsize = hsize
|
|
hash%hmask = hsize-1
|
|
hash%nsrch = 0
|
|
hash%nacc = 0
|
|
allocate(hash%table(0:hsize-1,2),stat=info)
|
|
if (info /= psb_success_) then
|
|
write(psb_err_unit,*) 'Error: memory allocation failure ',hsize
|
|
info = HashOutOfMemory
|
|
return
|
|
end if
|
|
hash%table = HashFreeEntry
|
|
hash%nk = 0
|
|
end subroutine psb_hash_init_ln
|
|
|
|
|
|
subroutine psb_hash_realloc(hash,info)
|
|
type(psb_hash_type), intent(inout) :: hash
|
|
integer(psb_ipk_), intent(out) :: info
|
|
type(psb_hash_type) :: nhash
|
|
integer(psb_lpk_) :: key, val, nextval,i
|
|
|
|
info = HashOk
|
|
|
|
call psb_hash_init((hash%hsize+1),nhash,info)
|
|
|
|
if (info /= HashOk) then
|
|
info = HashOutOfMemory
|
|
return
|
|
endif
|
|
do i=0, hash%hsize-1
|
|
key = hash%table(i,1)
|
|
nextval = hash%table(i,2)
|
|
if (key /= HashFreeEntry) then
|
|
call psb_hash_searchinskey(key,val,nextval,nhash,info)
|
|
if (info /= psb_success_) then
|
|
info = HashOutOfMemory
|
|
return
|
|
end if
|
|
end if
|
|
end do
|
|
call HashTransfer(nhash,hash,info)
|
|
end subroutine psb_hash_realloc
|
|
|
|
recursive subroutine psb_hash_lsearchinskey(key,val,nextval,hash,info)
|
|
integer(psb_lpk_), intent(in) :: key,nextval
|
|
type(psb_hash_type) :: hash
|
|
integer(psb_lpk_), intent(out) :: val
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
integer(psb_ipk_) :: hsize,hmask, hk, hd, i
|
|
logical :: redo
|
|
|
|
info = HashOK
|
|
hsize = hash%hsize
|
|
hmask = hash%hmask
|
|
hk = iand(psb_hashval(key),hmask)
|
|
if (hk == 0) then
|
|
hd = 1
|
|
else
|
|
hd = hsize - hk
|
|
hd = ior(hd,1_psb_ipk_)
|
|
end if
|
|
if (.not.allocated(hash%table)) then
|
|
info = HashOutOfMemory
|
|
return
|
|
end if
|
|
val = -1
|
|
!$omp atomic
|
|
hash%nsrch = hash%nsrch + 1
|
|
!$omp end atomic
|
|
do
|
|
!$omp atomic
|
|
hash%nacc = hash%nacc + 1
|
|
!$omp end atomic
|
|
if (hash%table(hk,1) == key) then
|
|
val = hash%table(hk,2)
|
|
info = HashDuplicate
|
|
return
|
|
end if
|
|
redo = .false.
|
|
!$omp critical(hashsearchins)
|
|
if (hash%table(hk,1) == HashFreeEntry) then
|
|
if (hash%nk == hash%hsize -1) then
|
|
!
|
|
! Note: because of the way we allocate things at CDALL
|
|
! time this is really unlikely; if we get here, we
|
|
! have at least as many halo indices as internals, which
|
|
! means we're already in trouble. But we try to keep going.
|
|
!
|
|
call psb_hash_realloc(hash,info)
|
|
if (info /= HashOk) then
|
|
info = HashOutOfMemory
|
|
else
|
|
redo = .true.
|
|
end if
|
|
else
|
|
hash%nk = hash%nk + 1
|
|
hash%table(hk,1) = key
|
|
hash%table(hk,2) = nextval
|
|
val = nextval
|
|
info = HashOk
|
|
end if
|
|
else if (hash%table(hk,1) == key) then
|
|
val = hash%table(hk,2)
|
|
info = HashDuplicate
|
|
else
|
|
info = HashNotFound
|
|
end if
|
|
!$omp end critical(hashsearchins)
|
|
if (redo) then
|
|
call psb_hash_searchinskey(key,val,nextval,hash,info)
|
|
return
|
|
end if
|
|
if (val > 0) exit
|
|
hk = hk - hd
|
|
if (hk < 0) hk = hk + hsize
|
|
end do
|
|
end subroutine psb_hash_lsearchinskey
|
|
|
|
recursive subroutine psb_hash_isearchinskey(key,val,nextval,hash,info)
|
|
integer(psb_ipk_), intent(in) :: key,nextval
|
|
type(psb_hash_type) :: hash
|
|
integer(psb_ipk_), intent(out) :: val, info
|
|
|
|
integer(psb_ipk_) :: hsize,hmask, hk, hd
|
|
logical :: redo
|
|
|
|
info = HashOK
|
|
hsize = hash%hsize
|
|
hmask = hash%hmask
|
|
|
|
hk = iand(psb_hashval(key),hmask)
|
|
if (hk == 0) then
|
|
hd = 1
|
|
else
|
|
hd = hsize - hk
|
|
hd = ior(hd,1_psb_ipk_)
|
|
end if
|
|
if (.not.allocated(hash%table)) then
|
|
info = HashOutOfMemory
|
|
return
|
|
end if
|
|
val = -1
|
|
val = -1
|
|
!$omp atomic
|
|
hash%nsrch = hash%nsrch + 1
|
|
!$omp end atomic
|
|
do
|
|
!$omp atomic
|
|
hash%nacc = hash%nacc + 1
|
|
!$omp end atomic
|
|
if (hash%table(hk,1) == key) then
|
|
val = hash%table(hk,2)
|
|
info = HashDuplicate
|
|
return
|
|
end if
|
|
redo = .false.
|
|
!$omp critical(hashsearchins)
|
|
if (hash%table(hk,1) == HashFreeEntry) then
|
|
if (hash%nk == hash%hsize -1) then
|
|
!
|
|
! Note: because of the way we allocate things at CDALL
|
|
! time this is really unlikely; if we get here, we
|
|
! have at least as many halo indices as internals, which
|
|
! means we're already in trouble. But we try to keep going.
|
|
!
|
|
call psb_hash_realloc(hash,info)
|
|
if (info /= HashOk) then
|
|
info = HashOutOfMemory
|
|
else
|
|
redo = .true.
|
|
end if
|
|
else
|
|
hash%nk = hash%nk + 1
|
|
hash%table(hk,1) = key
|
|
hash%table(hk,2) = nextval
|
|
val = nextval
|
|
info = HashOk
|
|
end if
|
|
else if (hash%table(hk,1) == key) then
|
|
val = hash%table(hk,2)
|
|
info = HashDuplicate
|
|
else
|
|
info = HashNotFound
|
|
end if
|
|
!$omp end critical(hashsearchins)
|
|
if (redo) then
|
|
call psb_hash_searchinskey(key,val,nextval,hash,info)
|
|
return
|
|
end if
|
|
if (val > 0) exit
|
|
hk = hk - hd
|
|
if (hk < 0) hk = hk + hsize
|
|
end do
|
|
end subroutine psb_hash_isearchinskey
|
|
|
|
subroutine psb_hash_isearchkey(key,val,hash,info)
|
|
integer(psb_ipk_), intent(in) :: key
|
|
type(psb_hash_type) :: hash
|
|
integer(psb_ipk_), intent(out) :: val, info
|
|
|
|
integer(psb_ipk_) :: hsize,hmask, hk, hd
|
|
|
|
info = HashOK
|
|
if (.not.allocated(hash%table) ) then
|
|
val = HashFreeEntry
|
|
return
|
|
end if
|
|
hsize = hash%hsize
|
|
hmask = hash%hmask
|
|
hk = iand(psb_hashval(key),hmask)
|
|
|
|
if (hk == 0) then
|
|
hd = 1
|
|
else
|
|
hd = hsize - hk
|
|
hd = ior(hd,1_psb_ipk_)
|
|
end if
|
|
|
|
hash%nsrch = hash%nsrch + 1
|
|
do
|
|
hash%nacc = hash%nacc + 1
|
|
if (hash%table(hk,1) == key) then
|
|
val = hash%table(hk,2)
|
|
return
|
|
end if
|
|
if (hash%table(hk,1) == HashFreeEntry) then
|
|
val = HashFreeEntry
|
|
info = HashNotFound
|
|
return
|
|
end if
|
|
hk = hk - hd
|
|
if (hk < 0) hk = hk + hsize
|
|
end do
|
|
end subroutine psb_hash_isearchkey
|
|
|
|
subroutine psb_hash_lsearchkey(key,val,hash,info)
|
|
integer(psb_lpk_), intent(in) :: key
|
|
type(psb_hash_type) :: hash
|
|
integer(psb_lpk_), intent(out) :: val
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
integer(psb_ipk_) :: hsize,hmask, hk, hd
|
|
|
|
info = HashOK
|
|
if (.not.allocated(hash%table) ) then
|
|
val = HashFreeEntry
|
|
return
|
|
end if
|
|
hsize = hash%hsize
|
|
hmask = hash%hmask
|
|
hk = iand(psb_hashval(key),hmask)
|
|
if (hk == 0) then
|
|
hd = 1
|
|
else
|
|
hd = hsize - hk
|
|
hd = ior(hd,1_psb_ipk_)
|
|
end if
|
|
|
|
hash%nsrch = hash%nsrch + 1
|
|
do
|
|
hash%nacc = hash%nacc + 1
|
|
if (hash%table(hk,1) == key) then
|
|
val = hash%table(hk,2)
|
|
return
|
|
end if
|
|
if (hash%table(hk,1) == HashFreeEntry) then
|
|
val = HashFreeEntry
|
|
info = HashNotFound
|
|
return
|
|
end if
|
|
hk = hk - hd
|
|
if (hk < 0) hk = hk + hsize
|
|
end do
|
|
end subroutine psb_hash_lsearchkey
|
|
|
|
end module psb_hash_mod
|