You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
384 lines
11 KiB
Fortran
384 lines
11 KiB
Fortran
!!$
|
|
!!$ Parallel Sparse BLAS version 3.1
|
|
!!$ (C) Copyright 2006, 2007, 2008, 2009, 2010, 2012, 2013
|
|
!!$ Salvatore Filippone University of Rome Tor Vergata
|
|
!!$ Alfredo Buttari CNRS-IRIT, Toulouse
|
|
!!$
|
|
!!$ Redistribution and use in source and binary forms, with or without
|
|
!!$ modification, are permitted provided that the following conditions
|
|
!!$ are met:
|
|
!!$ 1. Redistributions of source code must retain the above copyright
|
|
!!$ notice, this list of conditions and the following disclaimer.
|
|
!!$ 2. Redistributions in binary form must reproduce the above copyright
|
|
!!$ notice, this list of conditions, and the following disclaimer in the
|
|
!!$ documentation and/or other materials provided with the distribution.
|
|
!!$ 3. The name of the PSBLAS group or the names of its contributors may
|
|
!!$ not be used to endorse or promote products derived from this
|
|
!!$ software without specific written permission.
|
|
!!$
|
|
!!$ THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
!!$ ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
|
|
!!$ TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
!!$ PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE PSBLAS GROUP OR ITS CONTRIBUTORS
|
|
!!$ BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
!!$ CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
!!$ SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
!!$ INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
!!$ CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
!!$ ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
!!$ POSSIBILITY OF SUCH DAMAGE.
|
|
!!$
|
|
!!$
|
|
!
|
|
!
|
|
module psb_hash_mod
|
|
use psb_const_mod
|
|
|
|
!> \class psb_hash_mod
|
|
!! \brief Simple hash module for storing integer keys.
|
|
!!
|
|
!! This module implements a very simple minded hash table.
|
|
!! The hash is based on the idea of open addressing with double hashing;
|
|
!! the primary hash function h1(K) is simply the remainder modulo 2^N, while
|
|
!! the secondary hash function is 1 if H1(k) == 0, otherwise IOR((2^N-H1(k)),1)
|
|
!! (See Knuth: TAOCP, Vol. 3, sec. 6.4)
|
|
!!
|
|
!! These hash functions are not very smart; however they are very simple and fast.
|
|
!! The intended usage of this hash table is to store indices of halo points, which
|
|
!! are supposed to be few compared to the internal indices
|
|
!! (which are stored elsewhere).
|
|
!! Therefore, either the table has a very low occupancy, and this scheme will work,
|
|
!! or we have lots more to worry about in parallel performance than the efficiency
|
|
!! of this hashing scheme.
|
|
!!
|
|
!!
|
|
! For us a hash is a Nx2 table.
|
|
! Note: we are assuming that the keys are positive numbers.
|
|
! Allocatable scalars would be a nice solution...
|
|
!
|
|
type psb_hash_type
|
|
integer(psb_ipk_) :: nbits, hsize, hmask, nk
|
|
integer(psb_ipk_), allocatable :: table(:,:)
|
|
integer(psb_long_int_k_) :: nsrch, nacc
|
|
end type psb_hash_type
|
|
|
|
|
|
integer(psb_ipk_), parameter :: HashDuplicate = 123, HashOK=0, HashOutOfMemory=-512,&
|
|
& HashFreeEntry = -1, HashNotFound = -256
|
|
|
|
interface psb_hash_init
|
|
module procedure psb_hash_init_v, psb_hash_init_n
|
|
end interface
|
|
|
|
interface psb_sizeof
|
|
module procedure psb_sizeof_hash_type
|
|
end interface
|
|
|
|
|
|
interface psb_move_alloc
|
|
module procedure HashTransfer
|
|
end interface
|
|
|
|
interface psb_hash_copy
|
|
module procedure HashCopy
|
|
end interface
|
|
|
|
interface psb_free
|
|
module procedure HashFree
|
|
end interface
|
|
|
|
contains
|
|
|
|
|
|
!
|
|
! This is based on the djb2 hashing algorithm
|
|
! see e.g. http://www.cse.yorku.ca/~oz/hash.html
|
|
!
|
|
function hashval(key) result(val)
|
|
integer(psb_ipk_), intent(in) :: key
|
|
integer(psb_ipk_), parameter :: ival=5381, mask=huge(ival)
|
|
integer(psb_ipk_) :: key_, val, i
|
|
|
|
key_ = key
|
|
val = ival
|
|
do i=1, psb_sizeof_int
|
|
val = val * 33 + iand(key_,255)
|
|
key_ = ishft(key_,-8)
|
|
end do
|
|
|
|
val = val + ishft(val,-5)
|
|
val = iand(val,mask)
|
|
|
|
end function hashval
|
|
|
|
|
|
function psb_Sizeof_hash_type(hash) result(val)
|
|
type(psb_hash_type) :: hash
|
|
integer(psb_long_int_k_) :: val
|
|
val = 4*psb_sizeof_int + 2*psb_sizeof_long_int
|
|
if (allocated(hash%table)) &
|
|
& val = val + psb_sizeof_int * size(hash%table)
|
|
|
|
end function psb_Sizeof_hash_type
|
|
|
|
|
|
function psb_hash_avg_acc(hash)
|
|
type(psb_hash_type), intent(in) :: hash
|
|
real(psb_dpk_) :: psb_hash_avg_acc
|
|
|
|
psb_hash_avg_acc = dble(hash%nacc)/dble(hash%nsrch)
|
|
end function psb_hash_avg_acc
|
|
|
|
subroutine HashFree(hashin,info)
|
|
use psb_realloc_mod
|
|
type(psb_hash_type) :: hashin
|
|
integer(psb_ipk_) :: info
|
|
|
|
info = psb_success_
|
|
if (allocated(hashin%table)) then
|
|
deallocate(hashin%table,stat=info)
|
|
end if
|
|
hashin%nbits = 0
|
|
hashin%hsize = 0
|
|
hashin%hmask = 0
|
|
hashin%nk = 0
|
|
end subroutine HashFree
|
|
|
|
subroutine HashTransfer(hashin,hashout,info)
|
|
use psb_realloc_mod
|
|
type(psb_hash_type) :: hashin
|
|
type(psb_hash_type) :: hashout
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
info = HashOk
|
|
hashout%nbits = hashin%nbits
|
|
hashout%hsize = hashin%hsize
|
|
hashout%hmask = hashin%hmask
|
|
hashout%nk = hashin%nk
|
|
hashout%nsrch = hashin%nsrch
|
|
hashout%nacc = hashin%nacc
|
|
call psb_move_alloc(hashin%table, hashout%table,info)
|
|
|
|
end subroutine HashTransfer
|
|
|
|
subroutine HashCopy(hashin,hashout,info)
|
|
use psb_realloc_mod
|
|
type(psb_hash_type) :: hashin
|
|
type(psb_hash_type) :: hashout
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
info = HashOk
|
|
hashout%nbits = hashin%nbits
|
|
hashout%hsize = hashin%hsize
|
|
hashout%hmask = hashin%hmask
|
|
hashout%nk = hashin%nk
|
|
hashout%nsrch = hashin%nsrch
|
|
hashout%nacc = hashin%nacc
|
|
call psb_safe_ab_cpy(hashin%table, hashout%table,info)
|
|
|
|
end subroutine HashCopy
|
|
|
|
subroutine CloneHashTable(hashin,hashout,info)
|
|
type(psb_hash_type), pointer :: hashin
|
|
type(psb_hash_type), pointer :: hashout
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
if (associated(hashout)) then
|
|
deallocate(hashout,stat=info)
|
|
!if (info /= psb_success_) return
|
|
end if
|
|
if (associated(hashin)) then
|
|
allocate(hashout,stat=info)
|
|
if (info /= psb_success_) return
|
|
call HashCopy(hashin,hashout,info)
|
|
end if
|
|
|
|
end subroutine CloneHashTable
|
|
|
|
subroutine psb_hash_init_V(v,hash,info)
|
|
integer(psb_ipk_), intent(in) :: v(:)
|
|
type(psb_hash_type), intent(out) :: hash
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
integer(psb_ipk_) :: i,j,nbits, nv
|
|
|
|
info = psb_success_
|
|
nv = size(v)
|
|
call psb_hash_init(nv,hash,info)
|
|
if (info /= psb_success_) return
|
|
do i=1,nv
|
|
call psb_hash_searchinskey(v(i),j,i,hash,info)
|
|
if ((j /= i).or.(info /= HashOK)) then
|
|
write(psb_err_unit,*) 'Error from hash_ins',i,v(i),j,info
|
|
info = HashNotFound
|
|
return
|
|
end if
|
|
end do
|
|
end subroutine psb_hash_init_V
|
|
|
|
subroutine psb_hash_init_n(nv,hash,info)
|
|
integer(psb_ipk_), intent(in) :: nv
|
|
type(psb_hash_type), intent(out) :: hash
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
integer(psb_ipk_) :: hsize,nbits
|
|
|
|
info = psb_success_
|
|
nbits = 12
|
|
hsize = 2**nbits
|
|
!
|
|
! Figure out the smallest power of 2 bigger than NV
|
|
! Note: in our intended usage NV will be the size of the
|
|
! local index space, NOT the global index space.
|
|
!
|
|
do
|
|
if (hsize < 0) then
|
|
write(psb_err_unit,*) 'Error: hash size overflow ',hsize,nbits
|
|
info = -2
|
|
return
|
|
end if
|
|
if (hsize > nv) exit
|
|
nbits = nbits + 1
|
|
hsize = hsize * 2
|
|
end do
|
|
hash%nbits = nbits
|
|
hash%hsize = hsize
|
|
hash%hmask = hsize-1
|
|
hash%nsrch = 0
|
|
hash%nacc = 0
|
|
allocate(hash%table(0:hsize-1,2),stat=info)
|
|
if (info /= psb_success_) then
|
|
write(psb_err_unit,*) 'Error: memory allocation failure ',hsize
|
|
info = HashOutOfMemory
|
|
return
|
|
end if
|
|
hash%table = HashFreeEntry
|
|
hash%nk = 0
|
|
end subroutine psb_hash_init_n
|
|
|
|
|
|
subroutine psb_hash_realloc(hash,info)
|
|
type(psb_hash_type), intent(inout) :: hash
|
|
integer(psb_ipk_), intent(out) :: info
|
|
type(psb_hash_type) :: nhash
|
|
integer(psb_ipk_) :: key, val, nextval,i
|
|
|
|
info = HashOk
|
|
|
|
call psb_hash_init((hash%hsize+1),nhash,info)
|
|
|
|
if (info /= HashOk) then
|
|
info = HashOutOfMemory
|
|
return
|
|
endif
|
|
do i=0, hash%hsize-1
|
|
key = hash%table(i,1)
|
|
nextval = hash%table(i,2)
|
|
if (key /= HashFreeEntry) then
|
|
call psb_hash_searchinskey(key,val,nextval,nhash,info)
|
|
if (info /= psb_success_) then
|
|
info = HashOutOfMemory
|
|
return
|
|
end if
|
|
end if
|
|
end do
|
|
call HashTransfer(nhash,hash,info)
|
|
end subroutine psb_hash_realloc
|
|
|
|
recursive subroutine psb_hash_searchinskey(key,val,nextval,hash,info)
|
|
integer(psb_ipk_), intent(in) :: key,nextval
|
|
type(psb_hash_type) :: hash
|
|
integer(psb_ipk_), intent(out) :: val, info
|
|
|
|
integer(psb_ipk_) :: hsize,hmask, hk, hd
|
|
|
|
info = HashOK
|
|
hsize = hash%hsize
|
|
hmask = hash%hmask
|
|
|
|
hk = iand(hashval(key),hmask)
|
|
if (hk == 0) then
|
|
hd = 1
|
|
else
|
|
hd = hsize - hk
|
|
hd = ior(hd,1)
|
|
end if
|
|
|
|
hash%nsrch = hash%nsrch + 1
|
|
do
|
|
hash%nacc = hash%nacc + 1
|
|
if (hash%table(hk,1) == key) then
|
|
val = hash%table(hk,2)
|
|
info = HashDuplicate
|
|
return
|
|
end if
|
|
if (hash%table(hk,1) == HashFreeEntry) then
|
|
if (hash%nk == hash%hsize -1) then
|
|
!
|
|
! Note: because of the way we allocate things at CDALL
|
|
! time this is really unlikely; if we get here, we
|
|
! have at least as many halo indices as internals, which
|
|
! means we're already in trouble. But we try to keep going.
|
|
!
|
|
call psb_hash_realloc(hash,info)
|
|
if (info /= HashOk) then
|
|
info = HashOutOfMemory
|
|
return
|
|
else
|
|
call psb_hash_searchinskey(key,val,nextval,hash,info)
|
|
return
|
|
end if
|
|
else
|
|
hash%nk = hash%nk + 1
|
|
hash%table(hk,1) = key
|
|
hash%table(hk,2) = nextval
|
|
val = nextval
|
|
return
|
|
end if
|
|
end if
|
|
hk = hk - hd
|
|
if (hk < 0) hk = hk + hsize
|
|
end do
|
|
end subroutine psb_hash_searchinskey
|
|
|
|
subroutine psb_hash_searchkey(key,val,hash,info)
|
|
integer(psb_ipk_), intent(in) :: key
|
|
type(psb_hash_type) :: hash
|
|
integer(psb_ipk_), intent(out) :: val, info
|
|
|
|
integer(psb_ipk_) :: hsize,hmask, hk, hd
|
|
|
|
info = HashOK
|
|
if (.not.allocated(hash%table) ) then
|
|
val = HashFreeEntry
|
|
return
|
|
end if
|
|
hsize = hash%hsize
|
|
hmask = hash%hmask
|
|
hk = iand(hashval(key),hmask)
|
|
if (hk == 0) then
|
|
hd = 1
|
|
else
|
|
hd = hsize - hk
|
|
hd = ior(hd,1)
|
|
end if
|
|
|
|
hash%nsrch = hash%nsrch + 1
|
|
do
|
|
hash%nacc = hash%nacc + 1
|
|
if (hash%table(hk,1) == key) then
|
|
val = hash%table(hk,2)
|
|
return
|
|
end if
|
|
if (hash%table(hk,1) == HashFreeEntry) then
|
|
val = HashFreeEntry
|
|
! !$ info = HashNotFound
|
|
return
|
|
end if
|
|
hk = hk - hd
|
|
if (hk < 0) hk = hk + hsize
|
|
end do
|
|
end subroutine psb_hash_searchkey
|
|
|
|
end module psb_hash_mod
|