|
|
@ -185,12 +185,6 @@ subroutine psi_itranidxm(iictxt,iicomm,flag,n,beta,y,idx,totxch,totsnd,totrcv,wo
|
|
|
|
integer(psb_ipk_) :: nesd, nerv,&
|
|
|
|
integer(psb_ipk_) :: nesd, nerv,&
|
|
|
|
& err_act, i, idx_pt, totsnd_, totrcv_,&
|
|
|
|
& err_act, i, idx_pt, totsnd_, totrcv_,&
|
|
|
|
& snd_pt, rcv_pt, pnti
|
|
|
|
& snd_pt, rcv_pt, pnti
|
|
|
|
!!$ integer(psb_ipk_) :: np, me, nesd, nerv,&
|
|
|
|
|
|
|
|
!!$ & proc_to_comm, p2ptag, p2pstat(mpi_status_size),&
|
|
|
|
|
|
|
|
!!$ & iret, err_act, i, idx_pt, totsnd_, totrcv_,&
|
|
|
|
|
|
|
|
!!$ & snd_pt, rcv_pt, pnti, data_
|
|
|
|
|
|
|
|
!!$ integer(psb_ipk_), allocatable, dimension(:) :: bsdidx, brvidx,&
|
|
|
|
|
|
|
|
!!$ & sdsz, rvsz, prcid, rvhd, sdhd
|
|
|
|
|
|
|
|
integer(psb_ipk_) :: ierr(5)
|
|
|
|
integer(psb_ipk_) :: ierr(5)
|
|
|
|
logical :: swap_mpi, swap_sync, swap_send, swap_recv,&
|
|
|
|
logical :: swap_mpi, swap_sync, swap_send, swap_recv,&
|
|
|
|
& albf,do_send,do_recv
|
|
|
|
& albf,do_send,do_recv
|
|
|
@ -1049,10 +1043,10 @@ end subroutine psi_itranidxv
|
|
|
|
subroutine psi_iswaptran_vect(flag,beta,y,desc_a,work,info,data)
|
|
|
|
subroutine psi_iswaptran_vect(flag,beta,y,desc_a,work,info,data)
|
|
|
|
|
|
|
|
|
|
|
|
use psi_mod, psb_protect_name => psi_iswaptran_vect
|
|
|
|
use psi_mod, psb_protect_name => psi_iswaptran_vect
|
|
|
|
|
|
|
|
use psb_i_base_vect_mod
|
|
|
|
use psb_error_mod
|
|
|
|
use psb_error_mod
|
|
|
|
use psb_desc_mod
|
|
|
|
use psb_desc_mod
|
|
|
|
use psb_penv_mod
|
|
|
|
use psb_penv_mod
|
|
|
|
use psb_i_base_vect_mod
|
|
|
|
|
|
|
|
#ifdef MPI_MOD
|
|
|
|
#ifdef MPI_MOD
|
|
|
|
use mpi
|
|
|
|
use mpi
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
@ -1071,7 +1065,7 @@ subroutine psi_iswaptran_vect(flag,beta,y,desc_a,work,info,data)
|
|
|
|
|
|
|
|
|
|
|
|
! locals
|
|
|
|
! locals
|
|
|
|
integer(psb_ipk_) :: ictxt, np, me, icomm, idxs, idxr, totxch, err_act, data_
|
|
|
|
integer(psb_ipk_) :: ictxt, np, me, icomm, idxs, idxr, totxch, err_act, data_
|
|
|
|
integer(psb_ipk_), pointer :: d_idx(:)
|
|
|
|
class(psb_i_base_vect_type), pointer :: d_vidx
|
|
|
|
integer(psb_ipk_) :: ierr(5)
|
|
|
|
integer(psb_ipk_) :: ierr(5)
|
|
|
|
character(len=20) :: name
|
|
|
|
character(len=20) :: name
|
|
|
|
|
|
|
|
|
|
|
@ -1100,13 +1094,13 @@ subroutine psi_iswaptran_vect(flag,beta,y,desc_a,work,info,data)
|
|
|
|
data_ = psb_comm_halo_
|
|
|
|
data_ = psb_comm_halo_
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
|
|
call desc_a%get_list(data_,d_idx,totxch,idxr,idxs,info)
|
|
|
|
call desc_a%get_list(data_,d_vidx,totxch,idxr,idxs,info)
|
|
|
|
if (info /= psb_success_) then
|
|
|
|
if (info /= psb_success_) then
|
|
|
|
call psb_errpush(psb_err_internal_error_,name,a_err='psb_cd_get_list')
|
|
|
|
call psb_errpush(psb_err_internal_error_,name,a_err='psb_cd_get_list')
|
|
|
|
goto 9999
|
|
|
|
goto 9999
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
|
|
call psi_swaptran(ictxt,icomm,flag,beta,y,d_idx,totxch,idxs,idxr,work,info)
|
|
|
|
call psi_swaptran(ictxt,icomm,flag,beta,y,d_vidx,totxch,idxs,idxr,work,info)
|
|
|
|
if (info /= psb_success_) goto 9999
|
|
|
|
if (info /= psb_success_) goto 9999
|
|
|
|
|
|
|
|
|
|
|
|
call psb_erractionrestore(err_act)
|
|
|
|
call psb_erractionrestore(err_act)
|
|
|
@ -1119,10 +1113,23 @@ end subroutine psi_iswaptran_vect
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
subroutine psi_itranidx_vect(iictxt,iicomm,flag,beta,y,idx,&
|
|
|
|
!
|
|
|
|
|
|
|
|
!
|
|
|
|
|
|
|
|
! Subroutine: psi_itran_vidx_vect
|
|
|
|
|
|
|
|
! Data exchange among processes.
|
|
|
|
|
|
|
|
!
|
|
|
|
|
|
|
|
! Takes care of Y, an encapsulated vector. Relies on the gather/scatter methods
|
|
|
|
|
|
|
|
! of vectors.
|
|
|
|
|
|
|
|
!
|
|
|
|
|
|
|
|
! The real workhorse: the outer routine will only choose the index list
|
|
|
|
|
|
|
|
! this one takes the index list and does the actual exchange.
|
|
|
|
|
|
|
|
!
|
|
|
|
|
|
|
|
!
|
|
|
|
|
|
|
|
!
|
|
|
|
|
|
|
|
subroutine psi_itran_vidx_vect(iictxt,iicomm,flag,beta,y,idx,&
|
|
|
|
& totxch,totsnd,totrcv,work,info)
|
|
|
|
& totxch,totsnd,totrcv,work,info)
|
|
|
|
|
|
|
|
|
|
|
|
use psi_mod, psb_protect_name => psi_itranidx_vect
|
|
|
|
use psi_mod, psb_protect_name => psi_itran_vidx_vect
|
|
|
|
use psb_error_mod
|
|
|
|
use psb_error_mod
|
|
|
|
use psb_desc_mod
|
|
|
|
use psb_desc_mod
|
|
|
|
use psb_penv_mod
|
|
|
|
use psb_penv_mod
|
|
|
@ -1140,25 +1147,20 @@ subroutine psi_itranidx_vect(iictxt,iicomm,flag,beta,y,idx,&
|
|
|
|
class(psb_i_base_vect_type) :: y
|
|
|
|
class(psb_i_base_vect_type) :: y
|
|
|
|
integer(psb_ipk_) :: beta
|
|
|
|
integer(psb_ipk_) :: beta
|
|
|
|
integer(psb_ipk_), target :: work(:)
|
|
|
|
integer(psb_ipk_), target :: work(:)
|
|
|
|
integer(psb_ipk_), intent(in) :: idx(:),totxch,totsnd, totrcv
|
|
|
|
class(psb_i_base_vect_type), intent(inout) :: idx
|
|
|
|
|
|
|
|
integer(psb_ipk_), intent(in) :: totxch,totsnd, totrcv
|
|
|
|
|
|
|
|
|
|
|
|
! locals
|
|
|
|
! locals
|
|
|
|
integer(psb_mpik_) :: ictxt, icomm, np, me,&
|
|
|
|
integer(psb_mpik_) :: ictxt, icomm, np, me,&
|
|
|
|
& proc_to_comm, p2ptag, p2pstat(mpi_status_size), iret
|
|
|
|
& proc_to_comm, p2ptag, p2pstat(mpi_status_size), iret
|
|
|
|
integer(psb_mpik_), allocatable, dimension(:) :: bsdidx, brvidx,&
|
|
|
|
integer(psb_mpik_), allocatable :: prcid(:)
|
|
|
|
& sdsz, rvsz, prcid, rvhd, sdhd
|
|
|
|
|
|
|
|
integer(psb_ipk_) :: nesd, nerv,&
|
|
|
|
integer(psb_ipk_) :: nesd, nerv,&
|
|
|
|
& err_act, i, idx_pt, totsnd_, totrcv_,&
|
|
|
|
& err_act, i, idx_pt, totsnd_, totrcv_,&
|
|
|
|
& snd_pt, rcv_pt, pnti, n
|
|
|
|
& snd_pt, rcv_pt, pnti, n
|
|
|
|
integer(psb_ipk_) :: ierr(5)
|
|
|
|
integer(psb_ipk_) :: ierr(5)
|
|
|
|
logical :: swap_mpi, swap_sync, swap_send, swap_recv,&
|
|
|
|
logical :: swap_mpi, swap_sync, swap_send, swap_recv,&
|
|
|
|
& albf,do_send,do_recv
|
|
|
|
& albf,do_send,do_recv
|
|
|
|
logical, parameter :: usersend=.false.
|
|
|
|
logical, parameter :: usersend=.false., debug=.false.
|
|
|
|
|
|
|
|
|
|
|
|
integer(psb_ipk_), pointer, dimension(:) :: sndbuf, rcvbuf
|
|
|
|
|
|
|
|
#ifdef HAVE_VOLATILE
|
|
|
|
|
|
|
|
volatile :: sndbuf, rcvbuf
|
|
|
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
character(len=20) :: name
|
|
|
|
character(len=20) :: name
|
|
|
|
|
|
|
|
|
|
|
|
info=psb_success_
|
|
|
|
info=psb_success_
|
|
|
@ -1185,97 +1187,89 @@ subroutine psi_itranidx_vect(iictxt,iicomm,flag,beta,y,idx,&
|
|
|
|
totrcv_ = totrcv * n
|
|
|
|
totrcv_ = totrcv * n
|
|
|
|
totsnd_ = totsnd * n
|
|
|
|
totsnd_ = totsnd * n
|
|
|
|
|
|
|
|
|
|
|
|
if (swap_mpi) then
|
|
|
|
call idx%sync()
|
|
|
|
allocate(sdsz(0:np-1), rvsz(0:np-1), bsdidx(0:np-1),&
|
|
|
|
|
|
|
|
& brvidx(0:np-1), rvhd(0:np-1), sdhd(0:np-1), prcid(0:np-1),&
|
|
|
|
if (debug) write(*,*) me,'Internal buffer'
|
|
|
|
& stat=info)
|
|
|
|
if (do_send) then
|
|
|
|
if(info /= psb_success_) then
|
|
|
|
if (allocated(y%comid)) then
|
|
|
|
call psb_errpush(psb_err_alloc_dealloc_,name)
|
|
|
|
!
|
|
|
|
|
|
|
|
! Unfinished communication? Something is wrong....
|
|
|
|
|
|
|
|
!
|
|
|
|
|
|
|
|
info=psb_err_mpi_error_
|
|
|
|
|
|
|
|
ierr(1) = -2
|
|
|
|
|
|
|
|
call psb_errpush(info,name,i_err=ierr)
|
|
|
|
goto 9999
|
|
|
|
goto 9999
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
|
|
|
|
if (debug) write(*,*) me,'do_send start'
|
|
|
|
|
|
|
|
call y%new_buffer(size(idx%v),info)
|
|
|
|
|
|
|
|
call y%new_comid(totxch,info)
|
|
|
|
|
|
|
|
call psb_realloc(totxch,prcid,info)
|
|
|
|
|
|
|
|
! First I post all the non blocking receives
|
|
|
|
|
|
|
|
pnti = 1
|
|
|
|
|
|
|
|
p2ptag = psb_int_swap_tag
|
|
|
|
|
|
|
|
do i=1, totxch
|
|
|
|
|
|
|
|
proc_to_comm = idx%v(pnti+psb_proc_id_)
|
|
|
|
|
|
|
|
nerv = idx%v(pnti+psb_n_elem_recv_)
|
|
|
|
|
|
|
|
nesd = idx%v(pnti+nerv+psb_n_elem_send_)
|
|
|
|
|
|
|
|
|
|
|
|
rvhd(:) = mpi_request_null
|
|
|
|
snd_pt = 1+pnti+nerv+psb_n_elem_send_
|
|
|
|
sdsz(:) = 0
|
|
|
|
rcv_pt = 1+pnti+psb_n_elem_recv_
|
|
|
|
rvsz(:) = 0
|
|
|
|
call psb_get_rank(prcid(i),ictxt,proc_to_comm)
|
|
|
|
|
|
|
|
if ((nesd>0).and.(proc_to_comm /= me)) then
|
|
|
|
! prepare info for communications
|
|
|
|
if (debug) write(*,*) me,'Posting receive from',prcid(i),rcv_pt
|
|
|
|
|
|
|
|
call mpi_irecv(y%combuf(snd_pt),nesd,&
|
|
|
|
|
|
|
|
& psb_mpi_ipk_integer,prcid(i),&
|
|
|
|
|
|
|
|
& p2ptag, icomm,y%comid(i,2),iret)
|
|
|
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
|
|
|
|
end do
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if (debug) write(*,*) me,' Gather '
|
|
|
|
|
|
|
|
!
|
|
|
|
|
|
|
|
! Then gather for sending.
|
|
|
|
|
|
|
|
!
|
|
|
|
pnti = 1
|
|
|
|
pnti = 1
|
|
|
|
snd_pt = 1
|
|
|
|
snd_pt = 1
|
|
|
|
rcv_pt = 1
|
|
|
|
|
|
|
|
do i=1, totxch
|
|
|
|
do i=1, totxch
|
|
|
|
proc_to_comm = idx(pnti+psb_proc_id_)
|
|
|
|
nerv = idx%v(pnti+psb_n_elem_recv_)
|
|
|
|
nerv = idx(pnti+psb_n_elem_recv_)
|
|
|
|
nesd = idx%v(pnti+nerv+psb_n_elem_send_)
|
|
|
|
nesd = idx(pnti+nerv+psb_n_elem_send_)
|
|
|
|
snd_pt = 1+pnti+nerv+psb_n_elem_send_
|
|
|
|
call psb_get_rank(prcid(proc_to_comm),ictxt,proc_to_comm)
|
|
|
|
rcv_pt = 1+pnti+psb_n_elem_recv_
|
|
|
|
|
|
|
|
|
|
|
|
brvidx(proc_to_comm) = rcv_pt
|
|
|
|
idx_pt = rcv_pt
|
|
|
|
rvsz(proc_to_comm) = nerv
|
|
|
|
call y%gth(idx_pt,nerv,idx)
|
|
|
|
|
|
|
|
|
|
|
|
bsdidx(proc_to_comm) = snd_pt
|
|
|
|
|
|
|
|
sdsz(proc_to_comm) = nesd
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
rcv_pt = rcv_pt + nerv
|
|
|
|
|
|
|
|
snd_pt = snd_pt + nesd
|
|
|
|
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
|
|
|
|
|
|
|
|
end do
|
|
|
|
end do
|
|
|
|
|
|
|
|
|
|
|
|
else
|
|
|
|
!
|
|
|
|
allocate(rvhd(totxch),prcid(totxch),stat=info)
|
|
|
|
! Then wait
|
|
|
|
if(info /= psb_success_) then
|
|
|
|
!
|
|
|
|
call psb_errpush(psb_err_alloc_dealloc_,name)
|
|
|
|
call y%device_wait()
|
|
|
|
goto 9999
|
|
|
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
totrcv_ = max(totrcv_,1)
|
|
|
|
|
|
|
|
totsnd_ = max(totsnd_,1)
|
|
|
|
|
|
|
|
if((totrcv_+totsnd_) < size(work)) then
|
|
|
|
|
|
|
|
sndbuf => work(1:totsnd_)
|
|
|
|
|
|
|
|
rcvbuf => work(totsnd_+1:totsnd_+totrcv_)
|
|
|
|
|
|
|
|
albf=.false.
|
|
|
|
|
|
|
|
else
|
|
|
|
|
|
|
|
allocate(sndbuf(totsnd_),rcvbuf(totrcv_), stat=info)
|
|
|
|
|
|
|
|
if(info /= psb_success_) then
|
|
|
|
|
|
|
|
call psb_errpush(psb_err_alloc_dealloc_,name)
|
|
|
|
|
|
|
|
goto 9999
|
|
|
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
albf=.true.
|
|
|
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if (debug) write(*,*) me,' isend'
|
|
|
|
|
|
|
|
|
|
|
|
if (do_send) then
|
|
|
|
!
|
|
|
|
|
|
|
|
! Then send
|
|
|
|
|
|
|
|
!
|
|
|
|
|
|
|
|
|
|
|
|
! Pack send buffers
|
|
|
|
|
|
|
|
pnti = 1
|
|
|
|
pnti = 1
|
|
|
|
snd_pt = 1
|
|
|
|
snd_pt = 1
|
|
|
|
rcv_pt = 1
|
|
|
|
rcv_pt = 1
|
|
|
|
|
|
|
|
p2ptag = psb_int_swap_tag
|
|
|
|
do i=1, totxch
|
|
|
|
do i=1, totxch
|
|
|
|
proc_to_comm = idx(pnti+psb_proc_id_)
|
|
|
|
proc_to_comm = idx%v(pnti+psb_proc_id_)
|
|
|
|
nerv = idx(pnti+psb_n_elem_recv_)
|
|
|
|
nerv = idx%v(pnti+psb_n_elem_recv_)
|
|
|
|
nesd = idx(pnti+nerv+psb_n_elem_send_)
|
|
|
|
nesd = idx%v(pnti+nerv+psb_n_elem_send_)
|
|
|
|
idx_pt = 1+pnti+psb_n_elem_recv_
|
|
|
|
snd_pt = 1+pnti+nerv+psb_n_elem_send_
|
|
|
|
|
|
|
|
rcv_pt = 1+pnti+psb_n_elem_recv_
|
|
|
|
call y%gth(nerv,idx(idx_pt:idx_pt+nerv-1),&
|
|
|
|
|
|
|
|
& rcvbuf(rcv_pt:rcv_pt+nerv-1))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
rcv_pt = rcv_pt + nerv
|
|
|
|
|
|
|
|
snd_pt = snd_pt + nesd
|
|
|
|
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
|
|
|
|
end do
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if ((nerv>0).and.(proc_to_comm /= me)) then
|
|
|
|
|
|
|
|
call mpi_isend(y%combuf(rcv_pt),nerv,&
|
|
|
|
|
|
|
|
& psb_mpi_ipk_integer,prcid(i),&
|
|
|
|
|
|
|
|
& p2ptag,icomm,y%comid(i,1),iret)
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
|
|
! Case SWAP_MPI
|
|
|
|
|
|
|
|
if (swap_mpi) then
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
! swap elements using mpi_alltoallv
|
|
|
|
|
|
|
|
call mpi_alltoallv(rcvbuf,rvsz,brvidx,&
|
|
|
|
|
|
|
|
& psb_mpi_ipk_integer,&
|
|
|
|
|
|
|
|
& sndbuf,sdsz,bsdidx,psb_mpi_ipk_integer,icomm,iret)
|
|
|
|
|
|
|
|
if(iret /= mpi_success) then
|
|
|
|
if(iret /= mpi_success) then
|
|
|
|
ierr(1) = iret
|
|
|
|
ierr(1) = iret
|
|
|
|
info=psb_err_mpi_error_
|
|
|
|
info=psb_err_mpi_error_
|
|
|
@ -1283,87 +1277,36 @@ subroutine psi_itranidx_vect(iictxt,iicomm,flag,beta,y,idx,&
|
|
|
|
goto 9999
|
|
|
|
goto 9999
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
|
|
else if (swap_sync) then
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
pnti = 1
|
|
|
|
|
|
|
|
snd_pt = 1
|
|
|
|
|
|
|
|
rcv_pt = 1
|
|
|
|
|
|
|
|
do i=1, totxch
|
|
|
|
|
|
|
|
proc_to_comm = idx(pnti+psb_proc_id_)
|
|
|
|
|
|
|
|
nerv = idx(pnti+psb_n_elem_recv_)
|
|
|
|
|
|
|
|
nesd = idx(pnti+nerv+psb_n_elem_send_)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if (proc_to_comm < me) then
|
|
|
|
|
|
|
|
if (nerv>0) call psb_snd(ictxt,&
|
|
|
|
|
|
|
|
& rcvbuf(rcv_pt:rcv_pt+nerv-1), proc_to_comm)
|
|
|
|
|
|
|
|
if (nesd>0) call psb_rcv(ictxt,&
|
|
|
|
|
|
|
|
& sndbuf(snd_pt:snd_pt+nesd-1), proc_to_comm)
|
|
|
|
|
|
|
|
else if (proc_to_comm > me) then
|
|
|
|
|
|
|
|
if (nesd>0) call psb_rcv(ictxt,&
|
|
|
|
|
|
|
|
& sndbuf(snd_pt:snd_pt+nesd-1), proc_to_comm)
|
|
|
|
|
|
|
|
if (nerv>0) call psb_snd(ictxt,&
|
|
|
|
|
|
|
|
& rcvbuf(rcv_pt:rcv_pt+nerv-1), proc_to_comm)
|
|
|
|
|
|
|
|
else if (proc_to_comm == me) then
|
|
|
|
|
|
|
|
if (nesd /= nerv) then
|
|
|
|
|
|
|
|
write(psb_err_unit,*) &
|
|
|
|
|
|
|
|
& 'Fatal error in swaptran: mismatch on self send',&
|
|
|
|
|
|
|
|
& nerv,nesd
|
|
|
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
sndbuf(snd_pt:snd_pt+nesd-1) = rcvbuf(rcv_pt:rcv_pt+nerv-1)
|
|
|
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
rcv_pt = rcv_pt + nerv
|
|
|
|
|
|
|
|
snd_pt = snd_pt + nesd
|
|
|
|
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
|
|
|
|
|
|
|
|
end do
|
|
|
|
end do
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
else if (swap_send .and. swap_recv) then
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
! First I post all the non blocking receives
|
|
|
|
|
|
|
|
pnti = 1
|
|
|
|
|
|
|
|
snd_pt = 1
|
|
|
|
|
|
|
|
rcv_pt = 1
|
|
|
|
|
|
|
|
do i=1, totxch
|
|
|
|
|
|
|
|
proc_to_comm = idx(pnti+psb_proc_id_)
|
|
|
|
|
|
|
|
nerv = idx(pnti+psb_n_elem_recv_)
|
|
|
|
|
|
|
|
nesd = idx(pnti+nerv+psb_n_elem_send_)
|
|
|
|
|
|
|
|
call psb_get_rank(prcid(i),ictxt,proc_to_comm)
|
|
|
|
|
|
|
|
if ((nesd>0).and.(proc_to_comm /= me)) then
|
|
|
|
|
|
|
|
p2ptag = psb_int_swap_tag
|
|
|
|
|
|
|
|
call mpi_irecv(sndbuf(snd_pt),nesd,&
|
|
|
|
|
|
|
|
& psb_mpi_ipk_integer,prcid(i),&
|
|
|
|
|
|
|
|
& p2ptag,icomm,rvhd(i),iret)
|
|
|
|
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
rcv_pt = rcv_pt + nerv
|
|
|
|
|
|
|
|
snd_pt = snd_pt + nesd
|
|
|
|
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
|
|
|
|
end do
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
! Then I post all the blocking sends
|
|
|
|
if (do_recv) then
|
|
|
|
if (usersend) call mpi_barrier(icomm,iret)
|
|
|
|
if (debug) write(*,*) me,' do_Recv'
|
|
|
|
|
|
|
|
if (.not.allocated(y%comid)) then
|
|
|
|
|
|
|
|
!
|
|
|
|
|
|
|
|
! No matching send? Something is wrong....
|
|
|
|
|
|
|
|
!
|
|
|
|
|
|
|
|
info=psb_err_mpi_error_
|
|
|
|
|
|
|
|
ierr(1) = -2
|
|
|
|
|
|
|
|
call psb_errpush(info,name,i_err=ierr)
|
|
|
|
|
|
|
|
goto 9999
|
|
|
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
call psb_realloc(totxch,prcid,info)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if (debug) write(*,*) me,' wait'
|
|
|
|
pnti = 1
|
|
|
|
pnti = 1
|
|
|
|
snd_pt = 1
|
|
|
|
|
|
|
|
rcv_pt = 1
|
|
|
|
|
|
|
|
do i=1, totxch
|
|
|
|
|
|
|
|
proc_to_comm = idx(pnti+psb_proc_id_)
|
|
|
|
|
|
|
|
nerv = idx(pnti+psb_n_elem_recv_)
|
|
|
|
|
|
|
|
nesd = idx(pnti+nerv+psb_n_elem_send_)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if ((nerv>0).and.(proc_to_comm /= me)) then
|
|
|
|
|
|
|
|
p2ptag = psb_int_swap_tag
|
|
|
|
p2ptag = psb_int_swap_tag
|
|
|
|
if (usersend) then
|
|
|
|
do i=1, totxch
|
|
|
|
call mpi_rsend(rcvbuf(rcv_pt),nerv,&
|
|
|
|
proc_to_comm = idx%v(pnti+psb_proc_id_)
|
|
|
|
& psb_mpi_ipk_integer,prcid(i),&
|
|
|
|
nerv = idx%v(pnti+psb_n_elem_recv_)
|
|
|
|
& p2ptag, icomm,iret)
|
|
|
|
nesd = idx%v(pnti+nerv+psb_n_elem_send_)
|
|
|
|
else
|
|
|
|
snd_pt = 1+pnti+nerv+psb_n_elem_send_
|
|
|
|
call mpi_send(rcvbuf(rcv_pt),nerv,&
|
|
|
|
rcv_pt = 1+pnti+psb_n_elem_recv_
|
|
|
|
& psb_mpi_ipk_integer,prcid(i),&
|
|
|
|
|
|
|
|
& p2ptag, icomm,iret)
|
|
|
|
if (proc_to_comm /= me)then
|
|
|
|
end if
|
|
|
|
if (nerv>0) then
|
|
|
|
|
|
|
|
call mpi_wait(y%comid(i,1),p2pstat,iret)
|
|
|
|
if(iret /= mpi_success) then
|
|
|
|
if(iret /= mpi_success) then
|
|
|
|
ierr(1) = iret
|
|
|
|
ierr(1) = iret
|
|
|
|
info=psb_err_mpi_error_
|
|
|
|
info=psb_err_mpi_error_
|
|
|
@ -1371,120 +1314,69 @@ subroutine psi_itranidx_vect(iictxt,iicomm,flag,beta,y,idx,&
|
|
|
|
goto 9999
|
|
|
|
goto 9999
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
rcv_pt = rcv_pt + nerv
|
|
|
|
if (nesd>0) then
|
|
|
|
snd_pt = snd_pt + nesd
|
|
|
|
call mpi_wait(y%comid(i,2),p2pstat,iret)
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
end do
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
pnti = 1
|
|
|
|
|
|
|
|
do i=1, totxch
|
|
|
|
|
|
|
|
proc_to_comm = idx(pnti+psb_proc_id_)
|
|
|
|
|
|
|
|
nerv = idx(pnti+psb_n_elem_recv_)
|
|
|
|
|
|
|
|
nesd = idx(pnti+nerv+psb_n_elem_send_)
|
|
|
|
|
|
|
|
p2ptag = psb_int_swap_tag
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if ((proc_to_comm /= me).and.(nesd>0)) then
|
|
|
|
|
|
|
|
call mpi_wait(rvhd(i),p2pstat,iret)
|
|
|
|
|
|
|
|
if(iret /= mpi_success) then
|
|
|
|
if(iret /= mpi_success) then
|
|
|
|
ierr(1) = iret
|
|
|
|
ierr(1) = iret
|
|
|
|
info=psb_err_mpi_error_
|
|
|
|
info=psb_err_mpi_error_
|
|
|
|
call psb_errpush(info,name,i_err=ierr)
|
|
|
|
call psb_errpush(info,name,i_err=ierr)
|
|
|
|
goto 9999
|
|
|
|
goto 9999
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
|
|
|
|
end if
|
|
|
|
else if (proc_to_comm == me) then
|
|
|
|
else if (proc_to_comm == me) then
|
|
|
|
if (nesd /= nerv) then
|
|
|
|
if (nesd /= nerv) then
|
|
|
|
write(psb_err_unit,*) &
|
|
|
|
write(psb_err_unit,*) &
|
|
|
|
& 'Fatal error in swaptran: mismatch on self send', &
|
|
|
|
& 'Fatal error in swapdata: mismatch on self send',&
|
|
|
|
& nerv,nesd
|
|
|
|
& nerv,nesd
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
sndbuf(snd_pt:snd_pt+nesd-1) = rcvbuf(rcv_pt:rcv_pt+nerv-1)
|
|
|
|
y%combuf(snd_pt:snd_pt+nesd-1) = y%combuf(rcv_pt:rcv_pt+nerv-1)
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
end do
|
|
|
|
end do
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if (debug) write(*,*) me,' scatter'
|
|
|
|
else if (swap_send) then
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
pnti = 1
|
|
|
|
|
|
|
|
snd_pt = 1
|
|
|
|
|
|
|
|
rcv_pt = 1
|
|
|
|
|
|
|
|
do i=1, totxch
|
|
|
|
|
|
|
|
proc_to_comm = idx(pnti+psb_proc_id_)
|
|
|
|
|
|
|
|
nerv = idx(pnti+psb_n_elem_recv_)
|
|
|
|
|
|
|
|
nesd = idx(pnti+nerv+psb_n_elem_send_)
|
|
|
|
|
|
|
|
if (nerv>0) call psb_snd(ictxt,&
|
|
|
|
|
|
|
|
& rcvbuf(rcv_pt:rcv_pt+nerv-1), proc_to_comm)
|
|
|
|
|
|
|
|
rcv_pt = rcv_pt + nerv
|
|
|
|
|
|
|
|
snd_pt = snd_pt + nesd
|
|
|
|
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
end do
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
else if (swap_recv) then
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
pnti = 1
|
|
|
|
pnti = 1
|
|
|
|
snd_pt = 1
|
|
|
|
snd_pt = 1
|
|
|
|
rcv_pt = 1
|
|
|
|
rcv_pt = 1
|
|
|
|
do i=1, totxch
|
|
|
|
do i=1, totxch
|
|
|
|
proc_to_comm = idx(pnti+psb_proc_id_)
|
|
|
|
proc_to_comm = idx%v(pnti+psb_proc_id_)
|
|
|
|
nerv = idx(pnti+psb_n_elem_recv_)
|
|
|
|
nerv = idx%v(pnti+psb_n_elem_recv_)
|
|
|
|
nesd = idx(pnti+nerv+psb_n_elem_send_)
|
|
|
|
nesd = idx%v(pnti+nerv+psb_n_elem_send_)
|
|
|
|
if (nesd>0) call psb_rcv(ictxt,&
|
|
|
|
idx_pt = 1+pnti+psb_n_elem_recv_
|
|
|
|
& sndbuf(snd_pt:snd_pt+nesd-1), proc_to_comm)
|
|
|
|
snd_pt = 1+pnti+nerv+psb_n_elem_send_
|
|
|
|
rcv_pt = rcv_pt + nerv
|
|
|
|
rcv_pt = 1+pnti+psb_n_elem_recv_
|
|
|
|
snd_pt = snd_pt + nesd
|
|
|
|
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
end do
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if (do_recv) then
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
pnti = 1
|
|
|
|
if (debug) write(0,*)me,' Received from: ',prcid(i),&
|
|
|
|
snd_pt = 1
|
|
|
|
& y%combuf(snd_pt:snd_pt+nesd-1)
|
|
|
|
rcv_pt = 1
|
|
|
|
call y%sct(snd_pt,nesd,idx,beta)
|
|
|
|
do i=1, totxch
|
|
|
|
|
|
|
|
proc_to_comm = idx(pnti+psb_proc_id_)
|
|
|
|
|
|
|
|
nerv = idx(pnti+psb_n_elem_recv_)
|
|
|
|
|
|
|
|
nesd = idx(pnti+nerv+psb_n_elem_send_)
|
|
|
|
|
|
|
|
idx_pt = 1+pnti+nerv+psb_n_elem_send_
|
|
|
|
|
|
|
|
call y%sct(nesd,idx(idx_pt:idx_pt+nesd-1),&
|
|
|
|
|
|
|
|
& sndbuf(snd_pt:snd_pt+nesd-1),beta)
|
|
|
|
|
|
|
|
rcv_pt = rcv_pt + nerv
|
|
|
|
|
|
|
|
snd_pt = snd_pt + nesd
|
|
|
|
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
pnti = pnti + nerv + nesd + 3
|
|
|
|
end do
|
|
|
|
end do
|
|
|
|
|
|
|
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
!
|
|
|
|
if (swap_mpi) then
|
|
|
|
! Then wait
|
|
|
|
deallocate(sdsz,rvsz,bsdidx,brvidx,rvhd,prcid,sdhd,&
|
|
|
|
!
|
|
|
|
& stat=info)
|
|
|
|
if (debug) write(*,*) me,' wait'
|
|
|
|
else
|
|
|
|
call y%device_wait()
|
|
|
|
deallocate(rvhd,prcid,stat=info)
|
|
|
|
if (debug) write(*,*) me,' free buffer'
|
|
|
|
end if
|
|
|
|
call y%free_buffer(info)
|
|
|
|
if(info /= psb_success_) then
|
|
|
|
if (info == 0) call y%free_comid(info)
|
|
|
|
|
|
|
|
if (info /= 0) then
|
|
|
|
call psb_errpush(psb_err_alloc_dealloc_,name)
|
|
|
|
call psb_errpush(psb_err_alloc_dealloc_,name)
|
|
|
|
goto 9999
|
|
|
|
goto 9999
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
if(albf) deallocate(sndbuf,rcvbuf,stat=info)
|
|
|
|
if (debug) write(*,*) me,' done'
|
|
|
|
if(info /= psb_success_) then
|
|
|
|
|
|
|
|
call psb_errpush(psb_err_alloc_dealloc_,name)
|
|
|
|
|
|
|
|
goto 9999
|
|
|
|
|
|
|
|
end if
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
call psb_erractionrestore(err_act)
|
|
|
|
call psb_erractionrestore(err_act)
|
|
|
|
return
|
|
|
|
return
|
|
|
|
|
|
|
|
|
|
|
|
9999 call psb_error_handler(ictxt,err_act)
|
|
|
|
9999 call psb_error_handler(ictxt,err_act)
|
|
|
|
|
|
|
|
|
|
|
|
return
|
|
|
|
return
|
|
|
|
end subroutine psi_itranidx_vect
|
|
|
|
|
|
|
|
|
|
|
|
end subroutine psi_itran_vidx_vect
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|