|
|
|
@ -1,7 +1,7 @@
|
|
|
|
|
module mat_dist
|
|
|
|
|
|
|
|
|
|
interface matdist
|
|
|
|
|
module procedure dmatdistf, zmatdistf, dmatdistv
|
|
|
|
|
module procedure dmatdistf, dmatdistv
|
|
|
|
|
end interface
|
|
|
|
|
|
|
|
|
|
contains
|
|
|
|
@ -64,18 +64,21 @@ contains
|
|
|
|
|
! on entry: specifies processor holding a_glob. default: 0
|
|
|
|
|
! on exit : unchanged.
|
|
|
|
|
!
|
|
|
|
|
use f90sparse
|
|
|
|
|
implicit none ! parameters
|
|
|
|
|
type(d_spmat) :: a_glob
|
|
|
|
|
use psb_all_mod
|
|
|
|
|
implicit none
|
|
|
|
|
|
|
|
|
|
! parameters
|
|
|
|
|
type(psb_dspmat_type) :: a_glob
|
|
|
|
|
real(kind(1.d0)), pointer :: b_glob(:)
|
|
|
|
|
integer :: icontxt
|
|
|
|
|
type(d_spmat) :: a
|
|
|
|
|
type(psb_dspmat_type) :: a
|
|
|
|
|
real(kind(1.d0)), pointer :: b(:)
|
|
|
|
|
type (desc_type) :: desc_a
|
|
|
|
|
type (psb_desc_type) :: desc_a
|
|
|
|
|
integer, intent(out) :: info
|
|
|
|
|
integer, optional :: inroot
|
|
|
|
|
character(len=5), optional :: fmt
|
|
|
|
|
interface
|
|
|
|
|
|
|
|
|
|
! .....user passed subroutine.....
|
|
|
|
|
subroutine parts(global_indx,n,np,pv,nv)
|
|
|
|
|
implicit none
|
|
|
|
@ -83,19 +86,21 @@ contains
|
|
|
|
|
integer, intent(out) :: nv
|
|
|
|
|
integer, intent(out) :: pv(*)
|
|
|
|
|
end subroutine parts
|
|
|
|
|
end interface ! local variables
|
|
|
|
|
end interface
|
|
|
|
|
|
|
|
|
|
! local variables
|
|
|
|
|
integer :: nprow, npcol, myprow, mypcol
|
|
|
|
|
integer :: ircode, length_row, i_count, j_count,&
|
|
|
|
|
& k_count, blockdim, root, liwork, nrow, ncol, nnzero, nrhs,&
|
|
|
|
|
& i,j,k, ll, isize, iproc, nnr, err, err_act, int_err(5)
|
|
|
|
|
integer, pointer :: iwork(:)
|
|
|
|
|
character :: afmt*5, atyp*5
|
|
|
|
|
type(d_spmat) :: blck
|
|
|
|
|
type(psb_dspmat_type) :: blck
|
|
|
|
|
integer, parameter :: nb=30
|
|
|
|
|
real(kind(1.d0)) :: t0, t1, t2, t3, t4, t5, mpi_wtime
|
|
|
|
|
external :: mpi_wtime
|
|
|
|
|
logical, parameter :: newt=.true.
|
|
|
|
|
character(len=20) :: name, ch_err
|
|
|
|
|
character(len=20) :: name, ch_err
|
|
|
|
|
|
|
|
|
|
info = 0
|
|
|
|
|
err = 0
|
|
|
|
@ -142,7 +147,6 @@ contains
|
|
|
|
|
liwork = max(nprow, nrow + ncol)
|
|
|
|
|
allocate(iwork(liwork), stat = info)
|
|
|
|
|
if (info /= 0) then
|
|
|
|
|
write(0,*) 'matdist allocation failed'
|
|
|
|
|
info=2025
|
|
|
|
|
int_err(1)=liwork
|
|
|
|
|
call psb_errpush(info,name,i_err=int_err)
|
|
|
|
@ -161,7 +165,7 @@ contains
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
else
|
|
|
|
|
call f90_psdscall(nrow,nrow,parts,icontxt,desc_a,info)
|
|
|
|
|
call psb_dscall(nrow,nrow,parts,icontxt,desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psb_psdscall'
|
|
|
|
@ -169,14 +173,14 @@ contains
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
endif
|
|
|
|
|
call f90_psspall(a,desc_a,info,nnz=nnzero/nprow)
|
|
|
|
|
call psb_spalloc(a,desc_a,info,nnz=nnzero/nprow)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psb_psspall'
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
call f90_psdsall(nrow,b,desc_a,info)
|
|
|
|
|
call psb_alloc(nrow,b,desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psb_psdsall'
|
|
|
|
@ -188,7 +192,7 @@ contains
|
|
|
|
|
|
|
|
|
|
blck%m = nb
|
|
|
|
|
blck%k = ncol
|
|
|
|
|
call spall(blck,nb*ncol,info)
|
|
|
|
|
call psb_spall(blck,nb*ncol,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='spall'
|
|
|
|
@ -201,8 +205,6 @@ contains
|
|
|
|
|
|
|
|
|
|
do while (i_count.le.nrow)
|
|
|
|
|
|
|
|
|
|
!!$ write(0,*) myprow,'main loop in matdist',i_count,nrow
|
|
|
|
|
!!$ call blacs_barrier(icontxt,'all')
|
|
|
|
|
call parts(i_count,nrow,nprow,iwork, length_row)
|
|
|
|
|
|
|
|
|
|
if (length_row.eq.1) then
|
|
|
|
@ -219,8 +221,7 @@ contains
|
|
|
|
|
|
|
|
|
|
! now we should insert rows i_count..j_count-1
|
|
|
|
|
nnr = j_count - i_count
|
|
|
|
|
!!$ write(0,*) myprow,'main loop in matdist',i_count,nnr,iproc
|
|
|
|
|
!!$ call blacs_barrier(icontxt,'all')
|
|
|
|
|
|
|
|
|
|
if (myprow == root) then
|
|
|
|
|
|
|
|
|
|
do j = i_count, j_count
|
|
|
|
@ -238,18 +239,18 @@ contains
|
|
|
|
|
blck%m = nnr
|
|
|
|
|
blck%k = nrow
|
|
|
|
|
if (iproc == myprow) then
|
|
|
|
|
call f90_psspins(a,i_count,1,blck,desc_a,info)
|
|
|
|
|
call psb_spins(ll,blck%ia1,blck%ia2,blck%aspk,a,desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psspins'
|
|
|
|
|
ch_err='psb_spins'
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
call f90_psdsins(nnr,b,i_count,b_glob(i_count:j_count-1),&
|
|
|
|
|
call psb_ins(nnr,b,i_count,b_glob(i_count:j_count-1),&
|
|
|
|
|
&desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psdsins'
|
|
|
|
|
ch_err='psb_ins'
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
@ -267,33 +268,33 @@ contains
|
|
|
|
|
if (iproc == myprow) then
|
|
|
|
|
call igerv2d(icontxt,1,1,nnr,1,root,0)
|
|
|
|
|
call igerv2d(icontxt,1,1,ll,1,root,0)
|
|
|
|
|
!!$ write(0,*) myprow,'rows and size ',nnr,ll,size(blck%ia2),size(blck%ia1)
|
|
|
|
|
call igerv2d(icontxt,nnr+1,1,blck%ia2,nnr+1,root,0)
|
|
|
|
|
if (ll > size(blck%ia1)) then
|
|
|
|
|
write(0,*) myprow,'need to reallocate ',ll
|
|
|
|
|
call spreall(blck,ll,info)
|
|
|
|
|
call psb_spreall(blck,ll,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='spreall'
|
|
|
|
|
ch_err='psb_spreall'
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
endif
|
|
|
|
|
call igerv2d(icontxt,ll,1,blck%ia1,ll,root,0)
|
|
|
|
|
call igerv2d(icontxt,nnr+1,1,blck%ia2,nnr+1,root,0)
|
|
|
|
|
call dgerv2d(icontxt,ll,1,blck%aspk,ll,root,0)
|
|
|
|
|
call dgerv2d(icontxt,nnr,1,b_glob(i_count:i_count+nnr-1),nnr,root,0)
|
|
|
|
|
call igesd2d(icontxt,1,1,ll,1,root,0)
|
|
|
|
|
blck%m = nnr
|
|
|
|
|
blck%k = nrow
|
|
|
|
|
call f90_psspins(a,i_count,1,blck,desc_a,info)
|
|
|
|
|
blck%infoa(psb_nnz_) = ll
|
|
|
|
|
call psb_spins(ll,blck%ia1,blck%ia2,blck%aspk,a,desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psspins'
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
call f90_psdsins(nnr,b,i_count,b_glob(i_count:i_count+nnr-1),&
|
|
|
|
|
call psb_ins(nnr,b,i_count,b_glob(i_count:i_count+nnr-1),&
|
|
|
|
|
&desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
@ -330,14 +331,14 @@ contains
|
|
|
|
|
blck%m = 1
|
|
|
|
|
blck%k = nrow
|
|
|
|
|
|
|
|
|
|
call f90_psspins(a,i_count,1,blck,desc_a,info)
|
|
|
|
|
call psb_spins(ll,blck%ia1,blck%ia2,blck%aspk,a,desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psspins'
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
call f90_psdsins(1,b,i_count,b_glob(i_count:i_count),&
|
|
|
|
|
call psb_ins(1,b,i_count,b_glob(i_count:i_count),&
|
|
|
|
|
&desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
@ -363,14 +364,14 @@ contains
|
|
|
|
|
call igesd2d(icontxt,1,1,ll,1,root,0)
|
|
|
|
|
blck%m = 1
|
|
|
|
|
blck%k = nrow
|
|
|
|
|
call f90_psspins(a,i_count,1,blck,desc_a,info)
|
|
|
|
|
call psb_spins(ll,blck%ia1,blck%ia2,blck%aspk,a,desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psspins'
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
call f90_psdsins(1,b,i_count,b_glob(i_count:i_count),&
|
|
|
|
|
call psb_ins(1,b,i_count,b_glob(i_count:i_count),&
|
|
|
|
|
&desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
@ -422,7 +423,7 @@ contains
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
else
|
|
|
|
|
call f90_psspasb(a,desc_a,info,dup=1,afmt=afmt)
|
|
|
|
|
call psb_spasb(a,desc_a,info,afmt=afmt,dup=1)
|
|
|
|
|
if(info/=0)then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psspasb'
|
|
|
|
@ -432,14 +433,14 @@ contains
|
|
|
|
|
endif
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
call f90_psdsasb(b,desc_a,info)
|
|
|
|
|
call psb_asb(b,desc_a,info)
|
|
|
|
|
if(info/=0)then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psdsasb'
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
call spfree(blck,info)
|
|
|
|
|
call psb_spfree(blck,info)
|
|
|
|
|
if(info/=0)then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='spfree'
|
|
|
|
@ -522,14 +523,14 @@ contains
|
|
|
|
|
! on entry: specifies processor holding a_glob. default: 0
|
|
|
|
|
! on exit : unchanged.
|
|
|
|
|
!
|
|
|
|
|
use f90sparse
|
|
|
|
|
use psb_all_mod
|
|
|
|
|
implicit none ! parameters
|
|
|
|
|
type(d_spmat) :: a_glob
|
|
|
|
|
type(psb_dspmat_type) :: a_glob
|
|
|
|
|
real(kind(1.d0)), pointer :: b_glob(:)
|
|
|
|
|
integer :: icontxt, v(:)
|
|
|
|
|
type(d_spmat) :: a
|
|
|
|
|
type(psb_dspmat_type) :: a
|
|
|
|
|
real(kind(1.d0)), pointer :: b(:)
|
|
|
|
|
type (desc_type) :: desc_a
|
|
|
|
|
type (psb_desc_type) :: desc_a
|
|
|
|
|
integer, intent(out) :: info
|
|
|
|
|
integer, optional :: inroot
|
|
|
|
|
character(len=5), optional :: fmt
|
|
|
|
@ -540,7 +541,7 @@ contains
|
|
|
|
|
& i,j,k, ll, isize, iproc, nnr, err, err_act, int_err(5)
|
|
|
|
|
integer, pointer :: iwork(:)
|
|
|
|
|
character :: afmt*5, atyp*5
|
|
|
|
|
type(d_spmat) :: blck
|
|
|
|
|
type(psb_dspmat_type) :: blck
|
|
|
|
|
integer, parameter :: nb=30
|
|
|
|
|
logical, parameter :: newt=.true.
|
|
|
|
|
real(kind(1.d0)) :: t0, t1, t2, t3, t4, t5, mpi_wtime
|
|
|
|
@ -615,14 +616,14 @@ contains
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
call f90_psspall(a,desc_a,info,nnz=((nnzero+nprow-1)/nprow))
|
|
|
|
|
call psb_spalloc(a,desc_a,info,nnz=((nnzero+nprow-1)/nprow))
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psb_psspall'
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
call f90_psdsall(nrow,b,desc_a,info)
|
|
|
|
|
call psb_alloc(nrow,b,desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='psb_psdsall'
|
|
|
|
@ -634,7 +635,7 @@ contains
|
|
|
|
|
|
|
|
|
|
blck%m = nb
|
|
|
|
|
blck%k = ncol
|
|
|
|
|
call spall(blck,nb*ncol,info)
|
|
|
|
|
call psb_spall(blck,nb*ncol,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='spall'
|
|
|
|
@ -663,7 +664,7 @@ contains
|
|
|
|
|
if (myprow == root) then
|
|
|
|
|
ll = a_glob%ia2(j_count)-a_glob%ia2(i_count)
|
|
|
|
|
if (ll > size(blck%aspk)) then
|
|
|
|
|
call spreall(blck,ll,info)
|
|
|
|
|
call psb_spreall(blck,ll,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='spreall'
|
|
|
|
@ -683,17 +684,17 @@ contains
|
|
|
|
|
|
|
|
|
|
blck%m = nnr
|
|
|
|
|
blck%k = nrow
|
|
|
|
|
blck%infoa(nnz_) = ll
|
|
|
|
|
blck%infoa(psb_nnz_) = ll
|
|
|
|
|
if (iproc == myprow) then
|
|
|
|
|
call psb_spins(ll,blck%ia1,blck%ia2,blck%aspk,a,desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='spins'
|
|
|
|
|
ch_err='psb_spins'
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
call f90_psdsins(nnr,b,i_count,b_glob(i_count:j_count-1),&
|
|
|
|
|
call psb_ins(nnr,b,i_count,b_glob(i_count:j_count-1),&
|
|
|
|
|
&desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
@ -717,7 +718,7 @@ contains
|
|
|
|
|
call igerv2d(icontxt,1,1,ll,1,root,0)
|
|
|
|
|
if (ll > size(blck%aspk)) then
|
|
|
|
|
write(0,*) myprow,'need to reallocate ',ll
|
|
|
|
|
call spreall(blck,ll,info)
|
|
|
|
|
call psb_spreall(blck,ll,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='spreall'
|
|
|
|
@ -732,7 +733,7 @@ contains
|
|
|
|
|
call igesd2d(icontxt,1,1,ll,1,root,0)
|
|
|
|
|
blck%m = nnr
|
|
|
|
|
blck%k = nrow
|
|
|
|
|
blck%infoa(nnz_) = ll
|
|
|
|
|
blck%infoa(psb_nnz_) = ll
|
|
|
|
|
call psb_spins(ll,blck%ia1,blck%ia2,blck%aspk,a,desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
@ -740,7 +741,7 @@ contains
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
call f90_psdsins(nnr,b,i_count,b_glob(i_count:i_count+nnr-1),&
|
|
|
|
|
call psb_ins(nnr,b,i_count,b_glob(i_count:i_count+nnr-1),&
|
|
|
|
|
&desc_a,info)
|
|
|
|
|
if(info/=0) then
|
|
|
|
|
info=4010
|
|
|
|
@ -795,7 +796,7 @@ contains
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
call spfree(blck,info)
|
|
|
|
|
call psb_spfree(blck,info)
|
|
|
|
|
if(info/=0)then
|
|
|
|
|
info=4010
|
|
|
|
|
ch_err='spfree'
|
|
|
|
@ -819,297 +820,4 @@ contains
|
|
|
|
|
|
|
|
|
|
end subroutine dmatdistv
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
subroutine zmatdistf (a_glob, a, parts, icontxt, desc_a,&
|
|
|
|
|
& b_glob, b, info,inroot,fmt)
|
|
|
|
|
!
|
|
|
|
|
! an utility subroutine to distribute a matrix among processors
|
|
|
|
|
! according to a user defined data distribution, using pessl
|
|
|
|
|
! sparse matrix subroutines.
|
|
|
|
|
!
|
|
|
|
|
! type(d_spmat) :: a_glob
|
|
|
|
|
! on entry: this contains the global sparse matrix as follows:
|
|
|
|
|
! a%fida =='csr'
|
|
|
|
|
! a%aspk for coefficient values
|
|
|
|
|
! a%ia1 for column indices
|
|
|
|
|
! a%ia2 for row pointers
|
|
|
|
|
! a%m for number of global matrix rows
|
|
|
|
|
! a%k for number of global matrix columns
|
|
|
|
|
! on exit : undefined, with unassociated pointers.
|
|
|
|
|
!
|
|
|
|
|
! type(d_spmat) :: a
|
|
|
|
|
! on entry: fresh variable.
|
|
|
|
|
! on exit : this will contain the local sparse matrix.
|
|
|
|
|
!
|
|
|
|
|
! interface parts
|
|
|
|
|
! ! .....user passed subroutine.....
|
|
|
|
|
! subroutine parts(global_indx,n,np,pv,nv)
|
|
|
|
|
! implicit none
|
|
|
|
|
! integer, intent(in) :: global_indx, n, np
|
|
|
|
|
! integer, intent(out) :: nv
|
|
|
|
|
! integer, intent(out) :: pv(*)
|
|
|
|
|
!
|
|
|
|
|
! end subroutine parts
|
|
|
|
|
! end interface
|
|
|
|
|
! on entry: subroutine providing user defined data distribution.
|
|
|
|
|
! for each global_indx the subroutine should return
|
|
|
|
|
! the list pv of all processes owning the row with
|
|
|
|
|
! that index; the list will contain nv entries.
|
|
|
|
|
! usually nv=1; if nv >1 then we have an overlap in the data
|
|
|
|
|
! distribution.
|
|
|
|
|
!
|
|
|
|
|
! integer :: icontxt
|
|
|
|
|
! on entry: blacs context.
|
|
|
|
|
! on exit : unchanged.
|
|
|
|
|
!
|
|
|
|
|
! type (desc_type) :: desc_a
|
|
|
|
|
! on entry: fresh variable.
|
|
|
|
|
! on exit : the updated array descriptor
|
|
|
|
|
!
|
|
|
|
|
! real(kind(1.d0)), pointer, optional :: b_glob(:)
|
|
|
|
|
! on entry: this contains right hand side.
|
|
|
|
|
! on exit :
|
|
|
|
|
!
|
|
|
|
|
! real(kind(1.d0)), pointer, optional :: b(:)
|
|
|
|
|
! on entry: fresh variable.
|
|
|
|
|
! on exit : this will contain the local right hand side.
|
|
|
|
|
!
|
|
|
|
|
! integer, optional :: inroot
|
|
|
|
|
! on entry: specifies processor holding a_glob. default: 0
|
|
|
|
|
! on exit : unchanged.
|
|
|
|
|
!
|
|
|
|
|
use typesp
|
|
|
|
|
use typedesc
|
|
|
|
|
use f90tools
|
|
|
|
|
implicit none ! parameters
|
|
|
|
|
type(z_spmat) :: a_glob
|
|
|
|
|
complex(kind(1.d0)), pointer :: b_glob(:)
|
|
|
|
|
integer :: icontxt
|
|
|
|
|
type(z_spmat) :: a
|
|
|
|
|
complex(kind(1.d0)), pointer :: b(:)
|
|
|
|
|
type (desc_type) :: desc_a
|
|
|
|
|
integer, intent(out) :: info
|
|
|
|
|
integer, optional :: inroot
|
|
|
|
|
character(len=5), optional :: fmt
|
|
|
|
|
interface
|
|
|
|
|
! .....user passed subroutine.....
|
|
|
|
|
subroutine parts(global_indx,n,np,pv,nv)
|
|
|
|
|
implicit none
|
|
|
|
|
integer, intent(in) :: global_indx, n, np
|
|
|
|
|
integer, intent(out) :: nv
|
|
|
|
|
integer, intent(out) :: pv(*)
|
|
|
|
|
end subroutine parts
|
|
|
|
|
end interface ! local variables
|
|
|
|
|
integer :: nprow, npcol, myprow, mypcol
|
|
|
|
|
integer :: ircode, length_row, i_count, j_count,&
|
|
|
|
|
& k_count, blockdim, root, liwork, nrow, ncol, nnzero, nrhs,&
|
|
|
|
|
& i,j,k, ll, isize, iproc, nnr, err, err_act, int_err(5)
|
|
|
|
|
integer, pointer :: iwork(:)
|
|
|
|
|
character :: afmt*5, atyp*5
|
|
|
|
|
type(z_spmat) :: blck
|
|
|
|
|
integer, parameter :: nb = 30
|
|
|
|
|
character(len=20) :: name, ch_err
|
|
|
|
|
|
|
|
|
|
info = 0
|
|
|
|
|
err = 0
|
|
|
|
|
name = 'mat_distf'
|
|
|
|
|
call psb_erractionsave(err_act)
|
|
|
|
|
|
|
|
|
|
! executable statements
|
|
|
|
|
if (present(inroot)) then
|
|
|
|
|
root = inroot
|
|
|
|
|
else
|
|
|
|
|
root = 0
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
call blacs_gridinfo(icontxt, nprow, npcol, myprow, mypcol)
|
|
|
|
|
if (myprow == root) then
|
|
|
|
|
! extract information from a_glob
|
|
|
|
|
if (a_glob%fida.ne. 'CSR') then
|
|
|
|
|
write(0,*) 'unsupported input matrix format'
|
|
|
|
|
call blacs_abort(icontxt,-1)
|
|
|
|
|
endif
|
|
|
|
|
nrow = a_glob%m
|
|
|
|
|
ncol = a_glob%k
|
|
|
|
|
if (nrow /= ncol) then
|
|
|
|
|
write(0,*) 'a rectangular matrix ? ',nrow,ncol
|
|
|
|
|
call blacs_abort(icontxt,-1)
|
|
|
|
|
endif
|
|
|
|
|
nnzero = size(a_glob%aspk)
|
|
|
|
|
nrhs = 1
|
|
|
|
|
! broadcast informations to other processors
|
|
|
|
|
call igebs2d(icontxt, 'a', ' ', 1, 1, nrow, 1)
|
|
|
|
|
call igebs2d(icontxt, 'a', ' ', 1, 1, ncol, 1)
|
|
|
|
|
call igebs2d(icontxt, 'a', ' ', 1, 1, nnzero, 1)
|
|
|
|
|
call igebs2d(icontxt, 'a', ' ', 1, 1, nrhs, 1)
|
|
|
|
|
else !(myprow /= root)
|
|
|
|
|
! receive informations
|
|
|
|
|
call igebr2d(icontxt, 'a', ' ', 1, 1, nrow, 1, root, 0)
|
|
|
|
|
call igebr2d(icontxt, 'a', ' ', 1, 1, ncol, 1, root, 0)
|
|
|
|
|
call igebr2d(icontxt, 'a', ' ', 1, 1, nnzero, 1, root, 0)
|
|
|
|
|
call igebr2d(icontxt, 'a', ' ', 1, 1, nrhs, 1, root, 0)
|
|
|
|
|
end if ! allocate integer work area
|
|
|
|
|
liwork = max(nprow, nrow + ncol)
|
|
|
|
|
allocate(iwork(liwork), stat = ircode)
|
|
|
|
|
if (ircode /= 0) then
|
|
|
|
|
write(0,*) 'matdist allocation failed'
|
|
|
|
|
return
|
|
|
|
|
endif
|
|
|
|
|
if (myprow == root) then
|
|
|
|
|
write (*, fmt = *) 'start matdist',root, size(iwork)
|
|
|
|
|
endif
|
|
|
|
|
call f90_psdscall(nrow,nrow,parts,icontxt,desc_a,info)
|
|
|
|
|
call f90_psspall(a,desc_a,info,nnz=nnzero/nprow)
|
|
|
|
|
call f90_psdsall(nrow,b,desc_a,info)
|
|
|
|
|
isize = max(3*nb,ncol)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
allocate(blck%aspk(nnzero),blck%ia1(nnzero),blck%ia2(nnzero),stat=ircode)
|
|
|
|
|
if (ircode /= 0) then
|
|
|
|
|
write(0,*) 'error on allocating blck'
|
|
|
|
|
call blacs_abort(icontxt,-1)
|
|
|
|
|
stop
|
|
|
|
|
endif
|
|
|
|
|
|
|
|
|
|
blck%m = 1
|
|
|
|
|
blck%k = ncol
|
|
|
|
|
blck%fida = 'csr'
|
|
|
|
|
i_count = 1
|
|
|
|
|
|
|
|
|
|
do while (i_count.le.nrow)
|
|
|
|
|
call parts(i_count,nrow,nprow,iwork, length_row)
|
|
|
|
|
|
|
|
|
|
if (length_row.eq.1) then
|
|
|
|
|
j_count = i_count + 1
|
|
|
|
|
iproc = iwork(1)
|
|
|
|
|
call parts(j_count,nrow,nprow,iwork, length_row)
|
|
|
|
|
|
|
|
|
|
do while ((j_count.le.nrow).and.(j_count-i_count.lt.nb)&
|
|
|
|
|
&.and.(length_row.eq.1).and.(iwork(1).eq.iproc))
|
|
|
|
|
j_count = j_count + 1
|
|
|
|
|
if (j_count.le.nrow) &
|
|
|
|
|
& call parts(j_count,nrow,nprow,iwork, length_row)
|
|
|
|
|
end do
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
! now we should insert rows i_count..j_count-1
|
|
|
|
|
nnr = j_count - i_count
|
|
|
|
|
|
|
|
|
|
if (myprow == root) then
|
|
|
|
|
do j = i_count, j_count
|
|
|
|
|
blck%ia2(j-i_count+1) = a_glob%ia2(j) - &
|
|
|
|
|
& a_glob%ia2(i_count) + 1
|
|
|
|
|
enddo
|
|
|
|
|
|
|
|
|
|
k = a_glob%ia2(i_count)
|
|
|
|
|
do j = k, a_glob%ia2(j_count)-1
|
|
|
|
|
blck%aspk(j-k+1) = a_glob%aspk(j)
|
|
|
|
|
blck%ia1(j-k+1) = a_glob%ia1(j)
|
|
|
|
|
enddo
|
|
|
|
|
|
|
|
|
|
ll = blck%ia2(nnr+1) - 1
|
|
|
|
|
blck%m = nnr
|
|
|
|
|
blck%k = nrow
|
|
|
|
|
if (iproc == myprow) then
|
|
|
|
|
call f90_psspins(a,i_count,1,blck,desc_a,info)
|
|
|
|
|
call f90_psdsins(nnr,b,i_count,b_glob(i_count:j_count-1),&
|
|
|
|
|
&desc_a,info)
|
|
|
|
|
else
|
|
|
|
|
call igesd2d(icontxt,1,1,nnr,1,iproc,0)
|
|
|
|
|
call igesd2d(icontxt,1,1,ll,1,iproc,0)
|
|
|
|
|
call igesd2d(icontxt,nnr+1,1,blck%ia2,nnr+1,iproc,0)
|
|
|
|
|
call igesd2d(icontxt,ll,1,blck%ia1,ll,iproc,0)
|
|
|
|
|
call zgesd2d(icontxt,ll,1,blck%aspk,ll,iproc,0)
|
|
|
|
|
call zgesd2d(icontxt,nnr,1,b_glob(i_count:j_count-1),nnr,iproc,0)
|
|
|
|
|
call igerv2d(icontxt,1,1,ll,1,iproc,0)
|
|
|
|
|
endif
|
|
|
|
|
|
|
|
|
|
else if (myprow /= root) then
|
|
|
|
|
|
|
|
|
|
if (iproc == myprow) then
|
|
|
|
|
call igerv2d(icontxt,1,1,nnr,1,root,0)
|
|
|
|
|
call igerv2d(icontxt,1,1,ll,1,root,0)
|
|
|
|
|
call igerv2d(icontxt,nnr+1,1,blck%ia2,nnr+1,root,0)
|
|
|
|
|
call igerv2d(icontxt,ll,1,blck%ia1,ll,root,0)
|
|
|
|
|
call zgerv2d(icontxt,ll,1,blck%aspk,ll,root,0)
|
|
|
|
|
call zgerv2d(icontxt,nnr,1,b_glob(i_count:i_count+nnr-1),nnr,root,0)
|
|
|
|
|
call igesd2d(icontxt,1,1,ll,1,root,0)
|
|
|
|
|
blck%m = nnr
|
|
|
|
|
blck%k = nrow
|
|
|
|
|
call f90_psspins(a,i_count,1,blck,desc_a,info)
|
|
|
|
|
call f90_psdsins(nnr,b,i_count,b_glob(i_count:i_count+nnr-1),&
|
|
|
|
|
&desc_a,info)
|
|
|
|
|
endif
|
|
|
|
|
endif
|
|
|
|
|
|
|
|
|
|
i_count = j_count
|
|
|
|
|
else
|
|
|
|
|
! here processors are counted 1..nprow
|
|
|
|
|
do j_count = 1, length_row
|
|
|
|
|
k_count = iwork(j_count)
|
|
|
|
|
if (myprow == root) then
|
|
|
|
|
blck%ia2(1) = 1
|
|
|
|
|
blck%ia2(2) = 1
|
|
|
|
|
do j = a_glob%ia2(i_count), a_glob%ia2(i_count+1)-1
|
|
|
|
|
blck%aspk(blck%ia2(2)) = a_glob%aspk(j)
|
|
|
|
|
blck%ia1(blck%ia2(2)) = a_glob%ia1(j)
|
|
|
|
|
blck%ia2(2) =blck%ia2(2) + 1
|
|
|
|
|
enddo
|
|
|
|
|
ll = blck%ia2(2) - 1
|
|
|
|
|
if (k_count == myprow) then
|
|
|
|
|
blck%infoa(1) = ll
|
|
|
|
|
blck%infoa(2) = ll
|
|
|
|
|
blck%infoa(3) = 2
|
|
|
|
|
blck%infoa(4) = 1
|
|
|
|
|
blck%infoa(5) = 1
|
|
|
|
|
blck%infoa(6) = 1
|
|
|
|
|
blck%m = 1
|
|
|
|
|
blck%k = nrow
|
|
|
|
|
|
|
|
|
|
call f90_psspins(a,i_count,1,blck,desc_a,info)
|
|
|
|
|
call f90_psdsins(1,b,i_count,b_glob(i_count:i_count),&
|
|
|
|
|
&desc_a,info)
|
|
|
|
|
else
|
|
|
|
|
call igesd2d(icontxt,1,1,ll,1,k_count,0)
|
|
|
|
|
call igesd2d(icontxt,ll,1,blck%ia1,ll,k_count,0)
|
|
|
|
|
call zgesd2d(icontxt,ll,1,blck%aspk,ll,k_count,0)
|
|
|
|
|
call zgesd2d(icontxt,1,1,b_glob(i_count),1,k_count,0)
|
|
|
|
|
call igerv2d(icontxt,1,1,ll,1,k_count,0)
|
|
|
|
|
endif
|
|
|
|
|
else if (myprow /= root) then
|
|
|
|
|
if (k_count == myprow) then
|
|
|
|
|
call igerv2d(icontxt,1,1,ll,1,root,0)
|
|
|
|
|
blck%ia2(1) = 1
|
|
|
|
|
blck%ia2(2) = ll+1
|
|
|
|
|
call igerv2d(icontxt,ll,1,blck%ia1,ll,root,0)
|
|
|
|
|
call zgerv2d(icontxt,ll,1,blck%aspk,ll,root,0)
|
|
|
|
|
call zgerv2d(icontxt,1,1,b_glob(i_count),1,root,0)
|
|
|
|
|
call igesd2d(icontxt,1,1,ll,1,root,0)
|
|
|
|
|
blck%m = 1
|
|
|
|
|
blck%k = nrow
|
|
|
|
|
call f90_psspins(a,i_count,1,blck,desc_a,info)
|
|
|
|
|
call f90_psdsins(1,b,i_count,b_glob(i_count:i_count),&
|
|
|
|
|
&desc_a,info)
|
|
|
|
|
endif
|
|
|
|
|
endif
|
|
|
|
|
end do
|
|
|
|
|
i_count = i_count + 1
|
|
|
|
|
endif
|
|
|
|
|
end do
|
|
|
|
|
! default storage format for sparse matrix; we do not
|
|
|
|
|
! expect duplicated entries.
|
|
|
|
|
|
|
|
|
|
if (present(fmt)) then
|
|
|
|
|
afmt=fmt
|
|
|
|
|
else
|
|
|
|
|
afmt = 'csr'
|
|
|
|
|
endif
|
|
|
|
|
call f90_psspasb(a,desc_a,info,dup=1)
|
|
|
|
|
call f90_psdsasb(b,desc_a,info)
|
|
|
|
|
call spfree(blck,info)
|
|
|
|
|
deallocate(iwork)
|
|
|
|
|
if (myprow == root) write (*, fmt = *) 'end matdist'
|
|
|
|
|
return
|
|
|
|
|
end subroutine zmatdistf
|
|
|
|
|
|
|
|
|
|
end module mat_dist
|
|
|
|
|