|
|
|
@ -43,14 +43,13 @@
|
|
|
|
|
! y - type(psb_d_multivect_type) The input vector containing the entries of sub( Y ).
|
|
|
|
|
! desc_a - type(psb_desc_type). The communication descriptor.
|
|
|
|
|
! info - integer. Return code
|
|
|
|
|
! trans - logical(optional) Whether multivector X is transposed, default: .false.
|
|
|
|
|
! global - logical(optional) Whether to perform the global reduce, default: .true.
|
|
|
|
|
!
|
|
|
|
|
! Note: from a functional point of view, X and Y are input, but here
|
|
|
|
|
! they are declared INOUT because of the sync() methods.
|
|
|
|
|
!
|
|
|
|
|
!
|
|
|
|
|
function psb_dprod_multivect(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
subroutine psb_dprod_multivect(x,y,res,desc_a,info,global)
|
|
|
|
|
use psb_desc_mod
|
|
|
|
|
use psb_d_base_mat_mod
|
|
|
|
|
use psb_check_mod
|
|
|
|
@ -59,11 +58,9 @@ function psb_dprod_multivect(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
use psb_d_vect_mod
|
|
|
|
|
use psb_d_psblas_mod, psb_protect_name => psb_dprod_multivect
|
|
|
|
|
implicit none
|
|
|
|
|
real(psb_dpk_), allocatable :: res(:,:)
|
|
|
|
|
type(psb_d_multivect_type), intent(inout) :: x, y
|
|
|
|
|
type(psb_d_multivect_type), intent(inout) :: x, y, res
|
|
|
|
|
type(psb_desc_type), intent(in) :: desc_a
|
|
|
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
|
logical, intent(in), optional :: trans
|
|
|
|
|
logical, intent(in), optional :: global
|
|
|
|
|
|
|
|
|
|
! locals
|
|
|
|
@ -71,7 +68,7 @@ function psb_dprod_multivect(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
integer(psb_ipk_) :: np, me, idx, ndm,&
|
|
|
|
|
& err_act, iix, jjx, iiy, jjy, i, j, nr
|
|
|
|
|
integer(psb_lpk_) :: ix, ijx, iy, ijy, m, n
|
|
|
|
|
logical :: global_, trans_
|
|
|
|
|
logical :: global_
|
|
|
|
|
character(len=20) :: name, ch_err
|
|
|
|
|
|
|
|
|
|
name='psb_dprod_multivect'
|
|
|
|
@ -99,12 +96,6 @@ function psb_dprod_multivect(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
goto 9999
|
|
|
|
|
endif
|
|
|
|
|
|
|
|
|
|
if (present(trans)) then
|
|
|
|
|
trans_ = trans
|
|
|
|
|
else
|
|
|
|
|
trans_ = .false.
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
if (present(global)) then
|
|
|
|
|
global_ = global
|
|
|
|
|
else
|
|
|
|
@ -140,25 +131,26 @@ function psb_dprod_multivect(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
|
|
|
|
|
nr = desc_a%get_local_rows()
|
|
|
|
|
if (nr > 0) then
|
|
|
|
|
res = x%prod(nr,y,trans_)
|
|
|
|
|
call x%prod(nr,y,res)
|
|
|
|
|
! adjust dot_local because overlapped elements are computed more than once
|
|
|
|
|
if (size(desc_a%ovrlap_elem,1)>0) then
|
|
|
|
|
if (x%v%is_dev()) call x%sync()
|
|
|
|
|
if (y%v%is_dev()) call y%sync()
|
|
|
|
|
if (res%v%is_dev()) call res%sync()
|
|
|
|
|
do j=1,x%get_ncols()
|
|
|
|
|
do i=1,size(desc_a%ovrlap_elem,1)
|
|
|
|
|
idx = desc_a%ovrlap_elem(i,1)
|
|
|
|
|
ndm = desc_a%ovrlap_elem(i,2)
|
|
|
|
|
res(j,:) = res(j,:) - (real(ndm-1)/real(ndm))*(x%v%v(idx,:)*y%v%v(idx,:))
|
|
|
|
|
res%v%v(j,:) = res%v%v(j,:) - (real(ndm-1)/real(ndm))*(x%v%v(idx,:)*y%v%v(idx,:))
|
|
|
|
|
end do
|
|
|
|
|
end do
|
|
|
|
|
end if
|
|
|
|
|
else
|
|
|
|
|
res = dzero
|
|
|
|
|
call res%zero()
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
! compute global sum
|
|
|
|
|
if (global_) call psb_sum(ctxt, res)
|
|
|
|
|
if (global_) call psb_sum(ctxt, res%v%v)
|
|
|
|
|
|
|
|
|
|
call psb_erractionrestore(err_act)
|
|
|
|
|
return
|
|
|
|
@ -167,7 +159,7 @@ function psb_dprod_multivect(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
|
|
|
|
|
return
|
|
|
|
|
|
|
|
|
|
end function psb_dprod_multivect
|
|
|
|
|
end subroutine psb_dprod_multivect
|
|
|
|
|
!
|
|
|
|
|
! Function: psb_dprod_multivect_a
|
|
|
|
|
! psb_dprod computes the product of two distributed multivectors,
|
|
|
|
@ -181,14 +173,13 @@ end function psb_dprod_multivect
|
|
|
|
|
! y - real(:,:) The input vector containing the entries of sub( Y ).
|
|
|
|
|
! desc_a - type(psb_desc_type). The communication descriptor.
|
|
|
|
|
! info - integer. Return code
|
|
|
|
|
! trans - logical(optional) Whether multivector X is transposed, default: .false.
|
|
|
|
|
! global - logical(optional) Whether to perform the global reduce, default: .true.
|
|
|
|
|
!
|
|
|
|
|
! Note: from a functional point of view, X and Y are input, but here
|
|
|
|
|
! they are declared INOUT because of the sync() methods.
|
|
|
|
|
!
|
|
|
|
|
!
|
|
|
|
|
function psb_dprod_multivect_a(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
subroutine psb_dprod_multivect_a(x,y,res,desc_a,info,global)
|
|
|
|
|
use psb_desc_mod
|
|
|
|
|
use psb_d_base_mat_mod
|
|
|
|
|
use psb_check_mod
|
|
|
|
@ -197,12 +188,10 @@ function psb_dprod_multivect_a(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
use psb_d_vect_mod
|
|
|
|
|
use psb_d_psblas_mod, psb_protect_name => psb_dprod_multivect_a
|
|
|
|
|
implicit none
|
|
|
|
|
real(psb_dpk_), allocatable :: res(:,:)
|
|
|
|
|
type(psb_d_multivect_type), intent(inout) :: x
|
|
|
|
|
type(psb_d_multivect_type), intent(inout) :: x, res
|
|
|
|
|
real(psb_dpk_), intent(in) :: y(:,:)
|
|
|
|
|
type(psb_desc_type), intent(in) :: desc_a
|
|
|
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
|
logical, intent(in), optional :: trans
|
|
|
|
|
logical, intent(in), optional :: global
|
|
|
|
|
|
|
|
|
|
! locals
|
|
|
|
@ -210,7 +199,7 @@ function psb_dprod_multivect_a(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
integer(psb_ipk_) :: np, me, idx, ndm,&
|
|
|
|
|
& err_act, iix, jjx, iiy, jjy, i, j, nr
|
|
|
|
|
integer(psb_lpk_) :: ix, ijx, iy, ijy, m, n
|
|
|
|
|
logical :: global_, trans_
|
|
|
|
|
logical :: global_
|
|
|
|
|
character(len=20) :: name, ch_err
|
|
|
|
|
|
|
|
|
|
name='psb_dprod_multivect'
|
|
|
|
@ -233,12 +222,6 @@ function psb_dprod_multivect_a(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
goto 9999
|
|
|
|
|
endif
|
|
|
|
|
|
|
|
|
|
if (present(trans)) then
|
|
|
|
|
trans_ = trans
|
|
|
|
|
else
|
|
|
|
|
trans_ = .false.
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
if (present(global)) then
|
|
|
|
|
global_ = global
|
|
|
|
|
else
|
|
|
|
@ -268,164 +251,25 @@ function psb_dprod_multivect_a(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
|
|
|
|
|
nr = desc_a%get_local_rows()
|
|
|
|
|
if (nr > 0) then
|
|
|
|
|
res = x%prod(nr,y,trans_)
|
|
|
|
|
call x%prod(nr,y,res)
|
|
|
|
|
! adjust dot_local because overlapped elements are computed more than once
|
|
|
|
|
if (size(desc_a%ovrlap_elem,1)>0) then
|
|
|
|
|
if (x%v%is_dev()) call x%sync()
|
|
|
|
|
if (res%v%is_dev()) call res%sync()
|
|
|
|
|
do j=1,x%get_ncols()
|
|
|
|
|
do i=1,size(desc_a%ovrlap_elem,1)
|
|
|
|
|
idx = desc_a%ovrlap_elem(i,1)
|
|
|
|
|
ndm = desc_a%ovrlap_elem(i,2)
|
|
|
|
|
res(j,:) = res(j,:) - (real(ndm-1)/real(ndm))*(x%v%v(idx,:)*y(idx,:))
|
|
|
|
|
res%v%v(j,:) = res%v%v(j,:) - (real(ndm-1)/real(ndm))*(x%v%v(idx,:)*y(idx,:))
|
|
|
|
|
end do
|
|
|
|
|
end do
|
|
|
|
|
end if
|
|
|
|
|
else
|
|
|
|
|
res = dzero
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
! compute global sum
|
|
|
|
|
if (global_) call psb_sum(ctxt, res)
|
|
|
|
|
|
|
|
|
|
call psb_erractionrestore(err_act)
|
|
|
|
|
return
|
|
|
|
|
|
|
|
|
|
9999 call psb_error_handler(ctxt,err_act)
|
|
|
|
|
|
|
|
|
|
return
|
|
|
|
|
|
|
|
|
|
end function psb_dprod_multivect_a
|
|
|
|
|
!
|
|
|
|
|
! Function: psb_dprod_m
|
|
|
|
|
! psb_dprod computes the product of two distributed multivectors,
|
|
|
|
|
!
|
|
|
|
|
! prod := ( X ) * ( Y ) or
|
|
|
|
|
! prod := ( X )**C * ( Y )
|
|
|
|
|
!
|
|
|
|
|
!
|
|
|
|
|
! Arguments:
|
|
|
|
|
! x - real(:,:) The input vector containing the entries of sub( X ).
|
|
|
|
|
! y - real(:,:) The input vector containing the entries of sub( Y ).
|
|
|
|
|
! desc_a - type(psb_desc_type). The communication descriptor.
|
|
|
|
|
! info - integer. Return code
|
|
|
|
|
! trans - logical(optional) Whether multivector X is transposed, default: .false.
|
|
|
|
|
! global - logical(optional) Whether to perform the global reduce, default: .true.
|
|
|
|
|
!
|
|
|
|
|
! Note: from a functional point of view, X and Y are input, but here
|
|
|
|
|
! they are declared INOUT because of the sync() methods.
|
|
|
|
|
!
|
|
|
|
|
!
|
|
|
|
|
function psb_dprod_m(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
use psb_desc_mod
|
|
|
|
|
use psb_d_base_mat_mod
|
|
|
|
|
use psb_check_mod
|
|
|
|
|
use psb_error_mod
|
|
|
|
|
use psb_penv_mod
|
|
|
|
|
use psb_d_vect_mod
|
|
|
|
|
use psb_d_psblas_mod, psb_protect_name => psb_dprod_m
|
|
|
|
|
implicit none
|
|
|
|
|
real(psb_dpk_), allocatable :: res(:,:)
|
|
|
|
|
real(psb_dpk_), intent(in) :: x(:,:), y(:,:)
|
|
|
|
|
type(psb_desc_type), intent(in) :: desc_a
|
|
|
|
|
integer(psb_ipk_), intent(out) :: info
|
|
|
|
|
logical, intent(in), optional :: trans
|
|
|
|
|
logical, intent(in), optional :: global
|
|
|
|
|
|
|
|
|
|
! locals
|
|
|
|
|
type(psb_ctxt_type) :: ctxt
|
|
|
|
|
integer(psb_ipk_) :: np, me, idx, ndm,&
|
|
|
|
|
& err_act, iix, jjx, iiy, jjy, i, j, nr, x_n, y_n, lda, ldb
|
|
|
|
|
integer(psb_lpk_) :: ix, ijx, iy, ijy, m, n
|
|
|
|
|
logical :: global_, trans_
|
|
|
|
|
character(len=20) :: name, ch_err
|
|
|
|
|
|
|
|
|
|
name='psb_dprod_multivect'
|
|
|
|
|
info=psb_success_
|
|
|
|
|
call psb_erractionsave(err_act)
|
|
|
|
|
if (psb_errstatus_fatal()) then
|
|
|
|
|
info = psb_err_internal_error_ ; goto 9999
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
ctxt=desc_a%get_context()
|
|
|
|
|
call psb_info(ctxt, me, np)
|
|
|
|
|
if (np == -ione) then
|
|
|
|
|
info = psb_err_context_error_
|
|
|
|
|
call psb_errpush(info,name)
|
|
|
|
|
goto 9999
|
|
|
|
|
endif
|
|
|
|
|
|
|
|
|
|
if (present(trans)) then
|
|
|
|
|
trans_ = trans
|
|
|
|
|
else
|
|
|
|
|
trans_ = .false.
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
if (present(global)) then
|
|
|
|
|
global_ = global
|
|
|
|
|
else
|
|
|
|
|
global_ = .false.
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
ix = ione
|
|
|
|
|
ijx = ione
|
|
|
|
|
|
|
|
|
|
m = desc_a%get_global_rows()
|
|
|
|
|
|
|
|
|
|
! check vector correctness
|
|
|
|
|
n = size(x,2)
|
|
|
|
|
call psb_chkvect(m,n,size(x,1),ix,ijx,desc_a,info,iix,jjx)
|
|
|
|
|
if(info /= psb_success_) then
|
|
|
|
|
info=psb_err_from_subroutine_
|
|
|
|
|
ch_err='psb_chkvect'
|
|
|
|
|
call psb_errpush(info,name,a_err=ch_err)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
if ((iix /= ione)) then
|
|
|
|
|
info=psb_err_ix_n1_iy_n1_unsupported_
|
|
|
|
|
call psb_errpush(info,name)
|
|
|
|
|
goto 9999
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
nr = desc_a%get_local_rows()
|
|
|
|
|
x_n = size(x,2)
|
|
|
|
|
y_n = size(y,2)
|
|
|
|
|
lda = size(x,1)
|
|
|
|
|
if (nr > 0) then
|
|
|
|
|
|
|
|
|
|
if (trans_) then
|
|
|
|
|
allocate(res(x_n,y_n))
|
|
|
|
|
res = dzero
|
|
|
|
|
ldb = size(y,1)
|
|
|
|
|
call dgemm('T','N',x_n,y_n,nr,done,x,lda,y,ldb,dzero,res,x_n)
|
|
|
|
|
else
|
|
|
|
|
allocate(res(lda,y_n))
|
|
|
|
|
res = dzero
|
|
|
|
|
ldb = x_n
|
|
|
|
|
call dgemm('N','N',nr,y_n,x_n,done,x,lda,y,ldb,dzero,res,lda)
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
! adjust dot_local because overlapped elements are computed more than once
|
|
|
|
|
if (size(desc_a%ovrlap_elem,1)>0) then
|
|
|
|
|
do j=1,x_n
|
|
|
|
|
do i=1,size(desc_a%ovrlap_elem,1)
|
|
|
|
|
idx = desc_a%ovrlap_elem(i,1)
|
|
|
|
|
ndm = desc_a%ovrlap_elem(i,2)
|
|
|
|
|
res(j,:) = res(j,:) - (real(ndm-1)/real(ndm))*(x(idx,:)*y(idx,:))
|
|
|
|
|
end do
|
|
|
|
|
end do
|
|
|
|
|
end if
|
|
|
|
|
else
|
|
|
|
|
if (trans_) then
|
|
|
|
|
allocate(res(x_n,y_n))
|
|
|
|
|
else
|
|
|
|
|
allocate(res(lda,y_n))
|
|
|
|
|
end if
|
|
|
|
|
res = dzero
|
|
|
|
|
call res%zero()
|
|
|
|
|
end if
|
|
|
|
|
|
|
|
|
|
! compute global sum
|
|
|
|
|
if (global_) call psb_sum(ctxt, res)
|
|
|
|
|
if (global_) call psb_sum(ctxt, res%v%v)
|
|
|
|
|
|
|
|
|
|
call psb_erractionrestore(err_act)
|
|
|
|
|
return
|
|
|
|
@ -434,4 +278,4 @@ function psb_dprod_m(x,y,desc_a,info,trans,global) result(res)
|
|
|
|
|
|
|
|
|
|
return
|
|
|
|
|
|
|
|
|
|
end function psb_dprod_m
|
|
|
|
|
end subroutine psb_dprod_multivect_a
|
|
|
|
|