You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
282 lines
10 KiB
Fortran
282 lines
10 KiB
Fortran
!
!
!                             AMG4PSBLAS version 1.0
!    Algebraic Multigrid Package
!               based on PSBLAS (Parallel Sparse BLAS version 3.7)
!
!    (C) Copyright 2021
!
!        Salvatore Filippone
!        Pasqua D'Ambra
!        Daniela di Serafino
!
!    Redistribution and use in source and binary forms, with or without
!    modification, are permitted provided that the following conditions
!    are met:
!      1. Redistributions of source code must retain the above copyright
!         notice, this list of conditions and the following disclaimer.
!      2. Redistributions in binary form must reproduce the above copyright
!         notice, this list of conditions, and the following disclaimer in the
!         documentation and/or other materials provided with the distribution.
!      3. The name of the AMG4PSBLAS group or the names of its contributors may
!         not be used to endorse or promote products derived from this
!         software without specific written permission.
!
!    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
!    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
!    TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
!    PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE AMG4PSBLAS GROUP OR ITS CONTRIBUTORS
!    BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
!    CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
!    SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
!    INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
!    CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
!    ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
!    POSSIBILITY OF SUCH DAMAGE.
!
!
!
! Subroutine: amg_s_poly_smoother_apply_vect
!
!  Applies the polynomial smoother stored in sm to the vector x and merges
!  the outcome into y with a final psb_geaxpby(alpha,tx,beta,y,...) call,
!  where tx is the vector accumulated by the polynomial variant selected
!  through sm%variant, starting from r = x and tx = ty = tz = 0.
!
! Arguments:
!  alpha, beta - real(psb_spk_), input.
!                Scalars handed to the final psb_geaxpby on tx and y.
!  sm          - class(amg_s_poly_smoother_type), input/output.
!                Reads sm%sv, sm%pa, sm%variant, sm%pdegree, sm%rho_ba and
!                sm%cf_a; for the amg_cheb_4_opt_ variant sm%poly_beta is
!                (re)built when missing or of the wrong size.
!  x           - type(psb_s_vect_type), input/output.
!                Vector the smoother is applied to ("b" in the inline notes).
!  y           - type(psb_s_vect_type), input/output.
!                Updated by the final psb_geaxpby.
!  desc_data   - type(psb_desc_type), input. Communication descriptor.
!  trans       - character, input. 'N', 'T' or 'C' (case-insensitive);
!                forwarded to the solver and to psb_spmm. Any other value
!                is reported as psb_err_iarg_invalid_i_.
!  sweeps      - integer, input. Ignored: the polynomial degree dictates
!                the number of steps.
!  work        - real(psb_spk_), dimension(:), input/output.
!                Used as scratch space when size(work) >= 4*n_col, otherwise
!                a temporary buffer of size 4*n_col is allocated and released
!                before returning (also on the error path).
!  wv          - type(psb_s_vect_type), dimension(:), input/output.
!                At least 4 work vectors; wv(1:4) serve as tx, ty, tz, r and
!                wv(5:) is passed on to the solver.
!  info        - integer, output. psb_success_ or an error code.
!  init, initu - optional. Accepted for interface compatibility; this
!                routine does not use them.
!
subroutine amg_s_poly_smoother_apply_vect(alpha,sm,x,beta,y,desc_data,trans,&
     & sweeps,work,wv,info,init,initu)

  use psb_base_mod
  use amg_s_diag_solver
  use psb_base_krylov_conv_mod, only : log_conv
  use amg_s_poly_smoother, amg_protect_name => amg_s_poly_smoother_apply_vect
  implicit none
  type(psb_desc_type), intent(in)                 :: desc_data
  class(amg_s_poly_smoother_type), intent(inout)  :: sm
  type(psb_s_vect_type),intent(inout)             :: x
  type(psb_s_vect_type),intent(inout)             :: y
  real(psb_spk_),intent(in)                       :: alpha,beta
  character(len=1),intent(in)                     :: trans
  integer(psb_ipk_), intent(in)                   :: sweeps ! this is ignored here, the polynomial degree dictates the value
  real(psb_spk_),target, intent(inout)            :: work(:)
  type(psb_s_vect_type),intent(inout)             :: wv(:)
  integer(psb_ipk_), intent(out)                  :: info
  character, intent(in), optional                 :: init
  type(psb_s_vect_type),intent(inout), optional   :: initu
  ! Timers
  logical, parameter :: do_timings=.true.
  integer(psb_ipk_), save :: poly_1=-1, poly_2=-1, poly_3=-1
  integer(psb_ipk_), save :: poly_mv=-1, poly_sv=-1, poly_vect=-1
  !
  integer(psb_ipk_)        :: n_col
  real(psb_spk_), pointer  :: aux(:)
  ! .true. only while aux points to memory allocated by this routine
  logical                  :: aux_owned
  type(psb_ctxt_type)      :: ctxt
  integer(psb_ipk_)        :: np, me, i, err_act, dealloc_info
  character                :: trans_
  ! Routine tag used in the error stack (single-precision variant)
  character(len=23)        :: name='s_poly_smoother_apply_v'

  call psb_erractionsave(err_act)

  info      = psb_success_
  aux_owned = .false.
  ctxt      = desc_data%get_context()
  call psb_info(ctxt,me,np)

  trans_ = psb_toupper(trans)
  select case(trans_)
  case('N')
  case('T','C')
  case default
    ! info is intent(out): it must carry the error code back to the caller
    info = psb_err_iarg_invalid_i_
    call psb_errpush(info,name)
    goto 9999
  end select

  if (.not.allocated(sm%sv)) then
    info = 1121
    call psb_errpush(info,name)
    goto 9999
  end if

  if ((do_timings).and.(poly_1==-1))       &
       & poly_1 = psb_get_timer_idx("POLY: Chebychev4")
  if ((do_timings).and.(poly_2==-1))       &
       & poly_2 = psb_get_timer_idx("POLY: OptChebychev4")
  if ((do_timings).and.(poly_3==-1))       &
       & poly_3 = psb_get_timer_idx("POLY: OptChebychev1")
  if ((do_timings).and.(poly_mv==-1))       &
       & poly_mv = psb_get_timer_idx("POLY: spMV")
  if ((do_timings).and.(poly_vect==-1))       &
       & poly_vect = psb_get_timer_idx("POLY: Vectors")
  if ((do_timings).and.(poly_sv==-1))       &
       & poly_sv = psb_get_timer_idx("POLY: solver")

  n_col = desc_data%get_local_cols()

  ! Reuse the caller's workspace when it is large enough, otherwise
  ! allocate a private buffer (released on every exit path).
  if (4*n_col <= size(work)) then
    aux => work(:)
  else
    allocate(aux(4*n_col),stat=info)
    if (info /= psb_success_) then
      info=psb_err_alloc_request_
      call psb_errpush(info,name,&
           & i_err=(/4*n_col,izero,izero,izero,izero/),&
           & a_err='real(psb_spk_)')
      goto 9999
    end if
    aux_owned = .true.
  endif

  if (size(wv) < 4) then
    info = psb_err_internal_error_
    call psb_errpush(info,name,&
         & a_err='invalid wv size in smoother_apply')
    goto 9999
  end if

  associate(tx => wv(1), ty => wv(2), tz => wv(3), r => wv(4))

    ! r = x ; tx = ty = tz = 0
    call psb_geaxpby(sone,x,szero,r,desc_data,info)
    call tx%zero()
    call ty%zero()
    call tz%zero()

    select case(sm%variant)
    case(amg_cheb_4_)
      if (do_timings) call psb_tic(poly_1)
      block
        real(psb_spk_) :: cz, cr
        ! b == x
        ! x == tx
        !
        do i=1, sm%pdegree-1
          ! B r_{k-1}
          if (do_timings) call psb_tic(poly_sv)
          call sm%sv%apply(sone,r,szero,ty,desc_data,trans_,aux,wv(5:),info,init='Z') ! ty = M^{-1} r
          if (do_timings) call psb_toc(poly_sv)
          cz = (2*i*sone-3)/(2*i*sone+sone)
          cr = (8*i*sone-4)/((2*i*sone+sone)*sm%rho_ba)
          if (do_timings) call psb_tic(poly_vect)
          call psb_upd_xyz(cr,cz,sone,sone,ty,tz,tx,desc_data,info) ! zk = cz * zk-1 + cr * rk-1
          if (do_timings) call psb_toc(poly_vect)
          if (do_timings) call psb_tic(poly_mv)
          call psb_spmm(-sone,sm%pa,tz,sone,r,desc_data,info,work=aux,trans=trans_)
          if (do_timings) call psb_toc(poly_mv)
        end do
        ! Last step: same update with i = pdegree, no residual refresh needed
        if (do_timings) call psb_tic(poly_sv)
        call sm%sv%apply(sone,r,szero,ty,desc_data,trans_,aux,wv(5:),info,init='Z') ! ty = M^{-1} r
        if (do_timings) call psb_toc(poly_sv)
        cz = (2*sm%pdegree*sone-3)/(2*sm%pdegree*sone+sone)
        cr = (8*sm%pdegree*sone-4)/((2*sm%pdegree*sone+sone)*sm%rho_ba)
        if (do_timings) call psb_tic(poly_vect)
        call psb_upd_xyz(cr,cz,sone,sone,ty,tz,tx,desc_data,info)
        if (do_timings) call psb_toc(poly_vect)
      end block
      if (do_timings) call psb_toc(poly_1)

    case(amg_cheb_4_opt_)
      if (do_timings) call psb_tic(poly_2)
      block
        real(psb_spk_) :: cz, cr
        ! b == x
        ! x == tx
        !
        ! Make sure sm%poly_beta holds exactly pdegree coefficients
        if (allocated(sm%poly_beta)) then
          if (size(sm%poly_beta) /= sm%pdegree) deallocate(sm%poly_beta)
        end if
        if (.not.allocated(sm%poly_beta)) then
          call psb_realloc(sm%pdegree,sm%poly_beta,info)
          if (info /= psb_success_) then
            ! Do not touch sm%poly_beta if the (re)allocation failed
            info=psb_err_alloc_request_
            call psb_errpush(info,name,&
                 & i_err=(/sm%pdegree,izero,izero,izero,izero/),&
                 & a_err='real(psb_spk_)')
            goto 9999
          end if
          sm%poly_beta(1:sm%pdegree) = amg_d_poly_beta_mat(1:sm%pdegree,sm%pdegree)
        end if

        do i=1, sm%pdegree-1
          ! B r_{k-1}
          if (do_timings) call psb_tic(poly_sv)
          call sm%sv%apply(sone,r,szero,ty,desc_data,trans_,aux,wv(5:),info,init='Z')
          if (do_timings) call psb_toc(poly_sv)
          cz = (2*i*sone-3)/(2*i*sone+sone)
          cr = (8*i*sone-4)/((2*i*sone+sone)*sm%rho_ba)
          if (do_timings) call psb_tic(poly_vect)
          call psb_upd_xyz(cr,cz,sm%poly_beta(i),sone,ty,tz,tx,desc_data,info)
          if (do_timings) call psb_toc(poly_vect)
          if (do_timings) call psb_tic(poly_mv)
          call psb_spmm(-sone,sm%pa,tz,sone,r,desc_data,info,work=aux,trans=trans_)
          if (do_timings) call psb_toc(poly_mv)
        end do
        ! Last step; timed like every other solver application
        if (do_timings) call psb_tic(poly_sv)
        call sm%sv%apply(sone,r,szero,ty,desc_data,trans_,aux,wv(5:),info,init='Z')
        if (do_timings) call psb_toc(poly_sv)
        cz = (2*sm%pdegree*sone-3)/(2*sm%pdegree*sone+sone)
        cr = (8*sm%pdegree*sone-4)/((2*sm%pdegree*sone+sone)*sm%rho_ba)
        if (do_timings) call psb_tic(poly_vect)
        call psb_upd_xyz(cr,cz,sm%poly_beta(sm%pdegree),sone,ty,tz,tx,desc_data,info)
        if (do_timings) call psb_toc(poly_vect)
      end block
      if (do_timings) call psb_toc(poly_2)

    case(amg_cheb_1_opt_)
      if (do_timings) call psb_tic(poly_3)
      block
        real(psb_spk_) :: sigma, theta, delta, rho_old, rho
        ! b == x
        ! x == tx
        !

        theta   = (sone+sm%cf_a)/2
        delta   = (sone-sm%cf_a)/2
        sigma   = theta/delta
        rho_old = sone/sigma
        if (do_timings) call psb_tic(poly_sv)
        call sm%sv%apply(sone,r,szero,ty,desc_data,trans_,aux,wv(5:),info,init='Z')
        if (do_timings) call psb_toc(poly_sv)
        call psb_geaxpby((sone/sm%rho_ba),ty,szero,r,desc_data,info)
        if (do_timings) call psb_tic(poly_vect)
        call psb_upd_xyz((sone/theta),szero,sone,sone,r,tz,tx,desc_data,info)
        if (do_timings) call psb_toc(poly_vect)

        ! tz == d
        do i=1, sm%pdegree-1
          !
          !
          ! r_{k-1} = r_k - (1/rho(BA)) B A d_k
          if (do_timings) call psb_tic(poly_mv)
          call psb_spmm(sone,sm%pa,tz,szero,ty,desc_data,info,work=aux,trans=trans_)
          if (do_timings) call psb_toc(poly_mv)
          if (do_timings) call psb_tic(poly_sv)
          call sm%sv%apply(-(sone/sm%rho_ba),ty,sone,r,desc_data,trans_,&
               & aux,wv(5:),info,init='Z')
          if (do_timings) call psb_toc(poly_sv)
          !
          ! d_{k+1} = (rho rho_old) d_k + 2(rho/delta) r_{k+1}
          rho = sone/(2*sigma - rho_old)
          if (do_timings) call psb_tic(poly_vect)
          call psb_upd_xyz((2*rho/delta),(rho*rho_old),sone,sone,r,tz,tx,desc_data,info)
          if (do_timings) call psb_toc(poly_vect)
          rho_old = rho
        end do
      end block
      if (do_timings) call psb_toc(poly_3)

    case default
      info=psb_err_internal_error_
      call psb_errpush(info,name,&
           & a_err='wrong polynomial variant')
      goto 9999
    end select

    ! Combine the accumulated vector tx into the caller's y
    if (info == psb_success_) call psb_geaxpby(alpha,tx,beta,y,desc_data,info)

    if (info /= psb_success_) then
      info=psb_err_internal_error_
      call psb_errpush(info,name,&
           & a_err='polynomial smoother')
      goto 9999
    end if
  end associate

  if (aux_owned) then
    deallocate(aux)
    aux_owned = .false.
  endif

  call psb_erractionrestore(err_act)
  return

9999 continue
  ! Release the private buffer on the error path too; stat= keeps a
  ! deallocation problem from masking the error already on the stack.
  if (aux_owned) deallocate(aux,stat=dealloc_info)
  call psb_error_handler(err_act)

  return

end subroutine amg_s_poly_smoother_apply_vect
|