You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
240 lines
7.0 KiB
Fortran
240 lines
7.0 KiB
Fortran
! Parallel Sparse BLAS GPU plugin
|
|
! (C) Copyright 2013
|
|
!
|
|
! Salvatore Filippone
|
|
! Alessandro Fanfarillo
|
|
!
|
|
! Redistribution and use in source and binary forms, with or without
|
|
! modification, are permitted provided that the following conditions
|
|
! are met:
|
|
! 1. Redistributions of source code must retain the above copyright
|
|
! notice, this list of conditions and the following disclaimer.
|
|
! 2. Redistributions in binary form must reproduce the above copyright
|
|
! notice, this list of conditions, and the following disclaimer in the
|
|
! documentation and/or other materials provided with the distribution.
|
|
! 3. The name of the PSBLAS group or the names of its contributors may
|
|
! not be used to endorse or promote products derived from this
|
|
! software without specific written permission.
|
|
!
|
|
! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
! ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
|
|
! TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
! PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE PSBLAS GROUP OR ITS CONTRIBUTORS
|
|
! BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
! CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
! SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
! INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
! CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
! ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
! POSSIBILITY OF SUCH DAMAGE.
|
|
!
|
|
|
|
subroutine psb_d_cuda_elg_csput_a(nz,ia,ja,val,a,imin,imax,jmin,jmax,info)
  !
  ! Insert a batch of coefficients, supplied as plain arrays, into a
  ! psb_d_cuda_elg_sparse_mat that is in the update state.
  !
  ! The actual insertion is delegated to the parent psb_d_ell_sparse_mat
  ! implementation; this wrapper only validates the arguments and keeps the
  ! host/device bookkeeping of the matrix coherent around that call.
  !
  ! Arguments:
  !   nz        (in)    number of entries to process. Negative values are an
  !                     error; zero is a successful no-op.
  !   ia, ja    (in)    index arrays, each with at least nz elements.
  !   val       (in)    coefficient array with at least nz elements.
  !   a         (inout) the matrix being updated.
  !   imin,imax,
  !   jmin,jmax (in)    forwarded unchanged to the parent csput.
  !   info      (out)   psb_success_ on success, a PSBLAS error code otherwise.
  !
  ! On any failure the error is pushed with psb_errpush and control passes to
  ! psb_error_handler(err_act).
  !
  use psb_base_mod
  use iso_c_binding
  use elldev_mod
  use psb_d_cuda_elg_mat_mod, psb_protect_name => psb_d_cuda_elg_csput_a
  implicit none

  class(psb_d_cuda_elg_sparse_mat), intent(inout) :: a
  real(psb_dpk_), intent(in)      :: val(:)
  integer(psb_ipk_), intent(in)   :: nz, ia(:), ja(:), imin,imax,jmin,jmax
  integer(psb_ipk_), intent(out)  :: info

  ! A named constant avoids the implicit SAVE that an initialised local implies.
  character(len=20), parameter :: name='d_cuda_elg_csput_a'
  integer(psb_ipk_) :: err_act, int_err(5), debug_level, debug_unit

  call psb_erractionsave(err_act)
  info = psb_success_
  ! Define the whole array: it is handed to psb_errpush in its entirety.
  int_err(:) = 0
  ! Retained from the original code; the values are not used in this routine.
  debug_unit  = psb_get_debug_unit()
  debug_level = psb_get_debug_level()

  ! --- Argument checks. int_err(1) is the position of the offending ---
  ! --- argument in the dummy argument list.                          ---
  if (nz < 0) then
    info = psb_err_iarg_neg_
    int_err(1)=1
    call psb_errpush(info,name,i_err=int_err)
    goto 9999
  end if
  if (size(ia) < nz) then
    info = psb_err_input_asize_invalid_i_
    int_err(1)=2
    call psb_errpush(info,name,i_err=int_err)
    goto 9999
  end if
  if (size(ja) < nz) then
    info = psb_err_input_asize_invalid_i_
    int_err(1)=3
    call psb_errpush(info,name,i_err=int_err)
    goto 9999
  end if
  if (size(val) < nz) then
    info = psb_err_input_asize_invalid_i_
    int_err(1)=4
    call psb_errpush(info,name,i_err=int_err)
    goto 9999
  end if

  ! Nothing to insert. The error action saved above must still be restored
  ! before leaving.
  if (nz == 0) then
    call psb_erractionrestore(err_act)
    return
  end if

  if (a%is_bld()) then
    ! Build phase should only ever be in COO
    info = psb_err_invalid_mat_state_

  else if (a%is_upd()) then
    ! The parent implementation works on the host-side data, so sync first
    ! when the matrix is flagged as device-resident (presumably this brings
    ! the host copy up to date -- see the a%sync implementation).
    if (a%is_dev()) call a%sync()
    call a%psb_d_ell_sparse_mat%csput(nz,ia,ja,val,&
         & imin,imax,jmin,jmax,info)
    if (info /= psb_success_) then
      call psb_errpush(info,name)
      goto 9999
    end if
    ! Only a successful update flags the host side via set_host.
    call a%set_host()

  else
    ! State is wrong.
    info = psb_err_invalid_mat_state_
  end if

  if (info /= psb_success_) then
    call psb_errpush(info,name)
    goto 9999
  end if

  call psb_erractionrestore(err_act)
  return

9999 call psb_error_handler(err_act)

  return

end subroutine psb_d_cuda_elg_csput_a
|
|
|
|
|
|
|
|
subroutine psb_d_cuda_elg_csput_v(nz,ia,ja,val,a,imin,imax,jmin,jmax,info)
  !
  ! Insert a batch of coefficients, supplied as PSBLAS vector objects, into a
  ! psb_d_cuda_elg_sparse_mat that is in the update state.
  !
  ! When ia and ja are psb_i_vect_cuda and val is psb_d_vect_cuda (or
  ! extensions of those types), the update is performed by
  ! csputEllDeviceDouble on the device-side handles. Otherwise the call falls
  ! back to the parent psb_d_ell_sparse_mat implementation.
  !
  ! Arguments:
  !   nz        (in)    number of entries to process. Negative values are an
  !                     error; zero is a successful no-op.
  !   ia, ja    (inout) index vectors, each with at least nz rows.
  !   val       (inout) coefficient vector with at least nz rows.
  !   a         (inout) the matrix being updated.
  !   imin,imax,
  !   jmin,jmax (in)    forwarded to the parent csput on the fallback path;
  !                     not used by the device path.
  !   info      (out)   psb_success_ on success, a PSBLAS error code otherwise.
  !                     Any non-zero status from the update step is reported
  !                     as psb_err_internal_error_.
  !
  ! On any failure the error is pushed with psb_errpush and control passes to
  ! psb_error_handler(err_act).
  !
  use psb_base_mod
  use iso_c_binding
  use elldev_mod
  use psb_d_cuda_elg_mat_mod, psb_protect_name => psb_d_cuda_elg_csput_v
  use psb_d_cuda_vect_mod
  implicit none

  class(psb_d_cuda_elg_sparse_mat), intent(inout) :: a
  class(psb_d_base_vect_type), intent(inout)  :: val
  class(psb_i_base_vect_type), intent(inout)  :: ia, ja
  integer(psb_ipk_), intent(in)               :: nz, imin,imax,jmin,jmax
  integer(psb_ipk_), intent(out)              :: info

  ! A named constant avoids the implicit SAVE that an initialised local implies.
  character(len=20), parameter :: name='d_cuda_elg_csput_v'
  integer(psb_ipk_) :: err_act, int_err(5), debug_level, debug_unit
  logical :: gpu_invoked

  call psb_erractionsave(err_act)
  info = psb_success_
  ! Define the whole array: it is handed to psb_errpush in its entirety.
  int_err(:) = 0
  ! Retained from the original code; the values are not used in this routine.
  debug_unit  = psb_get_debug_unit()
  debug_level = psb_get_debug_level()

  ! --- Argument checks. int_err(1) is the position of the offending ---
  ! --- argument in the dummy argument list.                          ---
  if (nz < 0) then
    info = psb_err_iarg_neg_
    int_err(1)=1
    call psb_errpush(info,name,i_err=int_err)
    goto 9999
  end if
  if (ia%get_nrows() < nz) then
    info = psb_err_input_asize_invalid_i_
    int_err(1)=2
    call psb_errpush(info,name,i_err=int_err)
    goto 9999
  end if
  if (ja%get_nrows() < nz) then
    info = psb_err_input_asize_invalid_i_
    int_err(1)=3
    call psb_errpush(info,name,i_err=int_err)
    goto 9999
  end if
  if (val%get_nrows() < nz) then
    info = psb_err_input_asize_invalid_i_
    int_err(1)=4
    call psb_errpush(info,name,i_err=int_err)
    goto 9999
  end if

  ! Nothing to insert. The error action saved above must still be restored
  ! before leaving.
  if (nz == 0) then
    call psb_erractionrestore(err_act)
    return
  end if

  if (a%is_bld()) then
    ! Build phase should only ever be in COO
    info = psb_err_invalid_mat_state_

  else if (a%is_upd()) then

    gpu_invoked = .false.
    ! The device path is taken only when all three inputs are CUDA vectors;
    ! any other combination leaves gpu_invoked false.
    select type (ia)
    class is (psb_i_vect_cuda)
      select type (ja)
      class is (psb_i_vect_cuda)
        select type (val)
        class is (psb_d_vect_cuda)
          ! Sync every operand flagged as host-resident before handing the
          ! device handles to the update routine.
          if (a%is_host())   call a%sync()
          if (val%is_host()) call val%sync()
          if (ia%is_host())  call ia%sync()
          if (ja%is_host())  call ja%sync()
          info = csputEllDeviceDouble(a%deviceMat,nz,&
               & ia%deviceVect,ja%deviceVect,val%deviceVect)
          ! Flag the device side only when the update reported success,
          ! matching the success-only flagging in the array-based csput_a.
          if (info == 0) call a%set_dev()
          gpu_invoked = .true.
        end select
      end select
    end select

    if (.not.gpu_invoked) then
      ! Fallback: sync if the matrix is flagged as device-resident, then let
      ! the parent implementation perform the update.
      if (a%is_dev()) call a%sync()
      call a%psb_d_ell_sparse_mat%csput(nz,ia,ja,val,&
           & imin,imax,jmin,jmax,info)
      if (info == psb_success_) call a%set_host()
    end if

    ! Both paths report failure to the caller as an internal error.
    if (info /= 0) then
      info = psb_err_internal_error_
    end if

  else
    ! State is wrong.
    info = psb_err_invalid_mat_state_
  end if

  if (info /= psb_success_) then
    call psb_errpush(info,name)
    goto 9999
  end if

  call psb_erractionrestore(err_act)
  return

9999 call psb_error_handler(err_act)

  return

end subroutine psb_d_cuda_elg_csput_v
|