!!$
!!$ Parallel Sparse BLAS version 3.4
!!$ (C) Copyright 2006, 2010, 2015
!!$ Salvatore Filippone University of Rome Tor Vergata
!!$ Alfredo Buttari CNRS-IRIT, Toulouse
!!$
!!$ Redistribution and use in source and binary forms, with or without
!!$ modification, are permitted provided that the following conditions
!!$ are met:
!!$ 1. Redistributions of source code must retain the above copyright
!!$ notice, this list of conditions and the following disclaimer.
!!$ 2. Redistributions in binary form must reproduce the above copyright
!!$ notice, this list of conditions, and the following disclaimer in the
!!$ documentation and/or other materials provided with the distribution.
!!$ 3. The name of the PSBLAS group or the names of its contributors may
!!$ not be used to endorse or promote products derived from this
!!$ software without specific written permission.
!!$
!!$ THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
!!$ ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
!!$ TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
!!$ PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE PSBLAS GROUP OR ITS CONTRIBUTORS
!!$ BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
!!$ CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
!!$ SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
!!$ INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
!!$ CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
!!$ ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
!!$ POSSIBILITY OF SUCH DAMAGE.
!!$
!!$
!
! Implementation submodule for the complex double precision CSR storage
! format: update/search, reinit, trim, print, format conversions to and
! from COO and generic formats, and the CSR sparse-sparse product.
!
! NOTE(review): this copy of the file reached review with its line structure
! collapsed and with two spans of text missing. Line structure has been
! restored; the missing spans are marked with NOTE(review) comments below.
!
submodule (psb_z_csr_mat_mod) psb_z_csr_mat_impl_mod
contains

  ! == ===================================
  !
  ! Computational routines
  !
  ! == ===================================

  !
  ! psb_z_csr_csmv
  !
  ! Only the argument checking prologue of this routine is visible: it saves
  ! the error action, synchronises `a` if it lives on a device, defaults
  ! `trans` to 'N', rejects a matrix that is not assembled, and picks the
  ! (m,n) extents according to whether a (conjugate) transpose is requested.
  ! Presumably it goes on to compute a sparse matrix-vector product; the
  ! body is not available in this copy -- confirm against the pristine file.
  !
  subroutine psb_z_csr_csmv(alpha,a,x,beta,y,info,trans)
    use psb_error_mod
    use psb_string_mod
    implicit none
    class(psb_z_csr_sparse_mat), intent(in) :: a
    complex(psb_dpk_), intent(in)           :: alpha, beta, x(:)
    complex(psb_dpk_), intent(inout)        :: y(:)
    integer(psb_ipk_), intent(out)          :: info
    character, optional, intent(in)         :: trans

    character          :: trans_
    integer(psb_ipk_)  :: i,j,k,m,n, nnz, ir, jc
    complex(psb_dpk_)  :: acc
    logical            :: tra, ctra
    integer(psb_ipk_)  :: err_act
    integer(psb_ipk_)  :: ierr(5)
    character(len=20)  :: name='z_csr_csmv'
    logical, parameter :: debug=.false.

    call psb_erractionsave(err_act)
    info = psb_success_
    if (a%is_dev()) call a%sync()

    if (present(trans)) then
      trans_ = trans
    else
      trans_ = 'N'
    end if

    if (.not.a%is_asb()) then
      info = psb_err_invalid_mat_state_
      call psb_errpush(info,name)
      goto 9999
    endif

    tra  = (psb_toupper(trans_) == 'T')
    ctra = (psb_toupper(trans_) == 'C')

    ! For op(A) = A^T or A^H the roles of rows and columns are swapped.
    if (tra.or.ctra) then
      m = a%get_ncols()
      n = a%get_nrows()
    else
      n = a%get_ncols()
      m = a%get_nrows()
    end if

    if (size(x,1)
    ! ======================================================================
    ! NOTE(review): SOURCE TEXT MISSING HERE.
    ! Everything between `size(x,1)` above and `0) then` below was lost
    ! before this file reached review (it looks like the text between a
    ! '<' and a later '>' was stripped). That span held the remainder of
    ! psb_z_csr_csmv, whatever routines followed it, and the head of
    ! psb_z_csr_csput_a. The surviving tokens on either side are kept
    ! verbatim; nothing has been invented. This region cannot compile until
    ! the missing text is restored from a pristine copy of the file.
    ! ======================================================================
    0) then
      if (debug_level >= psb_debug_serial_) &
           & write(debug_unit,*) trim(name),&
           & ': Discarded entries not belonging to us.'
      info = psb_success_
    end if
    call a%set_host()
  else
    ! State is wrong.
    info = psb_err_invalid_mat_state_
  end if

  if (info /= psb_success_) then
    call psb_errpush(info,name)
    goto 9999
  end if

  call psb_erractionrestore(err_act)
  return

9999 call psb_error_handler(err_act)
  return

  contains

    !
    ! psb_z_csr_srch_upd
    !
    ! Update existing coefficients of an already-built CSR matrix.
    ! For each of the nz input triples (ia(i),ja(i),val(i)):
    !   - when gtl is present, both indices must lie in 1..size(gtl) and are
    !     then mapped through gtl;
    !   - the (mapped) row must lie in 1..nrows;
    !   - the (mapped) column is looked up with psb_ibsrch among the column
    !     indices stored for that row; a positive result is used as the
    !     position of the entry within the row.
    ! The matching value is overwritten (psb_dupl_ovwrt_/psb_dupl_err_) or
    ! accumulated (psb_dupl_add_).
    !
    ! info on exit:
    !    0  all entries applied
    !    1  at least one index was outside 1..size(gtl) (gtl variant only)
    !    2  at least one row was outside 1..nrows
    !    3  at least one column was not found in its row
    !       (the largest of 1/2/3 encountered is returned)
    !   -3  unknown duplicate-handling mode
    !   -4  the matrix is not sorted
    !
    ! imin, imax, jmin and jmax are accepted but not referenced here.
    !
    subroutine psb_z_csr_srch_upd(nz,ia,ja,val,a,&
         & imin,imax,jmin,jmax,info,gtl)

      use psb_const_mod
      use psb_realloc_mod
      use psb_string_mod
      use psb_sort_mod
      implicit none

      class(psb_z_csr_sparse_mat), intent(inout) :: a
      integer(psb_ipk_), intent(in)              :: nz, imin,imax,jmin,jmax
      integer(psb_ipk_), intent(in)              :: ia(:),ja(:)
      complex(psb_dpk_), intent(in)              :: val(:)
      integer(psb_ipk_), intent(out)             :: info
      integer(psb_ipk_), intent(in), optional    :: gtl(:)

      integer(psb_ipk_) :: i,ir,ic, ilr, ilc, ip, &
           & i1,i2,nr,nc,nnz,dupl,ng
      integer(psb_ipk_) :: debug_level, debug_unit
      character(len=20) :: name='z_csr_srch_upd'

      info        = psb_success_
      debug_unit  = psb_get_debug_unit()
      debug_level = psb_get_debug_level()

      dupl = a%get_dupl()

      ! The per-row search below is only applied to sorted matrices.
      if (.not.a%is_sorted()) then
        info = -4
        return
      end if

      ilr = -1
      ilc = -1
      nnz = a%get_nzeros()
      nr  = a%get_nrows()
      nc  = a%get_ncols()

      if (present(gtl)) then
        ng = size(gtl)

        select case(dupl)
        case(psb_dupl_ovwrt_,psb_dupl_err_)
          ! Overwrite.
          ! Cannot test for error, should have been caught earlier.
          ilr = -1
          ilc = -1
          do i=1, nz
            ir = ia(i)
            ic = ja(i)
            if ((ir >=1).and.(ir<=ng).and.(ic>=1).and.(ic<=ng)) then
              ir = gtl(ir)
              ic = gtl(ic)
              if ((ir > 0).and.(ir <= nr)) then
                i1 = a%irp(ir)
                i2 = a%irp(ir+1)
                ! nc is reused here as the number of entries in row ir.
                nc=i2-i1
                ip = psb_ibsrch(ic,nc,a%ja(i1:i2-1))
                if (ip>0) then
                  a%val(i1+ip-1) = val(i)
                else
                  info = max(info,3)
                end if
              else
                info = max(info,2)
              end if
            else
              info = max(info,1)
            end if
          end do

        case(psb_dupl_add_)
          ! Add
          ilr = -1
          ilc = -1
          do i=1, nz
            ir = ia(i)
            ic = ja(i)
            if ((ir >=1).and.(ir<=ng).and.(ic>=1).and.(ic<=ng)) then
              ir = gtl(ir)
              ic = gtl(ic)
              if ((ir > 0).and.(ir <= nr)) then
                i1 = a%irp(ir)
                i2 = a%irp(ir+1)
                nc = i2-i1
                ip = psb_ibsrch(ic,nc,a%ja(i1:i2-1))
                if (ip>0) then
                  a%val(i1+ip-1) = a%val(i1+ip-1) + val(i)
                else
                  info = max(info,3)
                end if
              else
                info = max(info,2)
              end if
            else
              info = max(info,1)
            end if
          end do

        case default
          info = -3
          if (debug_level >= psb_debug_serial_) &
               & write(debug_unit,*) trim(name),&
               & ': Duplicate handling: ',dupl
        end select

      else

        select case(dupl)
        case(psb_dupl_ovwrt_,psb_dupl_err_)
          ! Overwrite.
          ! Cannot test for error, should have been caught earlier.
          ilr = -1
          ilc = -1
          do i=1, nz
            ir = ia(i)
            ic = ja(i)
            if ((ir > 0).and.(ir <= nr)) then
              i1 = a%irp(ir)
              i2 = a%irp(ir+1)
              nc=i2-i1
              ip = psb_ibsrch(ic,nc,a%ja(i1:i2-1))
              if (ip>0) then
                a%val(i1+ip-1) = val(i)
              else
                info = max(info,3)
              end if
            else
              info = max(info,2)
            end if
          end do

        case(psb_dupl_add_)
          ! Add
          ilr = -1
          ilc = -1
          do i=1, nz
            ir = ia(i)
            ic = ja(i)
            if ((ir > 0).and.(ir <= nr)) then
              i1 = a%irp(ir)
              i2 = a%irp(ir+1)
              nc = i2-i1
              ip = psb_ibsrch(ic,nc,a%ja(i1:i2-1))
              if (ip>0) then
                a%val(i1+ip-1) = a%val(i1+ip-1) + val(i)
              else
                info = max(info,3)
              end if
            else
              info = max(info,2)
            end if
          end do

        case default
          info = -3
          if (debug_level >= psb_debug_serial_) &
               & write(debug_unit,*) trim(name),&
               & ': Duplicate handling: ',dupl
        end select

      end if

    end subroutine psb_z_csr_srch_upd

  end subroutine psb_z_csr_csput_a


  !
  ! psb_z_csr_reinit
  !
  ! Put an assembled matrix back into the update state, keeping its
  ! sparsity pattern.
  !   clear  (optional, default .true.): when true the stored values are
  !          set to zzero before the state change.
  ! A matrix already in the build or update state is left untouched.
  ! Any other state raises psb_err_invalid_mat_state_ through the error
  ! handler.
  !
  subroutine psb_z_csr_reinit(a,clear)
    use psb_error_mod
    implicit none

    class(psb_z_csr_sparse_mat), intent(inout) :: a
    logical, intent(in), optional :: clear

    integer(psb_ipk_)  :: err_act, info
    integer(psb_ipk_)  :: ierr(5)
    character(len=20)  :: name='reinit'
    logical            :: clear_
    logical, parameter :: debug=.false.

    call psb_erractionsave(err_act)
    info = psb_success_
    if (a%is_dev()) call a%sync()

    if (present(clear)) then
      clear_ = clear
    else
      clear_ = .true.
    end if

    if (a%is_bld() .or. a%is_upd()) then
      ! Nothing to do. Fall through to the common exit so that the error
      ! action saved above is restored (the original returned from here
      ! and skipped psb_erractionrestore).
      continue
    else if (a%is_asb()) then
      if (clear_) a%val(:) = zzero
      call a%set_upd()
      call a%set_host()
    else
      info = psb_err_invalid_mat_state_
      call psb_errpush(info,name)
      goto 9999
    end if

    call psb_erractionrestore(err_act)
    return

9999 call psb_error_handler(err_act)
    return

  end subroutine psb_z_csr_reinit


  !
  ! psb_z_csr_trim
  !
  ! Resize the storage arrays to what the matrix reports as its size:
  ! irp to nrows+1, ja and val to the number of nonzeros. A failure in any
  ! psb_realloc call is routed to the error handler.
  !
  subroutine psb_z_csr_trim(a)
    use psb_realloc_mod
    use psb_error_mod
    implicit none
    class(psb_z_csr_sparse_mat), intent(inout) :: a

    integer(psb_ipk_)  :: err_act, info, nz, m
    integer(psb_ipk_)  :: ierr(5)
    character(len=20)  :: name='trim'
    logical, parameter :: debug=.false.

    call psb_erractionsave(err_act)
    info = psb_success_

    m  = a%get_nrows()
    nz = a%get_nzeros()

    ! Each step runs only if the previous one succeeded.
    if (info == psb_success_) call psb_realloc(m+1,a%irp,info)
    if (info == psb_success_) call psb_realloc(nz,a%ja,info)
    if (info == psb_success_) call psb_realloc(nz,a%val,info)

    if (info /= psb_success_) goto 9999

    call psb_erractionrestore(err_act)
    return

9999 call psb_error_handler(err_act)
    return

  end subroutine psb_z_csr_trim


  !
  ! psb_z_csr_print
  !
  ! Write the matrix to unit iout as one "row col re im" record per stored
  ! entry, preceded by a line with nrows, ncols, nnz.
  !   head  when present, a MatrixMarket-style comment header is written
  !         first, with head as its second line.
  !   iv    when present, both row and column indices are mapped through iv.
  !   ivr   when present (and iv absent), row indices are mapped through ivr.
  !   ivc   when present (and iv absent), column indices are mapped through ivc.
  ! The integer field width is derived from max(nrows,ncols,1).
  !
  subroutine psb_z_csr_print(iout,a,iv,head,ivr,ivc)
    use psb_string_mod
    implicit none

    integer(psb_ipk_), intent(in)           :: iout
    class(psb_z_csr_sparse_mat), intent(in) :: a
    integer(psb_ipk_), intent(in), optional :: iv(:)
    character(len=*), optional              :: head
    integer(psb_ipk_), intent(in), optional :: ivr(:), ivc(:)

    integer(psb_ipk_)  :: err_act
    integer(psb_ipk_)  :: ierr(5)
    character(len=20)  :: name='z_csr_print'
    logical, parameter :: debug=.false.
    character(len=*), parameter :: datatype='complex'
    character(len=80)  :: frmtv
    integer(psb_ipk_)  :: irs,ics,i,j, nmx, ni, nr, nc, nz

    if (present(head)) then
      write(iout,'(a)') '%%MatrixMarket matrix coordinate complex general'
      write(iout,'(a,a)') '% ',head
      write(iout,'(a)') '%'
      write(iout,'(a,a)') '% COO'
    endif

    if (a%is_dev()) call a%sync()

    nr  = a%get_nrows()
    nc  = a%get_ncols()
    nz  = a%get_nzeros()

    ! Number of decimal digits needed for the largest index.
    nmx = max(nr,nc,1)
    ni  = floor(log10(1.0*nmx)) + 1

    ! Build the record format at run time so that index columns are
    ! exactly ni characters wide.
    if (datatype=='real') then
      write(frmtv,'(a,i3.3,a,i3.3,a)') '(2(i',ni,',1x),es26.18,1x,2(i',ni,',1x))'
    else
      write(frmtv,'(a,i3.3,a,i3.3,a)') '(2(i',ni,',1x),2(es26.18,1x),2(i',ni,',1x))'
    end if

    write(iout,*) nr, nc, nz

    if(present(iv)) then
      do i=1, nr
        do j=a%irp(i),a%irp(i+1)-1
          write(iout,frmtv) iv(i),iv(a%ja(j)),a%val(j)
        end do
      enddo
    else
      if (present(ivr).and..not.present(ivc)) then
        do i=1, nr
          do j=a%irp(i),a%irp(i+1)-1
            write(iout,frmtv) ivr(i),(a%ja(j)),a%val(j)
          end do
        enddo
      else if (present(ivr).and.present(ivc)) then
        do i=1, nr
          do j=a%irp(i),a%irp(i+1)-1
            write(iout,frmtv) ivr(i),ivc(a%ja(j)),a%val(j)
          end do
        enddo
      else if (.not.present(ivr).and.present(ivc)) then
        do i=1, nr
          do j=a%irp(i),a%irp(i+1)-1
            write(iout,frmtv) (i),ivc(a%ja(j)),a%val(j)
          end do
        enddo
      else if (.not.present(ivr).and..not.present(ivc)) then
        do i=1, nr
          do j=a%irp(i),a%irp(i+1)-1
            write(iout,frmtv) (i),(a%ja(j)),a%val(j)
          end do
        enddo
      endif
    endif

  end subroutine psb_z_csr_print


  !
  ! psb_z_cp_csr_from_coo
  !
  ! Build CSR matrix a as a copy of COO matrix b (b is not modified).
  ! If b is not ordered by rows, a temporary COO copy is made first and its
  ! arrays are moved into a; otherwise the arrays of b are copied directly.
  ! The row-pointer array is then built by counting entries per row and
  ! turning the counts into 1-based start offsets.
  ! info is psb_success_ on success, otherwise the code returned by the
  ! failing copy/reallocation.
  !
  subroutine psb_z_cp_csr_from_coo(a,b,info)
    use psb_const_mod
    use psb_realloc_mod
    use psb_z_base_mat_mod
    implicit none

    class(psb_z_csr_sparse_mat), intent(inout) :: a
    class(psb_z_coo_sparse_mat), intent(in)    :: b
    integer(psb_ipk_), intent(out)             :: info

    type(psb_z_coo_sparse_mat)     :: tmp
    integer(psb_ipk_), allocatable :: itemp(:)
    !locals
    logical                        :: rwshr_
    integer(psb_ipk_)              :: nza, nr, nc, i,j,k,ip,irw, err_act, ncl
    integer(psb_ipk_), Parameter   :: maxtry=8
    integer(psb_ipk_)              :: debug_level, debug_unit
    character(len=20)              :: name='z_cp_csr_from_coo'

    info = psb_success_
    debug_unit  = psb_get_debug_unit()
    debug_level = psb_get_debug_level()

    if (.not.b%is_by_rows()) then
      ! This is to have fix_coo called behind the scenes
      call tmp%cp_from_coo(b,info)
      if (info /= psb_success_) return

      nr  = tmp%get_nrows()
      nc  = tmp%get_ncols()
      nza = tmp%get_nzeros()

      a%psb_z_base_sparse_mat = tmp%psb_z_base_sparse_mat

      ! Dirty trick: call move_alloc to have the new data allocated just once.
      call move_alloc(tmp%ia,itemp)
      call move_alloc(tmp%ja,a%ja)
      call move_alloc(tmp%val,a%val)
      call psb_realloc(max(nr+1,nc+1),a%irp,info)
      call tmp%free()

    else

      if (info /= psb_success_) return
      if (b%is_dev()) call b%sync()

      nr  = b%get_nrows()
      nc  = b%get_ncols()
      nza = b%get_nzeros()

      a%psb_z_base_sparse_mat = b%psb_z_base_sparse_mat

      ! b is intent(in), so its arrays are copied rather than moved.
      call psb_safe_ab_cpy(b%ia,itemp,info)
      if (info == psb_success_) call psb_safe_ab_cpy(b%ja,a%ja,info)
      if (info == psb_success_) call psb_safe_ab_cpy(b%val,a%val,info)
      if (info == psb_success_) call psb_realloc(max(nr+1,nc+1),a%irp,info)

    endif

    ! Do not touch a%irp / itemp if any allocation or copy above failed
    ! (this check was missing in the original).
    if (info /= psb_success_) return

    ! Pass 1: a%irp(i) = number of entries in row i.
    a%irp(:) = 0
    do k=1,nza
      i = itemp(k)
      a%irp(i) = a%irp(i) + 1
    end do

    ! Pass 2: turn counts into 1-based row start positions.
    ip = 1
    do i=1,nr
      ncl = a%irp(i)
      a%irp(i) = ip
      ip = ip + ncl
    end do
    a%irp(nr+1) = ip

    call a%set_host()

  end subroutine psb_z_cp_csr_from_coo


  !
  ! psb_z_cp_csr_to_coo
  !
  ! Fill COO matrix b with a copy of CSR matrix a: row indices are expanded
  ! from the row pointers, column indices and values are copied entry by
  ! entry. b is marked as row-major sorted, assembled, and host-resident.
  !
  subroutine psb_z_cp_csr_to_coo(a,b,info)
    use psb_const_mod
    use psb_z_base_mat_mod
    implicit none

    class(psb_z_csr_sparse_mat), intent(in)    :: a
    class(psb_z_coo_sparse_mat), intent(inout) :: b
    integer(psb_ipk_), intent(out)             :: info

    integer(psb_ipk_), allocatable :: itemp(:)
    !locals
    logical                        :: rwshr_
    integer(psb_ipk_)              :: nza, nr, nc,i,j,irw, err_act
    integer(psb_ipk_), Parameter   :: maxtry=8
    integer(psb_ipk_)              :: debug_level, debug_unit
    character(len=20)              :: name

    info = psb_success_
    if (a%is_dev()) call a%sync()

    nr  = a%get_nrows()
    nc  = a%get_ncols()
    nza = a%get_nzeros()

    call b%allocate(nr,nc,nza)
    b%psb_z_base_sparse_mat = a%psb_z_base_sparse_mat

    do i=1, nr
      do j=a%irp(i),a%irp(i+1)-1
        b%ia(j)  = i
        b%ja(j)  = a%ja(j)
        b%val(j) = a%val(j)
      end do
    end do

    call b%set_nzeros(a%get_nzeros())
    call b%set_sort_status(psb_row_major_)
    call b%set_asb()
    call b%set_host()

  end subroutine psb_z_cp_csr_to_coo


  !
  ! psb_z_mv_csr_to_coo
  !
  ! Move CSR matrix a into COO matrix b. The ja and val arrays are
  ! transferred with move_alloc; b%ia is (re)allocated and filled from the
  ! row pointers of a. a is freed once b%ia has been built. If the
  ! reallocation of b%ia fails, the routine returns with info set and a
  ! has already lost its ja/val arrays.
  !
  subroutine psb_z_mv_csr_to_coo(a,b,info)
    use psb_const_mod
    use psb_realloc_mod
    use psb_z_base_mat_mod
    implicit none

    class(psb_z_csr_sparse_mat), intent(inout) :: a
    class(psb_z_coo_sparse_mat), intent(inout) :: b
    integer(psb_ipk_), intent(out)             :: info

    integer(psb_ipk_), allocatable :: itemp(:)
    !locals
    logical                        :: rwshr_
    integer(psb_ipk_)              :: nza, nr, nc,i,j,k,irw, err_act
    integer(psb_ipk_), Parameter   :: maxtry=8
    integer(psb_ipk_)              :: debug_level, debug_unit
    character(len=20)              :: name

    info = psb_success_
    if (a%is_dev()) call a%sync()

    nr  = a%get_nrows()
    nc  = a%get_ncols()
    nza = a%get_nzeros()

    b%psb_z_base_sparse_mat = a%psb_z_base_sparse_mat
    call b%set_nzeros(a%get_nzeros())
    call move_alloc(a%ja,b%ja)
    call move_alloc(a%val,b%val)
    call psb_realloc(nza,b%ia,info)
    if (info /= psb_success_) return

    ! a%irp is still owned by a at this point; expand it into row indices.
    do i=1, nr
      do j=a%irp(i),a%irp(i+1)-1
        b%ia(j) = i
      end do
    end do

    call a%free()
    call b%set_sort_status(psb_row_major_)
    call b%set_asb()
    call b%set_host()

  end subroutine psb_z_mv_csr_to_coo


  !
  ! psb_z_mv_csr_from_coo
  !
  ! Move COO matrix b into CSR matrix a. b is fixed first if it is not
  ! ordered by rows; its ja/val arrays are transferred with move_alloc, its
  ! ia array is consumed to build the row pointers of a, and b is freed.
  ! info is psb_success_ on success, otherwise the code from b%fix or
  ! psb_realloc.
  !
  subroutine psb_z_mv_csr_from_coo(a,b,info)
    use psb_const_mod
    use psb_realloc_mod
    use psb_error_mod
    use psb_z_base_mat_mod
    implicit none

    class(psb_z_csr_sparse_mat), intent(inout) :: a
    class(psb_z_coo_sparse_mat), intent(inout) :: b
    integer(psb_ipk_), intent(out)             :: info

    integer(psb_ipk_), allocatable :: itemp(:)
    !locals
    logical                        :: rwshr_
    integer(psb_ipk_)              :: nza, nr, nc, i,j,k, ip,irw, err_act, ncl
    integer(psb_ipk_), Parameter   :: maxtry=8
    integer(psb_ipk_)              :: debug_level, debug_unit
    character(len=20)              :: name='mv_from_coo'

    info = psb_success_
    debug_unit  = psb_get_debug_unit()
    debug_level = psb_get_debug_level()

    if (b%is_dev()) call b%sync()

    if (.not.b%is_by_rows()) call b%fix(info)
    if (info /= psb_success_) return

    nr  = b%get_nrows()
    nc  = b%get_ncols()
    nza = b%get_nzeros()

    a%psb_z_base_sparse_mat = b%psb_z_base_sparse_mat

    ! Dirty trick: call move_alloc to have the new data allocated just once.
    call move_alloc(b%ia,itemp)
    call move_alloc(b%ja,a%ja)
    call move_alloc(b%val,a%val)
    call psb_realloc(max(nr+1,nc+1),a%irp,info)
    call b%free()

    ! Do not touch a%irp if its allocation failed (this check was missing
    ! in the original).
    if (info /= psb_success_) return

    ! Pass 1: a%irp(i) = number of entries in row i.
    a%irp(:) = 0
    do k=1,nza
      i = itemp(k)
      a%irp(i) = a%irp(i) + 1
    end do

    ! Pass 2: turn counts into 1-based row start positions.
    ip = 1
    do i=1,nr
      ncl = a%irp(i)
      a%irp(i) = ip
      ip = ip + ncl
    end do
    a%irp(nr+1) = ip

    call a%set_host()

  end subroutine psb_z_mv_csr_from_coo


  !
  ! psb_z_mv_csr_to_fmt
  !
  ! Move CSR matrix a into b, whatever the dynamic type of b:
  !   COO     -> delegate to a%mv_to_coo
  !   CSR     -> transfer the three arrays with move_alloc and free a
  !   other   -> go through a temporary COO matrix
  !
  subroutine psb_z_mv_csr_to_fmt(a,b,info)
    use psb_const_mod
    use psb_z_base_mat_mod
    implicit none

    class(psb_z_csr_sparse_mat), intent(inout)  :: a
    class(psb_z_base_sparse_mat), intent(inout) :: b
    integer(psb_ipk_), intent(out)              :: info

    !locals
    type(psb_z_coo_sparse_mat)   :: tmp
    logical                      :: rwshr_
    integer(psb_ipk_)            :: nza, nr, i,j,irw, err_act, nc
    integer(psb_ipk_), Parameter :: maxtry=8
    integer(psb_ipk_)            :: debug_level, debug_unit
    character(len=20)            :: name

    info = psb_success_

    select type (b)
    type is (psb_z_coo_sparse_mat)
      call a%mv_to_coo(b,info)

    ! Need to fix trivial copies!
    type is (psb_z_csr_sparse_mat)
      if (a%is_dev()) call a%sync()
      b%psb_z_base_sparse_mat = a%psb_z_base_sparse_mat
      call move_alloc(a%irp, b%irp)
      call move_alloc(a%ja,  b%ja)
      call move_alloc(a%val, b%val)
      call a%free()
      call b%set_host()

    class default
      call a%mv_to_coo(tmp,info)
      if (info == psb_success_) call b%mv_from_coo(tmp,info)
    end select

  end subroutine psb_z_mv_csr_to_fmt


  !
  ! psb_z_cp_csr_to_fmt
  !
  ! Copy CSR matrix a into b, whatever the dynamic type of b:
  !   COO     -> delegate to a%cp_to_coo
  !   CSR     -> copy irp(1:nrows+1), ja(1:nnz), val(1:nnz) with psb_safe_cpy
  !   other   -> copy to a temporary COO matrix, then move that into b
  !
  subroutine psb_z_cp_csr_to_fmt(a,b,info)
    use psb_const_mod
    use psb_z_base_mat_mod
    use psb_realloc_mod
    implicit none

    class(psb_z_csr_sparse_mat), intent(in)     :: a
    class(psb_z_base_sparse_mat), intent(inout) :: b
    integer(psb_ipk_), intent(out)              :: info

    !locals
    type(psb_z_coo_sparse_mat)   :: tmp
    logical                      :: rwshr_
    integer(psb_ipk_)            :: nz, nr, i,j,irw, err_act, nc
    integer(psb_ipk_), Parameter :: maxtry=8
    integer(psb_ipk_)            :: debug_level, debug_unit
    character(len=20)            :: name

    info = psb_success_

    select type (b)
    type is (psb_z_coo_sparse_mat)
      call a%cp_to_coo(b,info)

    type is (psb_z_csr_sparse_mat)
      if (a%is_dev()) call a%sync()
      b%psb_z_base_sparse_mat = a%psb_z_base_sparse_mat
      nr = a%get_nrows()
      nz = a%get_nzeros()
      ! Only the meaningful prefix of each array is copied.
      if (info == 0) call psb_safe_cpy( a%irp(1:nr+1), b%irp , info)
      if (info == 0) call psb_safe_cpy( a%ja(1:nz),    b%ja  , info)
      if (info == 0) call psb_safe_cpy( a%val(1:nz),   b%val , info)
      call b%set_host()

    class default
      call a%cp_to_coo(tmp,info)
      if (info == psb_success_) call b%mv_from_coo(tmp,info)
    end select

  end subroutine psb_z_cp_csr_to_fmt


  !
  ! psb_z_mv_csr_from_fmt
  !
  ! Move b into CSR matrix a, whatever the dynamic type of b:
  !   COO     -> delegate to a%mv_from_coo
  !   CSR     -> transfer the three arrays with move_alloc and free b
  !   other   -> go through a temporary COO matrix
  !
  subroutine psb_z_mv_csr_from_fmt(a,b,info)
    use psb_const_mod
    use psb_z_base_mat_mod
    implicit none

    class(psb_z_csr_sparse_mat), intent(inout)  :: a
    class(psb_z_base_sparse_mat), intent(inout) :: b
    integer(psb_ipk_), intent(out)              :: info

    !locals
    type(psb_z_coo_sparse_mat)   :: tmp
    logical                      :: rwshr_
    integer(psb_ipk_)            :: nza, nr, i,j,irw, err_act, nc
    integer(psb_ipk_), Parameter :: maxtry=8
    integer(psb_ipk_)            :: debug_level, debug_unit
    character(len=20)            :: name

    info = psb_success_

    select type (b)
    type is (psb_z_coo_sparse_mat)
      call a%mv_from_coo(b,info)

    type is (psb_z_csr_sparse_mat)
      if (b%is_dev()) call b%sync()
      a%psb_z_base_sparse_mat = b%psb_z_base_sparse_mat
      call move_alloc(b%irp, a%irp)
      call move_alloc(b%ja,  a%ja)
      call move_alloc(b%val, a%val)
      call b%free()
      call a%set_host()

    class default
      call b%mv_to_coo(tmp,info)
      if (info == psb_success_) call a%mv_from_coo(tmp,info)
    end select

  end subroutine psb_z_mv_csr_from_fmt


  !
  ! psb_z_cp_csr_from_fmt
  !
  ! Copy b into CSR matrix a, whatever the dynamic type of b:
  !   COO     -> delegate to a%cp_from_coo
  !   CSR     -> copy irp(1:nrows+1), ja(1:nnz), val(1:nnz) with psb_safe_cpy
  !   other   -> copy b to a temporary COO matrix, then move that into a
  !
  subroutine psb_z_cp_csr_from_fmt(a,b,info)
    use psb_const_mod
    use psb_z_base_mat_mod
    use psb_realloc_mod
    implicit none

    class(psb_z_csr_sparse_mat), intent(inout) :: a
    class(psb_z_base_sparse_mat), intent(in)   :: b
    integer(psb_ipk_), intent(out)             :: info

    !locals
    type(psb_z_coo_sparse_mat)   :: tmp
    logical                      :: rwshr_
    integer(psb_ipk_)            :: nz, nr, i,j,irw, err_act, nc
    integer(psb_ipk_), Parameter :: maxtry=8
    integer(psb_ipk_)            :: debug_level, debug_unit
    character(len=20)            :: name

    info = psb_success_

    select type (b)
    type is (psb_z_coo_sparse_mat)
      call a%cp_from_coo(b,info)

    type is (psb_z_csr_sparse_mat)
      if (b%is_dev()) call b%sync()
      a%psb_z_base_sparse_mat = b%psb_z_base_sparse_mat
      nr = b%get_nrows()
      nz = b%get_nzeros()
      ! Only the meaningful prefix of each array is copied.
      if (info == 0) call psb_safe_cpy( b%irp(1:nr+1), a%irp , info)
      if (info == 0) call psb_safe_cpy( b%ja(1:nz)   , a%ja  , info)
      if (info == 0) call psb_safe_cpy( b%val(1:nz)  , a%val , info)
      call a%set_host()

    class default
      call b%cp_to_coo(tmp,info)
      if (info == psb_success_) call a%mv_from_coo(tmp,info)
    end select

  end subroutine psb_z_cp_csr_from_fmt


  !
  ! psb_zcsrspspmm
  !
  ! Sparse-sparse product C = A*B with all three matrices in CSR storage.
  !   a, b  input matrices; a warning is written to psb_err_unit when the
  !         column count of a differs from the row count of b.
  !   c     result; allocated here with an estimated number of nonzeros and
  !         grown inside csr_spspmm if the estimate is too small. Marked
  !         assembled and host-resident on success.
  !   info  psb_success_ on success; otherwise the code reported by
  !         csr_spspmm, which is also pushed on the error stack.
  !
  subroutine psb_zcsrspspmm(a,b,c,info)
    use psb_serial_mod, psb_protect_name => psb_zcsrspspmm
    implicit none

    class(psb_z_csr_sparse_mat), intent(in) :: a,b
    type(psb_z_csr_sparse_mat), intent(out) :: c
    integer(psb_ipk_), intent(out)          :: info

    integer(psb_ipk_) :: nze, ma,na,mb,nb, nzc, nza, nzb,nzeb
    character(len=20) :: name
    integer(psb_ipk_) :: err_act

    name='psb_csrspspmm'
    call psb_erractionsave(err_act)
    info = psb_success_

    if (a%is_dev()) call a%sync()
    if (b%is_dev()) call b%sync()

    ma = a%get_nrows()
    na = a%get_ncols()
    mb = b%get_nrows()
    nb = b%get_ncols()

    ! NOTE(review): a dimension mismatch is only reported, not treated as an
    ! error; the product is still attempted. Consider failing here.
    if ( mb /= na ) then
      write(psb_err_unit,*) 'Mismatch in SPSPMM: ',ma,na,mb,nb
    endif

    nza = a%get_nzeros()
    nzb = b%get_nzeros()

    ! Estimate number of nonzeros on output.
    ! Turns out this is often a large overestimate.
    ! The max(.,1) guards keep the integer divisions defined when an operand
    ! has zero rows or columns; for positive sizes the values are unchanged.
    nzc  = 2*(nza+nzb)
    nze  = ma*(((nza+ma-1)/max(ma,1))*((nzb+mb-1)/max(mb,1)) )
    nzeb = (((nza+na-1)/max(na,1))*((nzb+nb-1)/max(nb,1)))*nb

    call c%allocate(ma,nb,min(nzc,nze,nzeb))

    call csr_spspmm(a,b,c,info)
    ! Do not mark c as assembled if the kernel failed (its info was
    ! previously ignored, leaving the 9999 handler unreachable).
    if (info /= psb_success_) then
      call psb_errpush(info,name)
      goto 9999
    end if

    call c%set_asb()
    call c%set_host()

    call psb_erractionrestore(err_act)
    return

9999 call psb_error_handler(err_act)
    return

  contains

    !
    ! csr_spspmm
    !
    ! Row-by-row product kernel. For each row j of a, the contributions
    ! a(j,k)*b(k,:) are accumulated into the dense work vector `row`;
    ! `irow(col) == j` marks columns already touched for this row and
    ! `idxs(1:nrc)` lists them. The touched columns are then sorted with
    ! psb_msort, appended to c%ja/c%val, and their `row` slots reset.
    ! c%val and c%ja are enlarged with psb_realloc when the current row
    ! would not fit.
    ! info is non-zero only if a psb_realloc call failed.
    !
    subroutine csr_spspmm(a,b,c,info)
      implicit none
      type(psb_z_csr_sparse_mat), intent(in)    :: a,b
      type(psb_z_csr_sparse_mat), intent(inout) :: c
      integer(psb_ipk_), intent(out)            :: info

      integer(psb_ipk_)              :: ma,na,mb,nb
      integer(psb_ipk_), allocatable :: irow(:), idxs(:)
      complex(psb_dpk_), allocatable :: row(:)
      integer(psb_ipk_)              :: i,j,k,irw,icl,icf, iret, &
           & nzc,nnzre, isz, ipb, irwsz, nrc, nze
      complex(psb_dpk_)              :: cfb

      info = psb_success_
      ma = a%get_nrows()
      na = a%get_ncols()
      mb = b%get_nrows()
      nb = b%get_ncols()

      ! Current capacity of the output arrays.
      nze = min(size(c%val),size(c%ja))
      isz = max(ma,na,mb,nb)
      call psb_realloc(isz,row,info)
      if (info == 0) call psb_realloc(isz,idxs,info)
      if (info == 0) call psb_realloc(isz,irow,info)
      if (info /= 0) return

      row  = dzero
      irow = 0
      nzc  = 1

      do j = 1,ma
        c%irp(j) = nzc
        nrc = 0

        do k = a%irp(j), a%irp(j+1)-1
          irw   = a%ja(k)
          cfb   = a%val(k)
          irwsz = b%irp(irw+1)-b%irp(irw)
          do i = b%irp(irw),b%irp(irw+1)-1
            icl = b%ja(i)
            ! NOTE(review): the text from the comparison operator below up to
            ! and including `if (nrc >` was missing from the copy under
            ! review and has been reconstructed from the surrounding
            ! algorithm (marker/accumulator pattern implied by irow, idxs,
            ! row and the copy-out loop). Confirm against the pristine file.
            if (irow(icl) < j) then
              ! First time column icl is touched while building row j.
              nrc = nrc + 1
              idxs(nrc) = icl
              irow(icl) = j
            end if
            row(icl) = row(icl) + cfb*b%val(i)
          end do
        end do

        if (nrc > 0 ) then
          if ((nzc+nrc)>nze) then
            ! Grow the output: extrapolate from the fill so far, but make
            ! room for at least twice the current row.
            nze = max(ma*((nzc+j-1)/j),nzc+2*nrc)
            call psb_realloc(nze,c%val,info)
            if (info == 0) call psb_realloc(nze,c%ja,info)
            if (info /= 0) return
          end if

          call psb_msort(idxs(1:nrc))
          do i=1, nrc
            irw        = idxs(i)
            c%ja(nzc)  = irw
            c%val(nzc) = row(irw)
            ! Reset the accumulator slot for the next row.
            row(irw)   = dzero
            nzc        = nzc + 1
          end do
        end if
      end do

      c%irp(ma+1) = nzc

    end subroutine csr_spspmm

  end subroutine psb_zcsrspspmm

end submodule psb_z_csr_mat_impl_mod