From 663fa5b8e5e7b85f994213c75ac378bd4f22f812 Mon Sep 17 00:00:00 2001 From: Salvatore Filippone Date: Fri, 27 Jul 2018 14:36:46 +0100 Subject: [PATCH] Implement TRIL/TRIU with blocking. --- base/serial/impl/psb_c_base_mat_impl.F90 | 22 ++++++++++++---------- base/serial/impl/psb_d_base_mat_impl.F90 | 22 ++++++++++++---------- base/serial/impl/psb_s_base_mat_impl.F90 | 22 ++++++++++++---------- base/serial/impl/psb_z_base_mat_impl.F90 | 22 ++++++++++++---------- 4 files changed, 48 insertions(+), 40 deletions(-) diff --git a/base/serial/impl/psb_c_base_mat_impl.F90 b/base/serial/impl/psb_c_base_mat_impl.F90 index 954e2143..9a81f286 100644 --- a/base/serial/impl/psb_c_base_mat_impl.F90 +++ b/base/serial/impl/psb_c_base_mat_impl.F90 @@ -645,7 +645,7 @@ subroutine psb_c_base_tril(a,l,info,& logical, intent(in), optional :: rscale,cscale class(psb_c_coo_sparse_mat), optional, intent(out) :: u - integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k + integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k, ibk integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz integer(psb_ipk_), allocatable :: ia(:), ja(:) complex(psb_spk_), allocatable :: val(:) @@ -653,6 +653,7 @@ subroutine psb_c_base_tril(a,l,info,& character(len=20) :: name='tril' logical :: rscale_, cscale_ logical, parameter :: debug=.false. + integer(psb_ipk_), parameter :: nbk=8 call psb_erractionsave(err_act) info = psb_success_ @@ -715,12 +716,12 @@ subroutine psb_c_base_tril(a,l,info,& call psb_realloc(max(mb,nb),ia,info) call psb_realloc(max(mb,nb),ja,info) call psb_realloc(max(mb,nb),val,info) - do i=imin_,imax_ - call a%csget(i,i,nzout,ia,ja,val,info,& + do i=imin_,imax_, nbk + ibk = min(nbk,imax_-i+1) + call a%csget(i,i+ibk-1,nzout,ia,ja,val,info,& & jmin=jmin_, jmax=jmax_) do k=1, nzout - j = ja(k) - if (j-i<=diag_) then + if ((ja(k)-ia(k))<=diag_) then nzlin = nzlin + 1 l%ia(nzlin) = ia(k) l%ja(nzlin) = ja(k) @@ -796,7 +797,7 @@ subroutine psb_c_base_triu(a,u,info,& logical, intent(in), optional :: rscale,cscale class(psb_c_coo_sparse_mat), optional, intent(out) :: l - integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k + integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k, ibk integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz integer(psb_ipk_), allocatable :: ia(:), ja(:) complex(psb_spk_), allocatable :: val(:) @@ -804,6 +805,7 @@ subroutine psb_c_base_triu(a,u,info,& character(len=20) :: name='triu' logical :: rscale_, cscale_ logical, parameter :: debug=.false. + integer(psb_ipk_), parameter :: nbk=8 call psb_erractionsave(err_act) info = psb_success_ @@ -866,12 +868,12 @@ subroutine psb_c_base_triu(a,u,info,& call psb_realloc(max(mb,nb),ia,info) call psb_realloc(max(mb,nb),ja,info) call psb_realloc(max(mb,nb),val,info) - do i=imin_,imax_ - call a%csget(i,i,nzout,ia,ja,val,info,& + do i=imin_,imax_, nbk + ibk = min(nbk,imax_-i+1) + call a%csget(i,i+ibk-1,nzout,ia,ja,val,info,& & jmin=jmin_, jmax=jmax_) do k=1, nzout - j = ja(k) - if (j-i