Implement TRIL/TRIU with blocking.

scsr
Salvatore Filippone 7 years ago
parent ce33f6b6ed
commit 663fa5b8e5

@ -645,7 +645,7 @@ subroutine psb_c_base_tril(a,l,info,&
logical, intent(in), optional :: rscale,cscale logical, intent(in), optional :: rscale,cscale
class(psb_c_coo_sparse_mat), optional, intent(out) :: u class(psb_c_coo_sparse_mat), optional, intent(out) :: u
integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k, ibk
integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz
integer(psb_ipk_), allocatable :: ia(:), ja(:) integer(psb_ipk_), allocatable :: ia(:), ja(:)
complex(psb_spk_), allocatable :: val(:) complex(psb_spk_), allocatable :: val(:)
@ -653,6 +653,7 @@ subroutine psb_c_base_tril(a,l,info,&
character(len=20) :: name='tril' character(len=20) :: name='tril'
logical :: rscale_, cscale_ logical :: rscale_, cscale_
logical, parameter :: debug=.false. logical, parameter :: debug=.false.
integer(psb_ipk_), parameter :: nbk=8
call psb_erractionsave(err_act) call psb_erractionsave(err_act)
info = psb_success_ info = psb_success_
@ -715,12 +716,12 @@ subroutine psb_c_base_tril(a,l,info,&
call psb_realloc(max(mb,nb),ia,info) call psb_realloc(max(mb,nb),ia,info)
call psb_realloc(max(mb,nb),ja,info) call psb_realloc(max(mb,nb),ja,info)
call psb_realloc(max(mb,nb),val,info) call psb_realloc(max(mb,nb),val,info)
do i=imin_,imax_ do i=imin_,imax_, nbk
call a%csget(i,i,nzout,ia,ja,val,info,& ibk = min(nbk,imax_-i+1)
call a%csget(i,i+ibk-1,nzout,ia,ja,val,info,&
& jmin=jmin_, jmax=jmax_) & jmin=jmin_, jmax=jmax_)
do k=1, nzout do k=1, nzout
j = ja(k) if ((ja(k)-ia(k))<=diag_) then
if (j-i<=diag_) then
nzlin = nzlin + 1 nzlin = nzlin + 1
l%ia(nzlin) = ia(k) l%ia(nzlin) = ia(k)
l%ja(nzlin) = ja(k) l%ja(nzlin) = ja(k)
@ -796,7 +797,7 @@ subroutine psb_c_base_triu(a,u,info,&
logical, intent(in), optional :: rscale,cscale logical, intent(in), optional :: rscale,cscale
class(psb_c_coo_sparse_mat), optional, intent(out) :: l class(psb_c_coo_sparse_mat), optional, intent(out) :: l
integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k, ibk
integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz
integer(psb_ipk_), allocatable :: ia(:), ja(:) integer(psb_ipk_), allocatable :: ia(:), ja(:)
complex(psb_spk_), allocatable :: val(:) complex(psb_spk_), allocatable :: val(:)
@ -804,6 +805,7 @@ subroutine psb_c_base_triu(a,u,info,&
character(len=20) :: name='triu' character(len=20) :: name='triu'
logical :: rscale_, cscale_ logical :: rscale_, cscale_
logical, parameter :: debug=.false. logical, parameter :: debug=.false.
integer(psb_ipk_), parameter :: nbk=8
call psb_erractionsave(err_act) call psb_erractionsave(err_act)
info = psb_success_ info = psb_success_
@ -866,12 +868,12 @@ subroutine psb_c_base_triu(a,u,info,&
call psb_realloc(max(mb,nb),ia,info) call psb_realloc(max(mb,nb),ia,info)
call psb_realloc(max(mb,nb),ja,info) call psb_realloc(max(mb,nb),ja,info)
call psb_realloc(max(mb,nb),val,info) call psb_realloc(max(mb,nb),val,info)
do i=imin_,imax_ do i=imin_,imax_, nbk
call a%csget(i,i,nzout,ia,ja,val,info,& ibk = min(nbk,imax_-i+1)
call a%csget(i,i+ibk-1,nzout,ia,ja,val,info,&
& jmin=jmin_, jmax=jmax_) & jmin=jmin_, jmax=jmax_)
do k=1, nzout do k=1, nzout
j = ja(k) if ((ja(k)-ia(k))<diag_) then
if (j-i<diag_) then
nzlin = nzlin + 1 nzlin = nzlin + 1
l%ia(nzlin) = ia(k) l%ia(nzlin) = ia(k)
l%ja(nzlin) = ja(k) l%ja(nzlin) = ja(k)

@ -645,7 +645,7 @@ subroutine psb_d_base_tril(a,l,info,&
logical, intent(in), optional :: rscale,cscale logical, intent(in), optional :: rscale,cscale
class(psb_d_coo_sparse_mat), optional, intent(out) :: u class(psb_d_coo_sparse_mat), optional, intent(out) :: u
integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k, ibk
integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz
integer(psb_ipk_), allocatable :: ia(:), ja(:) integer(psb_ipk_), allocatable :: ia(:), ja(:)
real(psb_dpk_), allocatable :: val(:) real(psb_dpk_), allocatable :: val(:)
@ -653,6 +653,7 @@ subroutine psb_d_base_tril(a,l,info,&
character(len=20) :: name='tril' character(len=20) :: name='tril'
logical :: rscale_, cscale_ logical :: rscale_, cscale_
logical, parameter :: debug=.false. logical, parameter :: debug=.false.
integer(psb_ipk_), parameter :: nbk=8
call psb_erractionsave(err_act) call psb_erractionsave(err_act)
info = psb_success_ info = psb_success_
@ -715,12 +716,12 @@ subroutine psb_d_base_tril(a,l,info,&
call psb_realloc(max(mb,nb),ia,info) call psb_realloc(max(mb,nb),ia,info)
call psb_realloc(max(mb,nb),ja,info) call psb_realloc(max(mb,nb),ja,info)
call psb_realloc(max(mb,nb),val,info) call psb_realloc(max(mb,nb),val,info)
do i=imin_,imax_ do i=imin_,imax_, nbk
call a%csget(i,i,nzout,ia,ja,val,info,& ibk = min(nbk,imax_-i+1)
call a%csget(i,i+ibk-1,nzout,ia,ja,val,info,&
& jmin=jmin_, jmax=jmax_) & jmin=jmin_, jmax=jmax_)
do k=1, nzout do k=1, nzout
j = ja(k) if ((ja(k)-ia(k))<=diag_) then
if (j-i<=diag_) then
nzlin = nzlin + 1 nzlin = nzlin + 1
l%ia(nzlin) = ia(k) l%ia(nzlin) = ia(k)
l%ja(nzlin) = ja(k) l%ja(nzlin) = ja(k)
@ -796,7 +797,7 @@ subroutine psb_d_base_triu(a,u,info,&
logical, intent(in), optional :: rscale,cscale logical, intent(in), optional :: rscale,cscale
class(psb_d_coo_sparse_mat), optional, intent(out) :: l class(psb_d_coo_sparse_mat), optional, intent(out) :: l
integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k, ibk
integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz
integer(psb_ipk_), allocatable :: ia(:), ja(:) integer(psb_ipk_), allocatable :: ia(:), ja(:)
real(psb_dpk_), allocatable :: val(:) real(psb_dpk_), allocatable :: val(:)
@ -804,6 +805,7 @@ subroutine psb_d_base_triu(a,u,info,&
character(len=20) :: name='triu' character(len=20) :: name='triu'
logical :: rscale_, cscale_ logical :: rscale_, cscale_
logical, parameter :: debug=.false. logical, parameter :: debug=.false.
integer(psb_ipk_), parameter :: nbk=8
call psb_erractionsave(err_act) call psb_erractionsave(err_act)
info = psb_success_ info = psb_success_
@ -866,12 +868,12 @@ subroutine psb_d_base_triu(a,u,info,&
call psb_realloc(max(mb,nb),ia,info) call psb_realloc(max(mb,nb),ia,info)
call psb_realloc(max(mb,nb),ja,info) call psb_realloc(max(mb,nb),ja,info)
call psb_realloc(max(mb,nb),val,info) call psb_realloc(max(mb,nb),val,info)
do i=imin_,imax_ do i=imin_,imax_, nbk
call a%csget(i,i,nzout,ia,ja,val,info,& ibk = min(nbk,imax_-i+1)
call a%csget(i,i+ibk-1,nzout,ia,ja,val,info,&
& jmin=jmin_, jmax=jmax_) & jmin=jmin_, jmax=jmax_)
do k=1, nzout do k=1, nzout
j = ja(k) if ((ja(k)-ia(k))<diag_) then
if (j-i<diag_) then
nzlin = nzlin + 1 nzlin = nzlin + 1
l%ia(nzlin) = ia(k) l%ia(nzlin) = ia(k)
l%ja(nzlin) = ja(k) l%ja(nzlin) = ja(k)

@ -645,7 +645,7 @@ subroutine psb_s_base_tril(a,l,info,&
logical, intent(in), optional :: rscale,cscale logical, intent(in), optional :: rscale,cscale
class(psb_s_coo_sparse_mat), optional, intent(out) :: u class(psb_s_coo_sparse_mat), optional, intent(out) :: u
integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k, ibk
integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz
integer(psb_ipk_), allocatable :: ia(:), ja(:) integer(psb_ipk_), allocatable :: ia(:), ja(:)
real(psb_spk_), allocatable :: val(:) real(psb_spk_), allocatable :: val(:)
@ -653,6 +653,7 @@ subroutine psb_s_base_tril(a,l,info,&
character(len=20) :: name='tril' character(len=20) :: name='tril'
logical :: rscale_, cscale_ logical :: rscale_, cscale_
logical, parameter :: debug=.false. logical, parameter :: debug=.false.
integer(psb_ipk_), parameter :: nbk=8
call psb_erractionsave(err_act) call psb_erractionsave(err_act)
info = psb_success_ info = psb_success_
@ -715,12 +716,12 @@ subroutine psb_s_base_tril(a,l,info,&
call psb_realloc(max(mb,nb),ia,info) call psb_realloc(max(mb,nb),ia,info)
call psb_realloc(max(mb,nb),ja,info) call psb_realloc(max(mb,nb),ja,info)
call psb_realloc(max(mb,nb),val,info) call psb_realloc(max(mb,nb),val,info)
do i=imin_,imax_ do i=imin_,imax_, nbk
call a%csget(i,i,nzout,ia,ja,val,info,& ibk = min(nbk,imax_-i+1)
call a%csget(i,i+ibk-1,nzout,ia,ja,val,info,&
& jmin=jmin_, jmax=jmax_) & jmin=jmin_, jmax=jmax_)
do k=1, nzout do k=1, nzout
j = ja(k) if ((ja(k)-ia(k))<=diag_) then
if (j-i<=diag_) then
nzlin = nzlin + 1 nzlin = nzlin + 1
l%ia(nzlin) = ia(k) l%ia(nzlin) = ia(k)
l%ja(nzlin) = ja(k) l%ja(nzlin) = ja(k)
@ -796,7 +797,7 @@ subroutine psb_s_base_triu(a,u,info,&
logical, intent(in), optional :: rscale,cscale logical, intent(in), optional :: rscale,cscale
class(psb_s_coo_sparse_mat), optional, intent(out) :: l class(psb_s_coo_sparse_mat), optional, intent(out) :: l
integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k, ibk
integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz
integer(psb_ipk_), allocatable :: ia(:), ja(:) integer(psb_ipk_), allocatable :: ia(:), ja(:)
real(psb_spk_), allocatable :: val(:) real(psb_spk_), allocatable :: val(:)
@ -804,6 +805,7 @@ subroutine psb_s_base_triu(a,u,info,&
character(len=20) :: name='triu' character(len=20) :: name='triu'
logical :: rscale_, cscale_ logical :: rscale_, cscale_
logical, parameter :: debug=.false. logical, parameter :: debug=.false.
integer(psb_ipk_), parameter :: nbk=8
call psb_erractionsave(err_act) call psb_erractionsave(err_act)
info = psb_success_ info = psb_success_
@ -866,12 +868,12 @@ subroutine psb_s_base_triu(a,u,info,&
call psb_realloc(max(mb,nb),ia,info) call psb_realloc(max(mb,nb),ia,info)
call psb_realloc(max(mb,nb),ja,info) call psb_realloc(max(mb,nb),ja,info)
call psb_realloc(max(mb,nb),val,info) call psb_realloc(max(mb,nb),val,info)
do i=imin_,imax_ do i=imin_,imax_, nbk
call a%csget(i,i,nzout,ia,ja,val,info,& ibk = min(nbk,imax_-i+1)
call a%csget(i,i+ibk-1,nzout,ia,ja,val,info,&
& jmin=jmin_, jmax=jmax_) & jmin=jmin_, jmax=jmax_)
do k=1, nzout do k=1, nzout
j = ja(k) if ((ja(k)-ia(k))<diag_) then
if (j-i<diag_) then
nzlin = nzlin + 1 nzlin = nzlin + 1
l%ia(nzlin) = ia(k) l%ia(nzlin) = ia(k)
l%ja(nzlin) = ja(k) l%ja(nzlin) = ja(k)

@ -645,7 +645,7 @@ subroutine psb_z_base_tril(a,l,info,&
logical, intent(in), optional :: rscale,cscale logical, intent(in), optional :: rscale,cscale
class(psb_z_coo_sparse_mat), optional, intent(out) :: u class(psb_z_coo_sparse_mat), optional, intent(out) :: u
integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k, ibk
integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz
integer(psb_ipk_), allocatable :: ia(:), ja(:) integer(psb_ipk_), allocatable :: ia(:), ja(:)
complex(psb_dpk_), allocatable :: val(:) complex(psb_dpk_), allocatable :: val(:)
@ -653,6 +653,7 @@ subroutine psb_z_base_tril(a,l,info,&
character(len=20) :: name='tril' character(len=20) :: name='tril'
logical :: rscale_, cscale_ logical :: rscale_, cscale_
logical, parameter :: debug=.false. logical, parameter :: debug=.false.
integer(psb_ipk_), parameter :: nbk=8
call psb_erractionsave(err_act) call psb_erractionsave(err_act)
info = psb_success_ info = psb_success_
@ -715,12 +716,12 @@ subroutine psb_z_base_tril(a,l,info,&
call psb_realloc(max(mb,nb),ia,info) call psb_realloc(max(mb,nb),ia,info)
call psb_realloc(max(mb,nb),ja,info) call psb_realloc(max(mb,nb),ja,info)
call psb_realloc(max(mb,nb),val,info) call psb_realloc(max(mb,nb),val,info)
do i=imin_,imax_ do i=imin_,imax_, nbk
call a%csget(i,i,nzout,ia,ja,val,info,& ibk = min(nbk,imax_-i+1)
call a%csget(i,i+ibk-1,nzout,ia,ja,val,info,&
& jmin=jmin_, jmax=jmax_) & jmin=jmin_, jmax=jmax_)
do k=1, nzout do k=1, nzout
j = ja(k) if ((ja(k)-ia(k))<=diag_) then
if (j-i<=diag_) then
nzlin = nzlin + 1 nzlin = nzlin + 1
l%ia(nzlin) = ia(k) l%ia(nzlin) = ia(k)
l%ja(nzlin) = ja(k) l%ja(nzlin) = ja(k)
@ -796,7 +797,7 @@ subroutine psb_z_base_triu(a,u,info,&
logical, intent(in), optional :: rscale,cscale logical, intent(in), optional :: rscale,cscale
class(psb_z_coo_sparse_mat), optional, intent(out) :: l class(psb_z_coo_sparse_mat), optional, intent(out) :: l
integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k integer(psb_ipk_) :: err_act, nzin, nzout, i, j, k, ibk
integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz integer(psb_ipk_) :: imin_, imax_, jmin_, jmax_, mb,nb, diag_, nzlin, nzuin, nz
integer(psb_ipk_), allocatable :: ia(:), ja(:) integer(psb_ipk_), allocatable :: ia(:), ja(:)
complex(psb_dpk_), allocatable :: val(:) complex(psb_dpk_), allocatable :: val(:)
@ -804,6 +805,7 @@ subroutine psb_z_base_triu(a,u,info,&
character(len=20) :: name='triu' character(len=20) :: name='triu'
logical :: rscale_, cscale_ logical :: rscale_, cscale_
logical, parameter :: debug=.false. logical, parameter :: debug=.false.
integer(psb_ipk_), parameter :: nbk=8
call psb_erractionsave(err_act) call psb_erractionsave(err_act)
info = psb_success_ info = psb_success_
@ -866,12 +868,12 @@ subroutine psb_z_base_triu(a,u,info,&
call psb_realloc(max(mb,nb),ia,info) call psb_realloc(max(mb,nb),ia,info)
call psb_realloc(max(mb,nb),ja,info) call psb_realloc(max(mb,nb),ja,info)
call psb_realloc(max(mb,nb),val,info) call psb_realloc(max(mb,nb),val,info)
do i=imin_,imax_ do i=imin_,imax_, nbk
call a%csget(i,i,nzout,ia,ja,val,info,& ibk = min(nbk,imax_-i+1)
call a%csget(i,i+ibk-1,nzout,ia,ja,val,info,&
& jmin=jmin_, jmax=jmax_) & jmin=jmin_, jmax=jmax_)
do k=1, nzout do k=1, nzout
j = ja(k) if ((ja(k)-ia(k))<diag_) then
if (j-i<diag_) then
nzlin = nzlin + 1 nzlin = nzlin + 1
l%ia(nzlin) = ia(k) l%ia(nzlin) = ia(k)
l%ja(nzlin) = ja(k) l%ja(nzlin) = ja(k)

Loading…
Cancel
Save