!!$
!!$              Parallel Sparse BLAS  version 3.1
!!$    (C) Copyright 2006, 2007, 2008, 2009, 2010, 2012, 2013
!!$                       Salvatore Filippone    University of Rome Tor Vergata
!!$                       Alfredo Buttari        CNRS-IRIT, Toulouse
!!$
!!$  Redistribution and use in source and binary forms, with or without
!!$  modification, are permitted provided that the following conditions
!!$  are met:
!!$    1. Redistributions of source code must retain the above copyright
!!$       notice, this list of conditions and the following disclaimer.
!!$    2. Redistributions in binary form must reproduce the above copyright
!!$       notice, this list of conditions, and the following disclaimer in the
!!$       documentation and/or other materials provided with the distribution.
!!$    3. The name of the PSBLAS group or the names of its contributors may
!!$       not be used to endorse or promote products derived from this
!!$       software without specific written permission.
!!$
!!$  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
!!$  ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
!!$  TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
!!$  PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE PSBLAS GROUP OR ITS CONTRIBUTORS
!!$  BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
!!$  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
!!$  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
!!$  INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
!!$  CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
!!$  ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
!!$  POSSIBILITY OF SUCH DAMAGE.
!!$
!!$
!
! shift_invert: sample driver that
!   1. reads a matrix (Matrix Market, Harwell-Boeing or adjacency list),
!   2. distributes it over the processes,
!   3. builds b = diag(row sums of a) - a            (subroutine lapl),
!   4. builds a2 = b - sigma*I                        (subroutine csshift),
!   5. runs dim_H Arnoldi steps in which every step solves a system with a2
!      through psb_krylov, filling the Hessenberg matrix H,
!   6. computes the eigenvalues of H with LAPACK ZHSEQR on the root process and
!      maps each of them to sigma + 1/eig,
!   7. appends the last two mapped eigenvalues and the elapsed time to
!      "resultats.dat".
!
! Input, read by the root process from psb_inp_unit in this order:
!   mtrx_file, filefmt, ipart, ptype, kmethd, dim_H, sigma, eps
!
program shift_invert
  use psb_base_mod
  use psb_prec_mod
  use psb_krylov_mod
  use psb_util_mod
  implicit none

  ! input parameters
  character(len=40) :: kmethd, ptype, mtrx_file, rhs_file

  ! sparse matrices and preconditioner
  type(psb_dspmat_type) :: a, aux_a, a2, b
  type(psb_dprec_type)  :: prec

  ! dense matrices
  real(psb_dpk_), allocatable, target        :: aux_b(:,:)
  complex(psb_dpk_), allocatable, target     :: H(:,:), eig(:), work(:), Z(:,:)
  real(psb_dpk_), pointer                    :: b_col_glob(:)
  type(psb_d_vect_type)                      :: b_col
  type(psb_d_vect_type), allocatable, target :: V(:)
  integer(psb_ipk_), allocatable, save       :: indexes(:)

  ! communications data structure
  type(psb_desc_type) :: desc_a
  integer(psb_ipk_)   :: ictxt, iam, np

  ! solver parameters
  integer(psb_ipk_)        :: iter, ircode, ipart, nr, annz
  integer(psb_long_int_k_) :: amatsize, descsize
  real(psb_dpk_)           :: err, eps
  character(len=5)         :: afmt
  character(len=20)        :: name, ch_err
  character(len=2)         :: filefmt
  integer(psb_ipk_), parameter :: iunit    = 12
  integer(psb_ipk_), parameter :: res_unit = 15
  integer(psb_ipk_) :: times = 0

  ! other variables
  integer(psb_ipk_) :: i, info, j, m_problem
  real(psb_dpk_)    :: t1, t2, flops, tflops, tprec, sigma, dotprod, norm
  integer(psb_ipk_) :: nv, dim_H
  integer(psb_ipk_), allocatable :: ivg(:), ipv(:)

  call psb_init(ictxt)
  call psb_info(ictxt,iam,np)

  if (iam < 0) then
    ! This should not happen, but just in case
    call psb_exit(ictxt)
    stop
  endif

  name = 'shift_invert_real'
  ! info must be defined before any jump to 9999, where it is tested.
  info = psb_get_errstatus()
  if (info /= psb_success_) goto 9999
  call psb_set_errverbosity(2)

  !
  ! Hello world
  !
  if (iam == psb_root_) then
    write(*,*) 'Welcome to PSBLAS version: ',psb_version_string_
    write(*,*) 'This is the ',trim(name),' sample program'
    read(psb_inp_unit,*) mtrx_file
    read(psb_inp_unit,*) filefmt
    read(psb_inp_unit,*) ipart
    read(psb_inp_unit,*) ptype
    read(psb_inp_unit,*) kmethd
    read(psb_inp_unit,*) dim_H
    read(psb_inp_unit,*) sigma
    read(psb_inp_unit,*) eps
  end if
  call psb_bcast(ictxt,mtrx_file)
  call psb_bcast(ictxt,filefmt)
  call psb_bcast(ictxt,ipart)
  call psb_bcast(ictxt,dim_H)
  call psb_bcast(ictxt,kmethd)
  call psb_bcast(ictxt,ptype)
  call psb_bcast(ictxt,sigma)
  call psb_bcast(ictxt,eps)

  ! The code below reads eig(dim_H-1) and eig(dim_H), so a Krylov subspace
  ! of dimension smaller than 2 cannot be handled.  Every process holds the
  ! same dim_H after the broadcast, hence they all leave together.
  if (dim_H < 2) then
    if (iam == psb_root_) &
         & write(psb_err_unit,*) 'Krylov subspace dimension must be at least 2, got ', dim_H
    call psb_exit(ictxt)
    stop
  end if

  rhs_file = 'NONE'
  afmt     = 'CSR'
  call psb_barrier(ictxt)
  t1 = psb_wtime()

  ! read the input matrix to be processed and (possibly) the rhs
  if (iam == psb_root_) then
    select case(psb_toupper(filefmt))
    case('MM')
      ! For Matrix Market we have an input file for the matrix
      ! and an (optional) second file for the RHS.
      call mm_mat_read(aux_a,info,iunit=iunit,filename=mtrx_file)
      if (info == psb_success_) then
        if (rhs_file /= 'NONE') then
          call mm_array_read(aux_b,info,iunit=iunit,filename=rhs_file)
        end if
      end if

    case ('HB')
      ! For Harwell-Boeing we have a single file which may or may not
      ! contain an RHS.
      call hb_read(aux_a,info,iunit=iunit,b=aux_b,filename=mtrx_file)

    case ('AD')
      ! Adjacency list: see adj_read below.
      call adj_read(aux_a,mtrx_file,iunit,desc_a,info)

    case default
      info = -1
      write(psb_err_unit,*) 'Wrong choice for fileformat ', filefmt
    end select
    if (info /= psb_success_) then
      write(psb_err_unit,*) 'Error while reading input matrix '
      call psb_abort(ictxt)
    end if

    m_problem = aux_a%get_nrows()
    annz      = aux_a%get_nzeros()
    call psb_bcast(ictxt,m_problem)

    ! At this point aux_b may still be unallocated
    if (psb_size(aux_b,dim=1) == m_problem) then
      ! if any rhs were present, broadcast the first one
      write(psb_err_unit,'("Ok, got an rhs ")')
      b_col_glob => aux_b(:,1)
    else
      ! write(psb_out_unit,'("Generating an rhs...")')
      ! write(psb_out_unit,'(" ")')
      call psb_realloc(m_problem,1,aux_b,ircode)
      if (ircode /= 0) then
        info = psb_err_alloc_dealloc_
        call psb_errpush(info,name)
        goto 9999
      endif
      b_col_glob => aux_b(:,1)
      ! No rhs supplied: use a vector of all ones.
      b_col_glob(1:m_problem) = 1.0_psb_dpk_
    endif
    call psb_bcast(ictxt,b_col_glob(1:m_problem))

  else

    call psb_bcast(ictxt,m_problem)
    call psb_realloc(m_problem,1,aux_b,ircode)
    if (ircode /= 0) then
      info = psb_err_alloc_dealloc_
      call psb_errpush(info,name)
      goto 9999
    endif
    b_col_glob => aux_b(:,1)
    call psb_bcast(ictxt,b_col_glob(1:m_problem))

  end if

  ! switch over different partition types
  if (ipart == 0) then
    call psb_barrier(ictxt)
    if (iam == psb_root_) write(psb_out_unit,'("Partition type: block")')
    allocate(ivg(m_problem),ipv(np))
    do i = 1, m_problem
      call part_block(i,m_problem,np,ipv,nv)
      ivg(i) = ipv(1)
    enddo
    call psb_matdist(aux_a, a, ictxt, &
         & desc_a,b_col_glob,b_col,info,fmt=afmt,v=ivg)

  else if (ipart == 2) then
    if (iam == psb_root_) then
      !write(psb_out_unit,'("Partition type: graph")')
      !write(psb_out_unit,'(" ")')
      ! write(psb_err_unit,'("Build type: graph")')
      call build_mtpart(aux_a,np)
    endif
    call psb_barrier(ictxt)
    call distr_mtpart(psb_root_,ictxt)
    call getv_mtpart(ivg)
    call psb_matdist(aux_a, a, ictxt, &
         & desc_a,b_col_glob,b_col,info,fmt=afmt,v=ivg)

  else
    if (iam == psb_root_) write(psb_out_unit,'("Partition type: block")')
    call psb_matdist(aux_a, a, ictxt, &
         & desc_a,b_col_glob,b_col,info,fmt=afmt,parts=part_block)
  end if

  ! b = diag(row sums of a) - a
  call lapl(a,b)
  !
  ! a2 = b - sigma*I
  !
  !sigma = 100
  call csshift(b,a2,sigma,ictxt)

  !
  !  prepare the preconditioner.
  !
  !if(iam == psb_root_) write(psb_out_unit,'("Setting preconditioner to : ", a) ') ptype
  call psb_precinit(prec,ptype,info)

  call psb_barrier(ictxt)
  !t1 = psb_wtime()
  call psb_precbld(a2,desc_a,prec,info)
  if (info /= psb_success_) then
    info   = psb_err_from_subroutine_
    ch_err = 'psb_precbld'
    call psb_errpush(info,name,a_err=ch_err)
    goto 9999
  end if

  ! t1 was taken before the matrix was read, so tprec covers everything
  ! from that point up to the end of the preconditioner build.
  tprec = psb_wtime()-t1
  if (iam == psb_root_) write(psb_out_unit,'("Preconditioner time : ",es12.5)') tprec

  ! Hessenberg matrix, zeroed so that the entries the Arnoldi loop never
  ! writes (below the sub-diagonal) are defined when handed to ZHSEQR.
  allocate(H(dim_H,dim_H))
  H = cmplx(0.0_psb_dpk_, 0.0_psb_dpk_, kind=psb_dpk_)

  ! Krylov basis: dim_H+1 distributed vectors.
  allocate(V(dim_H+1))
  do i = 1, dim_H+1
    call psb_geall(V(i),desc_a,info)
    if (info == psb_success_) call psb_geasb(V(i),desc_a,info)
    if (info /= psb_success_) then
      info   = psb_err_from_subroutine_
      ch_err = 'psb_geall/psb_geasb'
      call psb_errpush(info,name,a_err=ch_err)
      goto 9999
    end if
  enddo
  ! Starting vector: all entries set to done.
  call V(1)%set(done)

  ! Define t2 before reducing it (it used to be reduced while undefined).
  t2 = psb_wtime()-t1
  call psb_amx(ictxt, t2)

  !if (iam==psb_root_) then
  !  write(psb_out_unit,'(" ")')
  !  write(psb_out_unit,'("Time to read and partition matrix : ",es12.5)')t2
  !  write(psb_out_unit,'(" ")')
  !end if

  call psb_barrier(ictxt)
  t2 = psb_wtime()-t1-tprec
  ! NOTE(review): this prints the time elapsed since tprec was taken, under
  ! the same label as the line above; the label looks like a copy/paste
  ! left-over.  The text is kept unchanged in case the output is parsed.
  if (iam == psb_root_) write(psb_out_unit,'("Preconditioner time : ",es12.5)') t2

  ! Normalise the starting vector: V(1) = dzero*V(1) + (1/||V(1)||)*V(1)
  ! NOTE(review): a zero norm here or inside the loop (Arnoldi breakdown)
  ! is not handled.
  norm = psb_norm2(V(1),desc_a,info)
  norm = 1/norm
  call psb_geaxpby(dzero,V(1),norm,V(1),desc_a,info)

  do i = 2, dim_H+1
    ! Solve a2*V(i) = V(i-1)
    call psb_krylov(kmethd,a2,prec,V(i-1),V(i),eps,desc_a,info,&
         & itmax=1000,iter=iter,err=err,itrace=-1,istop=2,irst=002)
    if (info /= psb_success_) then
      info   = psb_err_from_subroutine_
      ch_err = 'psb_krylov'
      call psb_errpush(info,name,a_err=ch_err)
      goto 9999
    end if
    !if (iam==psb_root_) write(*,'("iter : "i20)') iter

    ! Gram-Schmidt orthogonalisation against the previous basis vectors.
    ! kind= is required on cmplx: without it the result is default
    ! (single precision) complex and the entry loses precision.
    do j = 1, i-1
      dotprod = psb_gedot(V(i),V(j),desc_a,info)               ! dotprod = (V(i) dot V(j))
      call psb_geaxpby(-dotprod,V(j),done,V(i),desc_a,info)    ! V(i) = V(i) - V(j)*dotprod
      H(j,i-1) = cmplx(dotprod, 0.0_psb_dpk_, kind=psb_dpk_)
    end do

    norm = psb_norm2(V(i),desc_a,info)
    ! The last step has no sub-diagonal entry inside the dim_H x dim_H matrix.
    if (i /= dim_H+1) then
      H(i,i-1) = cmplx(norm, 0.0_psb_dpk_, kind=psb_dpk_)
    endif
    norm = 1/norm
    call psb_geaxpby(dzero,V(i),norm,V(i),desc_a,info)
  enddo

  t2 = psb_wtime()-t1-tprec
  if (iam == psb_root_) write(psb_out_unit,'("temps de arnoldi : " ,es12.5 )') t2

  if (iam == psb_root_) then
    allocate(eig(dim_H),work(dim_H),Z(dim_H,dim_H),indexes(dim_H),stat=info)
    if (info /= 0) then
      write(psb_err_unit,*) 'Error while allocating the eigenvalue workspace'
      call psb_abort(ictxt)
    end if

    ! Eigenvalues only ('E'), no Schur vectors ('N').
    call zhseqr('E','N',dim_H,1,dim_H,H,dim_H,eig,Z,dim_H,work,dim_H,info)
    if (info /= 0) then
      write(psb_err_unit,*) 'ZHSEQR failed, info = ', info
      call psb_abort(ictxt)
    end if

    ! sort H's eigenvalues
    call psb_qsort(eig,indexes,psb_alsort_up_,psb_sort_ovw_idx_)

    ! Map every eigenvalue of H to sigma + 1/eig, in full double precision.
    eig = sigma + 1.0_psb_dpk_/eig
    !write(psb_out_unit, '("eig(i), i", g20.4, i10)')real(eig(i)),i
  end if

  call psb_barrier(ictxt)
  t2 = psb_wtime() - t1
  call psb_amx(ictxt,t2)

  nr       = desc_a%get_global_rows()
  amatsize = psb_sizeof(a)
  descsize = psb_sizeof(desc_a)
  call psb_sum(ictxt,annz)
  call psb_sum(ictxt,amatsize)
  call psb_sum(ictxt,descsize)

  if (iam == psb_root_) then
    flops  = 2.d0*times*annz
    tflops = flops
    !write(psb_out_unit,'("Matrix: ",a)') mtrx_file
    !write(psb_out_unit,'("Test on                : ",i20," processors")') np
    !write(psb_out_unit,'("Size of matrix         : ",i20,"           ")') nr
    !write(psb_out_unit,'("Number of nonzeros     : ",i20,"           ")') annz
    !write(psb_out_unit,'("Memory occupation      : ",i20,"           ")') amatsize
    !write(psb_out_unit,'("Number of flops (",i0," iters) : ",F20.0,"           ")') times,flops
    !write(*,'("eigenvalues near from ", g20.4," : ")') sigma
    !do i=dim_H/3,dim_H
    !   write(psb_out_unit,'(g20.4,g20.4)')real(eig(i)),aimag(eig(i))
    !enddo

    ! Append the real parts of the last two sorted, mapped eigenvalues
    ! and the total elapsed time.
    open(res_unit, FILE="resultats.dat", position = 'append',ACTION="WRITE")
    write (res_unit,'(F20.6,F20.6,F20.4)') real(eig(dim_H-1)),real(eig(dim_H)),t2
    close(res_unit)
    deallocate(work,eig,Z,indexes)
  end if

  call psb_gefree(b_col, desc_a,info)
  call psb_spfree(a,  desc_a,info)
  call psb_spfree(a2, desc_a,info)
  call psb_spfree(b,  desc_a,info)
  ! Release all dim_H+1 basis vectors while desc_a is still valid.
  do i = 1, dim_H+1
    call psb_gefree(V(i), desc_a,info)
  enddo
  call psb_cdfree(desc_a,info)
  deallocate(H)
  deallocate(V)

9999 continue
  if (info /= 0) then
    call psb_error(ictxt)
  end if
  call psb_exit(ictxt)
  stop

contains

  !
  ! csshift: b = a - sigma*I
  !   a     (in)  source matrix
  !   b     (out) shifted matrix, converted to CSR
  !   sigma (in)  shift; when it is zero b is a plain copy of a
  !   ictx  (in)  unused, kept for interface compatibility
  !
  subroutine csshift(a,b,sigma,ictx)
    type(psb_dspmat_type), intent(in)  :: a
    type(psb_dspmat_type), intent(out) :: b
    real(psb_dpk_), intent(in)         :: sigma
    integer(psb_ipk_), intent(in)      :: ictx

    type(psb_d_coo_sparse_mat) :: acoo
    integer(psb_ipk_) :: nz, n, info, i

    call a%cp_to(acoo)
    if (sigma /= 0.0) then
      nz = acoo%get_nzeros()
      n  = a%get_nrows()
      ! Append one (i,i,-sigma) triple per row; duplicates are summed
      ! by fix() because of psb_dupl_add_.
      call acoo%reallocate(nz+n)
      call acoo%set_dupl(psb_dupl_add_)
      do i = 1, n
        acoo%val(nz+i) = -sigma
        acoo%ia(nz+i)  = i
        acoo%ja(nz+i)  = i
      enddo
      call acoo%set_nzeros(nz+n)
      call acoo%fix(info)
      ! do i=1,nz
      !   if(acoo%ja(i)==acoo%ia(i)) then
      !     write(psb_out_unit,'(i10,i10,g20.4)')acoo%ja(i),i, acoo%val(i)
      !   end if
      ! enddo
      !write(psb_out_unit,'("autant de nzeros apres fix ?",i10)') acoo%get_nzeros()-nz
    end if
    call b%mv_from(acoo)
    call b%cscnv(info,type='CSR')
  end subroutine csshift

  !
  ! adj_read: read a square pattern matrix from a text file.
  !   The first record holds "nrows nnzero"; each of the following nnzero
  !   records holds a zero-based "row column" pair.  Every entry gets the
  !   value 1.
  !   a        (inout) resulting matrix, in CSR storage
  !   filename (in)    file to read
  !   iunit    (in)    Fortran unit used for reading
  !   desc_a           unused, kept for interface compatibility
  !   info     (out)   -1 when the file cannot be opened or read, otherwise
  !                    the code returned by the last matrix operation
  !
  subroutine adj_read(a,filename,iunit,desc_a,info)
    type(psb_dspmat_type), intent(inout) :: a
    character(len=40), intent(in)        :: filename
    integer(psb_ipk_), intent(in)        :: iunit
    type(psb_desc_type), intent(inout)   :: desc_a
    integer(psb_ipk_), intent(out)       :: info

    integer(psb_ipk_) :: i, nnzero, nrows
    integer           :: ios
    type(psb_d_coo_sparse_mat) :: acoo

    info = psb_success_

    open(iunit, FILE=filename, STATUS="OLD", ACTION="READ", iostat=ios)
    if (ios /= 0) then
      info = -1
      return
    end if

    read(iunit, *, iostat=ios) nrows, nnzero
    if (ios /= 0) then
      close(UNIT=iunit)
      info = -1
      return
    end if

    call acoo%allocate(nrows,nrows,nnzero)
    do i = 1, nnzero
      read(iunit, *, iostat=ios) acoo%ia(i), acoo%ja(i)
      if (ios /= 0) then
        close(UNIT=iunit)
        info = -1
        return
      end if
      ! The file is zero-based, the matrix is one-based.
      acoo%ia(i)  = acoo%ia(i)+1
      acoo%ja(i)  = acoo%ja(i)+1
      acoo%val(i) = 1.0_psb_dpk_
    end do
    close(UNIT=iunit)

    !call psb_spall(a,desc_a,info,nnzero)
    !call psb_spins(nnzero, ia, ja, val, a, desc_a, info)
    call acoo%set_nzeros(nnzero)
    call acoo%fix(info)
    call a%mv_from(acoo)
    call a%cscnv(info,type='csr')
  end subroutine adj_read

  !
  ! lapl: b = diag(k) - a, where k(i) is the sum of the stored entries
  !       of row i of a.
  !   a (in)  source matrix
  !   b (out) result, converted to CSR
  !
  subroutine lapl(a,b)
    type(psb_dspmat_type), intent(in)  :: a
    type(psb_dspmat_type), intent(out) :: b

    type(psb_d_coo_sparse_mat) :: acoo
    integer(psb_ipk_) :: nz, n, info, i
    real(psb_dpk_), allocatable :: K(:)

    call a%cp_to(acoo)
    nz = acoo%get_nzeros()
    n  = a%get_nrows()

    allocate(K(n))
    K = 0

    ! Accumulate the row sums and negate the stored entries in one pass.
    do i = 1, nz
      K(acoo%ia(i)) = K(acoo%ia(i))+acoo%val(i)
      acoo%val(i)   = -acoo%val(i)
    enddo

    ! Append one (i,i,K(i)) triple per row; duplicates are summed by fix()
    ! because of psb_dupl_add_.
    call acoo%reallocate(nz+n)
    call acoo%set_dupl(psb_dupl_add_)
    do i = 1, n
      acoo%val(nz+i) = K(i)
      acoo%ia(nz+i)  = i
      acoo%ja(nz+i)  = i
    enddo
    call acoo%set_nzeros(nz+n)
    call acoo%fix(info)
    ! do i=1,nz
    !   if(acoo%ja(i)==acoo%ia(i)) then
    !     write(psb_out_unit,'(i10,i10,g20.4)')acoo%ia(i),acoo%ja(i),acoo%val(i)
    !   end if
    ! enddo
    call b%mv_from(acoo)
    call b%cscnv(info,type='CSR')
    deallocate(K)
  end subroutine lapl

end program shift_invert