! ! Parallel Sparse BLAS version 3.5 ! (C) Copyright 2006-2018 ! Salvatore Filippone ! Alfredo Buttari ! ! Redistribution and use in source and binary forms, with or without ! modification, are permitted provided that the following conditions ! are met: ! 1. Redistributions of source code must retain the above copyright ! notice, this list of conditions and the following disclaimer. ! 2. Redistributions in binary form must reproduce the above copyright ! notice, this list of conditions, and the following disclaimer in the ! documentation and/or other materials provided with the distribution. ! 3. The name of the PSBLAS group or the names of its contributors may ! not be used to endorse or promote products derived from this ! software without specific written permission. ! ! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS ! ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED ! TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR ! PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE PSBLAS GROUP OR ITS CONTRIBUTORS ! BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR ! CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF ! SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS ! INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN ! CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ! ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE ! POSSIBILITY OF SUCH DAMAGE. ! ! 
module psi_d_collective_mod use psi_penv_mod use psb_desc_const_mod interface psb_max module procedure psb_dmaxs, psb_dmaxv, psb_dmaxm end interface interface psb_min module procedure psb_dmins, psb_dminv, psb_dminm end interface psb_min interface psb_nrm2 module procedure psb_d_nrm2s, psb_d_nrm2v end interface psb_nrm2 interface psb_sum module procedure psb_dsums, psb_dsumv, psb_dsumm end interface interface psb_amx module procedure psb_damxs, psb_damxv, psb_damxm end interface interface psb_amn module procedure psb_damns, psb_damnv, psb_damnm end interface interface psb_bcast module procedure psb_dbcasts, psb_dbcastv, psb_dbcastm end interface psb_bcast interface psb_scan_sum module procedure psb_dscan_sums, psb_dscan_sumv end interface psb_scan_sum interface psb_exscan_sum module procedure psb_dexscan_sums, psb_dexscan_sumv end interface psb_exscan_sum interface psb_simple_a2av module procedure psb_d_simple_a2av end interface psb_simple_a2av interface psb_simple_triad_a2av module procedure psb_d_e_simple_triad_a2av, psb_d_m_simple_triad_a2av end interface psb_simple_triad_a2av contains ! !!!!!!!!!!!!!!!!!!!!!! ! ! Reduction operations ! ! !!!!!!!!!!!!!!!!!!!!!! ! !!!!!!!!!!!!!!!!!!!!!!!!!!!!!! ! ! MAX ! ! !!!!!!!!!!!!!!!!!!!!!!!!!!!!!! 
!
! Conventions shared by every routine in this section.
!
!   ctxt    - context; the MPI communicator is obtained from it through
!             psb_get_mpi_comm and the local process index through psb_info.
!   dat     - data, overwritten in place with the result.
!   root    - optional. Reductions: when absent (internally -1) the result
!             is delivered to every process (allreduce); otherwise only to
!             process root. Broadcasts: the sender, psb_root_ when absent.
!   mode    - optional bit mask tested against psb_collective_start_ and
!             psb_collective_end_. It is only honoured when request is
!             present too; otherwise the call is blocking.
!   request - optional MPI request handle; filled in by the "start" phase
!             and waited on by the "end" phase.
!
! With SERIAL_MPI defined the executable part is compiled out and dat is
! returned untouched.
!
! Rooted reductions: MPI_IN_PLACE may be used as send buffer only by the
! root process. Every other process therefore sends dat and supplies a
! throw-away receive buffer (dat_), which MPI does not access on non-root
! processes. iam, as returned by psb_info, is taken to be this process's
! rank in the communicator returned by psb_get_mpi_comm.
!
! NOTE(review): in the non-blocking variants dat must stay valid and
! contiguous until the matching "end" call - confirm at the call sites.
!

!
! psb_dmaxs: MAX reduction of a scalar.
!
subroutine psb_dmaxs(ctxt,dat,root,mode,request)
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,mpi_max,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,mpi_max,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,1,psb_mpi_r_dpk_,mpi_max,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_max,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_max,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,1,psb_mpi_r_dpk_,&
           & mpi_max,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dmaxs

!
! psb_dmaxv: element-wise MAX reduction of a rank-1 array.
!
subroutine psb_dmaxv(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_(1)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dmaxv

!
! psb_dmaxm: element-wise MAX reduction of a rank-2 array.
!
subroutine psb_dmaxm(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:,:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_(1,1)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_max,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dmaxm

!
! MIN: Minimum Value
!

!
! psb_dmins: MIN reduction of a scalar.
!
subroutine psb_dmins(ctxt,dat,root,mode,request)
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,mpi_min,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,mpi_min,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,1,psb_mpi_r_dpk_,mpi_min,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_min,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_min,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,1,psb_mpi_r_dpk_,&
           & mpi_min,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dmins

!
! psb_dminv: element-wise MIN reduction of a rank-1 array.
!
subroutine psb_dminv(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_(1)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dminv

!
! psb_dminm: element-wise MIN reduction of a rank-2 array.
!
subroutine psb_dminm(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:,:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_(1,1)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_min,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dminm

! !!!!!!!!!!!!
!
! Norm 2, only for reals
!
! !!!!!!!!!!!!

!
! psb_d_nrm2s: reduction of a scalar with the mpi_dnrm2_op operator.
!
subroutine psb_d_nrm2s(ctxt,dat,root,mode,request)
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,1,psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,1,psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_d_nrm2s

!
! psb_d_nrm2v: element-wise reduction of a rank-1 array with the
! mpi_dnrm2_op operator.
!
subroutine psb_d_nrm2v(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_(1)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_dnrm2_op,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_d_nrm2v

!
! SUM
!

!
! psb_dsums: SUM reduction of a scalar.
!
subroutine psb_dsums(ctxt,dat,root,mode,request)
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,mpi_sum,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,mpi_sum,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,1,psb_mpi_r_dpk_,mpi_sum,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_sum,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_sum,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,1,psb_mpi_r_dpk_,&
           & mpi_sum,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dsums

!
! psb_dsumv: element-wise SUM reduction of a rank-1 array.
!
subroutine psb_dsumv(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_(1)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dsumv

!
! psb_dsumm: element-wise SUM reduction of a rank-2 array.
!
subroutine psb_dsumm(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:,:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_(1,1)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_sum,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dsumm

!
! AMX: Maximum Absolute Value
!

!
! psb_damxs: reduction of a scalar with the mpi_damx_op operator.
!
subroutine psb_damxs(ctxt,dat,root,mode,request)
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_damx_op,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,1,psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_damx_op,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,1,psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_damxs

!
! psb_damxv: element-wise reduction of a rank-1 array with the
! mpi_damx_op operator.
!
subroutine psb_damxv(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_(1)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_damxv

!
! psb_damxm: element-wise reduction of a rank-2 array with the
! mpi_damx_op operator.
!
subroutine psb_damxm(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:,:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_(1,1)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_damx_op,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_damxm

!
! AMN: Minimum Absolute Value
!

!
! psb_damns: reduction of a scalar with the mpi_damn_op operator.
!
subroutine psb_damns(ctxt,dat,root,mode,request)
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_damn_op,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,1,psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_damn_op,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,1,psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,1,psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_damns

!
! psb_damnv: element-wise reduction of a rank-1 array with the
! mpi_damn_op operator.
!
subroutine psb_damnv(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_(1)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_damnv

!
! psb_damnm: element-wise reduction of a rank-2 array with the
! mpi_damn_op operator.
!
subroutine psb_damnm(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:,:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  real(psb_dpk_)    :: dat_(1,1)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = -1
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    if (root_ == -1) then
      call mpi_allreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,icomm,info)
    else if (iam == root_) then
      call mpi_reduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,info)
    else
      ! Non-root: MPI_IN_PLACE is not allowed here, send dat itself.
      call mpi_reduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,info)
    end if
  else if (collective_start) then
    if (root_ == -1) then
      call mpi_iallreduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,icomm,request,info)
    else if (iam == root_) then
      call mpi_ireduce(mpi_in_place,dat,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,request,info)
    else
      call mpi_ireduce(dat,dat_,size(dat),psb_mpi_r_dpk_,&
           & mpi_damn_op,root_,icomm,request,info)
    end if
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_damnm

!
! BCAST Broadcast
!

!
! psb_dbcasts: broadcast of a scalar from root (psb_root_ when absent).
!
subroutine psb_dbcasts(ctxt,dat,root,mode,request)
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = psb_root_
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    call mpi_bcast(dat,1,psb_mpi_r_dpk_,root_,icomm,info)
  else if (collective_start) then
    call mpi_ibcast(dat,1,psb_mpi_r_dpk_,root_,icomm,request,info)
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dbcasts

!
! psb_dbcastv: broadcast of a rank-1 array from root (psb_root_ when
! absent); size(dat) elements are transferred.
!
subroutine psb_dbcastv(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = psb_root_
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    call mpi_bcast(dat,size(dat),psb_mpi_r_dpk_,root_,icomm,info)
  else if (collective_start) then
    call mpi_ibcast(dat,size(dat),psb_mpi_r_dpk_,root_,icomm,request,info)
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dbcastv

!
! psb_dbcastm: broadcast of a rank-2 array from root (psb_root_ when
! absent); size(dat) elements are transferred.
!
subroutine psb_dbcastm(ctxt,dat,root,mode,request)
  use psb_realloc_mod
#ifdef MPI_MOD
  use mpi
#endif
  implicit none
#ifdef MPI_H
  include 'mpif.h'
#endif
  type(psb_ctxt_type), intent(in)            :: ctxt
  real(psb_dpk_), intent(inout)              :: dat(:,:)
  integer(psb_mpk_), intent(in), optional    :: root
  integer(psb_ipk_), intent(in), optional    :: mode
  integer(psb_mpk_), intent(inout), optional :: request
  integer(psb_mpk_) :: root_
  integer(psb_mpk_) :: iam, np, info
  integer(psb_mpk_) :: icomm
  integer(psb_mpk_) :: status(mpi_status_size)
  logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
  call psb_info(ctxt,iam,np)
  root_ = psb_root_
  if (present(root)) root_ = root
  icomm = psb_get_mpi_comm(ctxt)

  ! Non-blocking only when both mode and request are supplied.
  collective_sync  = .true.
  collective_start = .false.
  collective_end   = .false.
  if (present(mode)) then
    if (present(request)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end if

  if (collective_sync) then
    call mpi_bcast(dat,size(dat),psb_mpi_r_dpk_,root_,icomm,info)
  else if (collective_start) then
    call mpi_ibcast(dat,size(dat),psb_mpi_r_dpk_,root_,icomm,request,info)
  else if (collective_end) then
    call mpi_wait(request,status,info)
  end if
#endif
end subroutine psb_dbcastm

! !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
!
!  SCAN
!
! !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
subroutine psb_dscan_sums(ctxt,dat,mode,request)
    !
    ! Inclusive prefix sum (mpi_scan with mpi_sum) of the scalar DAT over
    ! the communicator of CTXT, computed in place.
    !
    ! MODE/REQUEST select the phase for this and the other scan routines:
    !   - MODE absent, or REQUEST absent: blocking call;
    !   - psb_collective_start_ bit set:  non-blocking start, handle
    !     returned in REQUEST;
    !   - else psb_collective_end_ bit set: mpi_wait on REQUEST.
    ! With SERIAL_MPI defined DAT is left unchanged.
    !
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    real(psb_dpk_), intent(inout)              :: dat
    integer(psb_ipk_) :: iam, np
    integer(psb_mpk_) :: minfo
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    icomm = psb_get_mpi_comm(ctxt)

    if (present(mode)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
      if (.not.present(request)) then
        ! No handle to return: fall back to the blocking call.
        collective_sync  = .true.
        collective_start = .false.
        collective_end   = .false.
      end if
    else
      collective_sync  = .true.
      collective_start = .false.
      collective_end   = .false.
    end if

    if (collective_sync) then
      call mpi_scan(MPI_IN_PLACE,dat,1,&
           & psb_mpi_r_dpk_,mpi_sum,icomm,minfo)
    else if (collective_start) then
      call mpi_iscan(MPI_IN_PLACE,dat,1,&
           & psb_mpi_r_dpk_,mpi_sum,icomm,request,minfo)
    else if (collective_end) then
      call mpi_wait(request,status,minfo)
    end if
#endif
  end subroutine psb_dscan_sums

  !
  ! Exclusive prefix sum (mpi_exscan with mpi_sum) of the scalar DAT,
  ! computed in place. With SERIAL_MPI defined DAT is set to dzero.
  ! NOTE(review): MPI leaves the MPI_Exscan result on the first process
  ! undefined; callers expecting dzero there (as the serial branch
  ! returns) should confirm this is handled.
  !
  subroutine psb_dexscan_sums(ctxt,dat,mode,request)
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    real(psb_dpk_), intent(inout)              :: dat
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_ipk_) :: iam, np
    integer(psb_mpk_) :: minfo
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    icomm = psb_get_mpi_comm(ctxt)

    if (present(mode)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
      if (.not.present(request)) then
        collective_sync  = .true.
        collective_start = .false.
        collective_end   = .false.
      end if
    else
      collective_sync  = .true.
      collective_start = .false.
      collective_end   = .false.
    end if

    if (collective_sync) then
      call mpi_exscan(MPI_IN_PLACE,dat,1,&
           & psb_mpi_r_dpk_,mpi_sum,icomm,minfo)
    else if (collective_start) then
      call mpi_iexscan(MPI_IN_PLACE,dat,1,&
           & psb_mpi_r_dpk_,mpi_sum,icomm,request,minfo)
    else if (collective_end) then
      call mpi_wait(request,status,minfo)
    end if
#else
    dat = dzero
#endif
  end subroutine psb_dexscan_sums

  !
  ! Inclusive prefix sum of the rank-1 array DAT (element by element),
  ! computed in place. With SERIAL_MPI defined DAT is left unchanged.
  !
  subroutine psb_dscan_sumv(ctxt,dat,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    real(psb_dpk_), intent(inout)              :: dat(:)
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_ipk_) :: iam, np
    integer(psb_mpk_) :: minfo
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    icomm = psb_get_mpi_comm(ctxt)

    if (present(mode)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
      if (.not.present(request)) then
        collective_sync  = .true.
        collective_start = .false.
        collective_end   = .false.
      end if
    else
      collective_sync  = .true.
      collective_start = .false.
      collective_end   = .false.
    end if

    ! The MPI error argument must be of the MPI integer kind, hence
    ! minfo (psb_mpk_) in every branch.
    if (collective_sync) then
      call mpi_scan(MPI_IN_PLACE,dat,size(dat),&
           & psb_mpi_r_dpk_,mpi_sum,icomm,minfo)
    else if (collective_start) then
      call mpi_iscan(MPI_IN_PLACE,dat,size(dat),&
           & psb_mpi_r_dpk_,mpi_sum,icomm,request,minfo)
    else if (collective_end) then
      call mpi_wait(request,status,minfo)
    end if
#endif
  end subroutine psb_dscan_sumv

  !
  ! Exclusive prefix sum of the rank-1 array DAT (element by element),
  ! computed in place. With SERIAL_MPI defined DAT is set to dzero.
  ! NOTE(review): as for the scalar version, MPI leaves the result on
  ! the first process undefined.
  !
  subroutine psb_dexscan_sumv(ctxt,dat,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    real(psb_dpk_), intent(inout)              :: dat(:)
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_ipk_) :: iam, np
    integer(psb_mpk_) :: minfo
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    icomm = psb_get_mpi_comm(ctxt)

    if (present(mode)) then
      collective_sync  = .false.
      collective_start = iand(mode,psb_collective_start_) /= 0
      collective_end   = iand(mode,psb_collective_end_) /= 0
      if (.not.present(request)) then
        collective_sync  = .true.
        collective_start = .false.
        collective_end   = .false.
      end if
    else
      collective_sync  = .true.
      collective_start = .false.
      collective_end   = .false.
    end if

    ! The MPI error argument must be of the MPI integer kind, hence
    ! minfo (psb_mpk_) in every branch.
    if (collective_sync) then
      call mpi_exscan(MPI_IN_PLACE,dat,size(dat),&
           & psb_mpi_r_dpk_,mpi_sum,icomm,minfo)
    else if (collective_start) then
      call mpi_iexscan(MPI_IN_PLACE,dat,size(dat),&
           & psb_mpi_r_dpk_,mpi_sum,icomm,request,minfo)
    else if (collective_end) then
      call mpi_wait(request,status,minfo)
    end if
#else
    dat = dzero
#endif
  end subroutine psb_dexscan_sumv

  !
  ! Simple all-to-all-v exchange built on psb_snd/psb_rcv.
  ! For every process ip (0-based) with sdsz(ip+1) > 0 the section
  ! valsnd(bsdindx(ip+1)+1 : bsdindx(ip+1)+sdsz(ip+1)) is sent to ip;
  ! then, for every ip with rvsz(ip+1) > 0, data from ip is received
  ! into valrcv(brvindx(ip+1)+1 : brvindx(ip+1)+rvsz(ip+1)).
  !
  !   info - psb_success_ on normal completion; an error code when any
  !          of the four index/size arrays is shorter than np.
  !
  subroutine psb_d_simple_a2av(valsnd,sdsz,bsdindx,&
       & valrcv,rvsz,brvindx,ctxt,info)
    use psi_d_p2p_mod
    implicit none
    real(psb_dpk_), intent(in)      :: valsnd(:)
    real(psb_dpk_), intent(out)     :: valrcv(:)
    integer(psb_mpk_), intent(in)   :: bsdindx(:), brvindx(:), sdsz(:), rvsz(:)
    type(psb_ctxt_type), intent(in) :: ctxt
    integer(psb_ipk_), intent(out)  :: info
    integer(psb_ipk_) :: iam, np, ip, idx, sz

    info = psb_success_
    call psb_info(ctxt,iam,np)

    ! NOTE(review): the text of this guard and of the loop header that
    ! follows was damaged in the file; it has been restored from the
    ! surviving statements. Confirm the error code against the project
    ! history.
    if (min(size(bsdindx),size(brvindx),size(sdsz),size(rvsz)) < np) then
      info = psb_err_internal_error_
      return
    end if

    do ip = 0, np-1
      sz = sdsz(ip+1)
      if (sz > 0) then
        idx = bsdindx(ip+1)
        call psb_snd(ctxt,valsnd(idx+1:idx+sz),ip)
      end if
    end do

    do ip = 0, np-1
      sz = rvsz(ip+1)
      if (sz > 0) then
        idx = brvindx(ip+1)
        call psb_rcv(ctxt,valrcv(idx+1:idx+sz),ip)
      end if
    end do
  end subroutine psb_d_simple_a2av

  !
  ! All-to-all-v exchange of (value, row index, column index) triads
  ! with psb_mpk_ indices. Receives are posted first with mpi_irecv,
  ! then the matching blocking sends are issued, then all receives are
  ! waited for. Offsets and sizes are used as in psb_d_simple_a2av.
  ! The two index messages share the tag psb_int_swap_tag and are
  ! posted/sent in the same order (ia, then ja) on both sides.
  !
  !   info - psb_success_ on normal completion; an error code when any
  !          of the four index/size arrays is shorter than np.
  !
  subroutine psb_d_m_simple_triad_a2av(valsnd,iasnd,jasnd,sdsz,bsdindx,&
       & valrcv,iarcv,jarcv,rvsz,brvindx,ctxt,info)
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    real(psb_dpk_), intent(in)      :: valsnd(:)
    integer(psb_mpk_), intent(in)   :: iasnd(:), jasnd(:)
    real(psb_dpk_), intent(out)     :: valrcv(:)
    integer(psb_mpk_), intent(out)  :: iarcv(:), jarcv(:)
    integer(psb_mpk_), intent(in)   :: bsdindx(:), brvindx(:), sdsz(:), rvsz(:)
    type(psb_ctxt_type), intent(in) :: ctxt
    integer(psb_ipk_), intent(out)  :: info

    !Local variables
    integer(psb_ipk_) :: iam, np, ip
    ! Counts/offsets come from psb_mpk_ arrays and are passed to MPI,
    ! so they are kept in the MPI integer kind.
    integer(psb_mpk_) :: idx, sz
    integer(psb_mpk_) :: p2ptag, p2pstat(mpi_status_size), iret, icomm
    integer(psb_mpk_), allocatable :: prcid(:), rvhd(:,:)

    info = psb_success_
    call psb_info(ctxt,iam,np)
    icomm = psb_get_mpi_comm(ctxt)

    ! NOTE(review): the guard, the allocation of prcid/rvhd and the
    ! header of the first loop were damaged in the file; they have been
    ! restored from the surviving statements (prcid is tested for < 0
    ! below, rvhd is indexed (ip+1,1:3)). Confirm against the project
    ! history.
    if (min(size(bsdindx),size(brvindx),size(sdsz),size(rvsz)) < np) then
      info = psb_err_internal_error_
      return
    end if
    allocate(prcid(np),rvhd(np,3))
    prcid = -1

    ! Post all receives.
    do ip = 0, np-1
      sz = rvsz(ip+1)
      if (sz > 0) then
        prcid(ip+1) = psb_get_mpi_rank(ctxt,ip)
        idx = brvindx(ip+1)
        p2ptag = psb_double_tag
        call mpi_irecv(valrcv(idx+1:idx+sz),sz,&
             & psb_mpi_r_dpk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,1),iret)
        p2ptag = psb_int_swap_tag
        call mpi_irecv(iarcv(idx+1:idx+sz),sz,&
             & psb_mpi_mpk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,2),iret)
        call mpi_irecv(jarcv(idx+1:idx+sz),sz,&
             & psb_mpi_mpk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,3),iret)
      end if
    end do

    ! Issue the sends.
    do ip = 0, np-1
      sz = sdsz(ip+1)
      if (sz > 0) then
        ! Rank not yet looked up if nothing is received from ip.
        if (prcid(ip+1)<0) prcid(ip+1) = psb_get_mpi_rank(ctxt,ip)
        idx = bsdindx(ip+1)
        p2ptag = psb_double_tag
        call mpi_send(valsnd(idx+1:idx+sz),sz,&
             & psb_mpi_r_dpk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
        p2ptag = psb_int_swap_tag
        call mpi_send(iasnd(idx+1:idx+sz),sz,&
             & psb_mpi_mpk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
        call mpi_send(jasnd(idx+1:idx+sz),sz,&
             & psb_mpi_mpk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
      end if
    end do

    ! Complete the receives.
    do ip = 0, np-1
      sz = rvsz(ip+1)
      if (sz > 0) then
        call mpi_wait(rvhd(ip+1,1),p2pstat,iret)
        call mpi_wait(rvhd(ip+1,2),p2pstat,iret)
        call mpi_wait(rvhd(ip+1,3),p2pstat,iret)
      end if
    end do
  end subroutine psb_d_m_simple_triad_a2av

  !
  ! Same exchange as psb_d_m_simple_triad_a2av, for psb_epk_ indices
  ! (transferred with the psb_mpi_epk_ datatype).
  !
  !   info - psb_success_ on normal completion; an error code when any
  !          of the four index/size arrays is shorter than np.
  !
  subroutine psb_d_e_simple_triad_a2av(valsnd,iasnd,jasnd,sdsz,bsdindx,&
       & valrcv,iarcv,jarcv,rvsz,brvindx,ctxt,info)
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    real(psb_dpk_), intent(in)      :: valsnd(:)
    integer(psb_epk_), intent(in)   :: iasnd(:), jasnd(:)
    real(psb_dpk_), intent(out)     :: valrcv(:)
    integer(psb_epk_), intent(out)  :: iarcv(:), jarcv(:)
    integer(psb_mpk_), intent(in)   :: bsdindx(:), brvindx(:), sdsz(:), rvsz(:)
    type(psb_ctxt_type), intent(in) :: ctxt
    integer(psb_ipk_), intent(out)  :: info

    !Local variables
    integer(psb_ipk_) :: iam, np, ip
    ! Counts/offsets come from psb_mpk_ arrays and are passed to MPI,
    ! so they are kept in the MPI integer kind.
    integer(psb_mpk_) :: idx, sz
    integer(psb_mpk_) :: p2ptag, p2pstat(mpi_status_size), iret, icomm
    integer(psb_mpk_), allocatable :: prcid(:), rvhd(:,:)

    info = psb_success_
    call psb_info(ctxt,iam,np)
    icomm = psb_get_mpi_comm(ctxt)

    ! NOTE(review): the guard, the allocation of prcid/rvhd and the
    ! header of the first loop were damaged in the file; they have been
    ! restored from the surviving statements (prcid is tested for < 0
    ! below, rvhd is indexed (ip+1,1:3)). Confirm against the project
    ! history.
    if (min(size(bsdindx),size(brvindx),size(sdsz),size(rvsz)) < np) then
      info = psb_err_internal_error_
      return
    end if
    allocate(prcid(np),rvhd(np,3))
    prcid = -1

    ! Post all receives.
    do ip = 0, np-1
      sz = rvsz(ip+1)
      if (sz > 0) then
        prcid(ip+1) = psb_get_mpi_rank(ctxt,ip)
        idx = brvindx(ip+1)
        p2ptag = psb_double_tag
        call mpi_irecv(valrcv(idx+1:idx+sz),sz,&
             & psb_mpi_r_dpk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,1),iret)
        p2ptag = psb_int_swap_tag
        call mpi_irecv(iarcv(idx+1:idx+sz),sz,&
             & psb_mpi_epk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,2),iret)
        call mpi_irecv(jarcv(idx+1:idx+sz),sz,&
             & psb_mpi_epk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,3),iret)
      end if
    end do

    ! Issue the sends.
    do ip = 0, np-1
      sz = sdsz(ip+1)
      if (sz > 0) then
        ! Rank not yet looked up if nothing is received from ip.
        if (prcid(ip+1)<0) prcid(ip+1) = psb_get_mpi_rank(ctxt,ip)
        idx = bsdindx(ip+1)
        p2ptag = psb_double_tag
        call mpi_send(valsnd(idx+1:idx+sz),sz,&
             & psb_mpi_r_dpk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
        p2ptag = psb_int_swap_tag
        call mpi_send(iasnd(idx+1:idx+sz),sz,&
             & psb_mpi_epk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
        call mpi_send(jasnd(idx+1:idx+sz),sz,&
             & psb_mpi_epk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
      end if
    end do

    ! Complete the receives.
    do ip = 0, np-1
      sz = rvsz(ip+1)
      if (sz > 0) then
        call mpi_wait(rvhd(ip+1,1),p2pstat,iret)
        call mpi_wait(rvhd(ip+1,2),p2pstat,iret)
        call mpi_wait(rvhd(ip+1,3),p2pstat,iret)
      end if
    end do
  end subroutine psb_d_e_simple_triad_a2av

end module psi_d_collective_mod