! ! Parallel Sparse BLAS version 3.5 ! (C) Copyright 2006-2018 ! Salvatore Filippone ! Alfredo Buttari ! ! Redistribution and use in source and binary forms, with or without ! modification, are permitted provided that the following conditions ! are met: ! 1. Redistributions of source code must retain the above copyright ! notice, this list of conditions and the following disclaimer. ! 2. Redistributions in binary form must reproduce the above copyright ! notice, this list of conditions, and the following disclaimer in the ! documentation and/or other materials provided with the distribution. ! 3. The name of the PSBLAS group or the names of its contributors may ! not be used to endorse or promote products derived from this ! software without specific written permission. ! ! THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS ! ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED ! TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR ! PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE PSBLAS GROUP OR ITS CONTRIBUTORS ! BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR ! CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF ! SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS ! INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN ! CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ! ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE ! POSSIBILITY OF SUCH DAMAGE. ! ! 
!
! Module psi_c_collective_mod
!
! Collective communication wrappers for single precision complex data
! (complex(psb_spk_)): reductions (sum, amx, amn), broadcast, inclusive
! and exclusive prefix sums, plus simple all-to-all-v exchanges.
!
! Conventions shared by the reduction / broadcast / scan wrappers:
!   ctxt     communication context; the MPI communicator is obtained
!            through psb_get_mpi_comm(ctxt).
!   dat      data buffer, updated in place.
!   root     (reductions, broadcast) rank of the root process. When
!            absent, reductions deliver the result to every process
!            (all-reduce) and broadcasts use psb_root_.
!   mode     optional bit mask tested against psb_collective_start_
!            and psb_collective_end_. It is honoured only when REQUEST
!            is also present; otherwise the call is blocking.
!   request  MPI request handle used by the non-blocking variants:
!            set by the "start" phase, waited upon by the "end" phase.
!
module psi_c_collective_mod
  use psi_penv_mod
  use psb_desc_const_mod
  implicit none

  interface psb_sum
    module procedure psb_csums, psb_csumv, psb_csumm
  end interface

  interface psb_amx
    module procedure psb_camxs, psb_camxv, psb_camxm
  end interface

  interface psb_amn
    module procedure psb_camns, psb_camnv, psb_camnm
  end interface

  interface psb_bcast
    module procedure psb_cbcasts, psb_cbcastv, psb_cbcastm
  end interface psb_bcast

  interface psb_scan_sum
    module procedure psb_cscan_sums, psb_cscan_sumv
  end interface psb_scan_sum

  interface psb_exscan_sum
    module procedure psb_cexscan_sums, psb_cexscan_sumv
  end interface psb_exscan_sum

  interface psb_simple_a2av
    module procedure psb_c_simple_a2av
  end interface psb_simple_a2av

  interface psb_simple_triad_a2av
    module procedure psb_c_e_simple_triad_a2av, psb_c_m_simple_triad_a2av
  end interface psb_simple_triad_a2av

  ! Internal helper, not part of the module's public interface.
  private :: psi_c_collective_flags

contains

  !
  ! Decode the optional MODE argument of a collective wrapper.
  !
  !   has_request  .true. when the caller supplied a REQUEST argument.
  !   do_sync      perform the blocking collective.
  !   do_start     start the non-blocking collective.
  !   do_end       wait for a previously started collective.
  !   mode         bit mask; may be absent.
  !
  ! A blocking operation is selected whenever MODE or REQUEST is
  ! missing, since a non-blocking phase cannot work without a request.
  !
  subroutine psi_c_collective_flags(has_request,do_sync,do_start,do_end,mode)
    implicit none
    logical, intent(in)                     :: has_request
    logical, intent(out)                    :: do_sync, do_start, do_end
    integer(psb_ipk_), intent(in), optional :: mode

    do_sync  = .true.
    do_start = .false.
    do_end   = .false.
    if (present(mode) .and. has_request) then
      do_sync  = .false.
      do_start = iand(mode,psb_collective_start_) /= 0
      do_end   = iand(mode,psb_collective_end_) /= 0
    end if
  end subroutine psi_c_collective_flags

  ! !!!!!!!!!!!!!!!!!!!!!!
  !
  ! Reduction operations
  !
  ! !!!!!!!!!!!!!!!!!!!!!!

  !
  ! SUM
  !
  ! In every rooted reduction below MPI_IN_PLACE is used only on the
  ! root process, as required by the MPI standard; the other processes
  ! send DAT and pass a scratch receive buffer, which MPI ignores there.
  !

  ! Sum reduction of a scalar.
  subroutine psb_csums(ctxt,dat,root,mode,request)
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    complex(psb_spk_) :: dat_
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = -1
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      if (root_ == -1) then
        call mpi_allreduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_sum,icomm,info)
      else if (iam == root_) then
        call mpi_reduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,info)
      else
        call mpi_reduce(dat,dat_,1,&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,info)
      end if
    else if (collective_start) then
      if (root_ == -1) then
        call mpi_iallreduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_sum,icomm,request,info)
      else if (iam == root_) then
        call mpi_ireduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,request,info)
      else
        call mpi_ireduce(dat,dat_,1,&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,request,info)
      end if
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_csums

  ! Element-wise sum reduction of a rank-1 array.
  subroutine psb_csumv(ctxt,dat,root,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat(:)
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    complex(psb_spk_), allocatable :: dat_(:)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = -1
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      if (root_ == -1) then
        call mpi_allreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,icomm,info)
      else if (iam == root_) then
        call mpi_reduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,info)
      else
        allocate(dat_(size(dat)))
        call mpi_reduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,info)
      end if
    else if (collective_start) then
      if (root_ == -1) then
        call mpi_iallreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,icomm,request,info)
      else if (iam == root_) then
        call mpi_ireduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,request,info)
      else
        ! The receive buffer is not significant on non-root processes.
        allocate(dat_(size(dat)))
        call mpi_ireduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,request,info)
      end if
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_csumv

  ! Element-wise sum reduction of a rank-2 array.
  subroutine psb_csumm(ctxt,dat,root,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat(:,:)
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    complex(psb_spk_), allocatable :: dat_(:,:)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = -1
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      if (root_ == -1) then
        call mpi_allreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,icomm,info)
      else if (iam == root_) then
        call mpi_reduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,info)
      else
        allocate(dat_(size(dat,1),size(dat,2)))
        call mpi_reduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,info)
      end if
    else if (collective_start) then
      if (root_ == -1) then
        call mpi_iallreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,icomm,request,info)
      else if (iam == root_) then
        call mpi_ireduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,request,info)
      else
        ! The receive buffer is not significant on non-root processes.
        allocate(dat_(size(dat,1),size(dat,2)))
        call mpi_ireduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_sum,root_,icomm,request,info)
      end if
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_csumm

  !
  ! AMX: Maximum Absolute Value
  !
  ! The reduction operator is mpi_camx_op, which is defined outside
  ! this module.
  !

  ! AMX reduction of a scalar.
  subroutine psb_camxs(ctxt,dat,root,mode,request)
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    complex(psb_spk_) :: dat_
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = -1
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      if (root_ == -1) then
        call mpi_allreduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_camx_op,icomm,info)
      else if (iam == root_) then
        call mpi_reduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,info)
      else
        call mpi_reduce(dat,dat_,1,&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,info)
      end if
    else if (collective_start) then
      if (root_ == -1) then
        call mpi_iallreduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_camx_op,icomm,request,info)
      else if (iam == root_) then
        call mpi_ireduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,request,info)
      else
        call mpi_ireduce(dat,dat_,1,&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,request,info)
      end if
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_camxs

  ! Element-wise AMX reduction of a rank-1 array.
  subroutine psb_camxv(ctxt,dat,root,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat(:)
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    complex(psb_spk_), allocatable :: dat_(:)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = -1
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      if (root_ == -1) then
        call mpi_allreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,icomm,info)
      else if (iam == root_) then
        call mpi_reduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,info)
      else
        allocate(dat_(size(dat)))
        call mpi_reduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,info)
      end if
    else if (collective_start) then
      if (root_ == -1) then
        call mpi_iallreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,icomm,request,info)
      else if (iam == root_) then
        call mpi_ireduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,request,info)
      else
        ! The receive buffer is not significant on non-root processes.
        allocate(dat_(size(dat)))
        call mpi_ireduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,request,info)
      end if
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_camxv

  ! Element-wise AMX reduction of a rank-2 array.
  subroutine psb_camxm(ctxt,dat,root,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat(:,:)
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    complex(psb_spk_), allocatable :: dat_(:,:)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = -1
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      if (root_ == -1) then
        call mpi_allreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,icomm,info)
      else if (iam == root_) then
        call mpi_reduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,info)
      else
        allocate(dat_(size(dat,1),size(dat,2)))
        call mpi_reduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,info)
      end if
    else if (collective_start) then
      if (root_ == -1) then
        call mpi_iallreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,icomm,request,info)
      else if (iam == root_) then
        call mpi_ireduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,request,info)
      else
        ! The receive buffer is not significant on non-root processes.
        allocate(dat_(size(dat,1),size(dat,2)))
        call mpi_ireduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_camx_op,root_,icomm,request,info)
      end if
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_camxm

  !
  ! AMN: Minimum Absolute Value
  !
  ! The reduction operator is mpi_camn_op, which is defined outside
  ! this module.
  !

  ! AMN reduction of a scalar.
  subroutine psb_camns(ctxt,dat,root,mode,request)
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    complex(psb_spk_) :: dat_
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = -1
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      if (root_ == -1) then
        call mpi_allreduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_camn_op,icomm,info)
      else if (iam == root_) then
        call mpi_reduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,info)
      else
        call mpi_reduce(dat,dat_,1,&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,info)
      end if
    else if (collective_start) then
      if (root_ == -1) then
        call mpi_iallreduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_camn_op,icomm,request,info)
      else if (iam == root_) then
        call mpi_ireduce(MPI_IN_PLACE,dat,1,&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,request,info)
      else
        call mpi_ireduce(dat,dat_,1,&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,request,info)
      end if
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_camns

  ! Element-wise AMN reduction of a rank-1 array.
  subroutine psb_camnv(ctxt,dat,root,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat(:)
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    complex(psb_spk_), allocatable :: dat_(:)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = -1
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      if (root_ == -1) then
        call mpi_allreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,icomm,info)
      else if (iam == root_) then
        call mpi_reduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,info)
      else
        allocate(dat_(size(dat)))
        call mpi_reduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,info)
      end if
    else if (collective_start) then
      if (root_ == -1) then
        call mpi_iallreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,icomm,request,info)
      else if (iam == root_) then
        call mpi_ireduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,request,info)
      else
        ! The receive buffer is not significant on non-root processes.
        allocate(dat_(size(dat)))
        call mpi_ireduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,request,info)
      end if
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_camnv

  ! Element-wise AMN reduction of a rank-2 array.
  subroutine psb_camnm(ctxt,dat,root,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat(:,:)
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    complex(psb_spk_), allocatable :: dat_(:,:)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = -1
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      if (root_ == -1) then
        call mpi_allreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,icomm,info)
      else if (iam == root_) then
        call mpi_reduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,info)
      else
        allocate(dat_(size(dat,1),size(dat,2)))
        call mpi_reduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,info)
      end if
    else if (collective_start) then
      if (root_ == -1) then
        call mpi_iallreduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,icomm,request,info)
      else if (iam == root_) then
        call mpi_ireduce(MPI_IN_PLACE,dat,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,request,info)
      else
        ! The receive buffer is not significant on non-root processes.
        allocate(dat_(size(dat,1),size(dat,2)))
        call mpi_ireduce(dat,dat_,size(dat),&
             & psb_mpi_c_spk_,mpi_camn_op,root_,icomm,request,info)
      end if
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_camnm

  !
  ! BCAST Broadcast
  !
  ! When ROOT is absent the broadcast originates from psb_root_.
  !

  ! Broadcast of a scalar.
  subroutine psb_cbcasts(ctxt,dat,root,mode,request)
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = psb_root_
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      call mpi_bcast(dat,1,psb_mpi_c_spk_,root_,icomm,info)
    else if (collective_start) then
      call mpi_ibcast(dat,1,psb_mpi_c_spk_,root_,icomm,request,info)
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_cbcasts

  ! Broadcast of a rank-1 array.
  subroutine psb_cbcastv(ctxt,dat,root,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat(:)
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = psb_root_
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      call mpi_bcast(dat,size(dat),psb_mpi_c_spk_,root_,icomm,info)
    else if (collective_start) then
      call mpi_ibcast(dat,size(dat),psb_mpi_c_spk_,root_,icomm,request,info)
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_cbcastv

  ! Broadcast of a rank-2 array.
  subroutine psb_cbcastm(ctxt,dat,root,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat(:,:)
    integer(psb_mpk_), intent(in), optional    :: root
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_mpk_) :: root_
    integer(psb_mpk_) :: iam, np, info
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    if (present(root)) then
      root_ = root
    else
      root_ = psb_root_
    end if
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      call mpi_bcast(dat,size(dat),psb_mpi_c_spk_,root_,icomm,info)
    else if (collective_start) then
      call mpi_ibcast(dat,size(dat),psb_mpi_c_spk_,root_,icomm,request,info)
    else if (collective_end) then
      call mpi_wait(request,status,info)
    end if
#endif
  end subroutine psb_cbcastm

  ! !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
  !
  ! SCAN
  !
  ! !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
  !
  ! The MPI error code is always received in MINFO, an integer of
  ! kind psb_mpk_, the same kind used for the other MPI arguments.
  !
  ! NOTE(review): in the exclusive scans the MPI build leaves DAT on
  ! process 0 as returned by MPI, while the SERIAL_MPI build returns
  ! czero; confirm callers do not rely on DAT on process 0.
  !

  ! Inclusive prefix sum of a scalar.
  subroutine psb_cscan_sums(ctxt,dat,mode,request)
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_ipk_) :: iam, np
    integer(psb_mpk_) :: minfo
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      call mpi_scan(MPI_IN_PLACE,dat,1,&
           & psb_mpi_c_spk_,mpi_sum,icomm,minfo)
    else if (collective_start) then
      call mpi_iscan(MPI_IN_PLACE,dat,1,&
           & psb_mpi_c_spk_,mpi_sum,icomm,request,minfo)
    else if (collective_end) then
      call mpi_wait(request,status,minfo)
    end if
#endif
  end subroutine psb_cscan_sums

  ! Exclusive prefix sum of a scalar.
  subroutine psb_cexscan_sums(ctxt,dat,mode,request)
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_ipk_) :: iam, np
    integer(psb_mpk_) :: minfo
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      call mpi_exscan(MPI_IN_PLACE,dat,1,&
           & psb_mpi_c_spk_,mpi_sum,icomm,minfo)
    else if (collective_start) then
      call mpi_iexscan(MPI_IN_PLACE,dat,1,&
           & psb_mpi_c_spk_,mpi_sum,icomm,request,minfo)
    else if (collective_end) then
      call mpi_wait(request,status,minfo)
    end if
#else
    dat = czero
#endif
  end subroutine psb_cexscan_sums

  ! Element-wise inclusive prefix sum of a rank-1 array.
  subroutine psb_cscan_sumv(ctxt,dat,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat(:)
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_ipk_) :: iam, np
    integer(psb_mpk_) :: minfo
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      call mpi_scan(MPI_IN_PLACE,dat,size(dat),&
           & psb_mpi_c_spk_,mpi_sum,icomm,minfo)
    else if (collective_start) then
      call mpi_iscan(MPI_IN_PLACE,dat,size(dat),&
           & psb_mpi_c_spk_,mpi_sum,icomm,request,minfo)
    else if (collective_end) then
      call mpi_wait(request,status,minfo)
    end if
#endif
  end subroutine psb_cscan_sumv

  ! Element-wise exclusive prefix sum of a rank-1 array.
  subroutine psb_cexscan_sumv(ctxt,dat,mode,request)
    use psb_realloc_mod
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    type(psb_ctxt_type), intent(in)            :: ctxt
    complex(psb_spk_), intent(inout)           :: dat(:)
    integer(psb_ipk_), intent(in), optional    :: mode
    integer(psb_mpk_), intent(inout), optional :: request
    integer(psb_ipk_) :: iam, np
    integer(psb_mpk_) :: minfo
    integer(psb_mpk_) :: icomm
    integer(psb_mpk_) :: status(mpi_status_size)
    logical :: collective_start, collective_end, collective_sync

#if !defined(SERIAL_MPI)
    call psb_info(ctxt,iam,np)
    icomm = psb_get_mpi_comm(ctxt)
    call psi_c_collective_flags(present(request),&
         & collective_sync,collective_start,collective_end,mode)

    if (collective_sync) then
      call mpi_exscan(MPI_IN_PLACE,dat,size(dat),&
           & psb_mpi_c_spk_,mpi_sum,icomm,minfo)
    else if (collective_start) then
      call mpi_iexscan(MPI_IN_PLACE,dat,size(dat),&
           & psb_mpi_c_spk_,mpi_sum,icomm,request,minfo)
    else if (collective_end) then
      call mpi_wait(request,status,minfo)
    end if
#else
    dat = czero
#endif
  end subroutine psb_cexscan_sumv

  ! !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
  !
  ! Simple all-to-all-v exchanges
  !
  ! !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
  !
  ! For process IP (0-based) the data to send are
  ! valsnd(bsdindx(ip+1)+1 : bsdindx(ip+1)+sdsz(ip+1)) and the data
  ! received are stored in
  ! valrcv(brvindx(ip+1)+1 : brvindx(ip+1)+rvsz(ip+1)).
  !
  ! NOTE(review): in the text this module was recovered from, the code
  ! between the size check and the first loop body of each routine was
  ! lost. It has been rebuilt from what the remaining statements
  ! require; the error code psb_err_invalid_input_ and the success
  ! code psb_success_ are assumed to be available through the used
  ! modules - confirm against the reference sources.
  !

  !
  ! Exchange values only, through psb_snd / psb_rcv.
  !   info  psb_success_ on success, psb_err_invalid_input_ when any of
  !         the size/index arrays has fewer than NP entries.
  !
  subroutine psb_c_simple_a2av(valsnd,sdsz,bsdindx,&
       & valrcv,rvsz,brvindx,ctxt,info)
    use psi_c_p2p_mod
    implicit none
    complex(psb_spk_), intent(in)   :: valsnd(:)
    complex(psb_spk_), intent(out)  :: valrcv(:)
    integer(psb_mpk_), intent(in)   :: bsdindx(:), brvindx(:), sdsz(:), rvsz(:)
    type(psb_ctxt_type), intent(in) :: ctxt
    integer(psb_ipk_), intent(out)  :: info
    integer(psb_ipk_) :: iam, np, ip, idx, sz

    info = psb_success_
    call psb_info(ctxt,iam,np)

    if (min(size(bsdindx),size(brvindx),size(sdsz),size(rvsz)) < np) then
      info = psb_err_invalid_input_
      return
    end if

    ! Send phase.
    do ip = 0, np-1
      sz = sdsz(ip+1)
      if (sz > 0) then
        idx = bsdindx(ip+1)
        call psb_snd(ctxt,valsnd(idx+1:idx+sz),ip)
      end if
    end do

    ! Receive phase.
    do ip = 0, np-1
      sz = rvsz(ip+1)
      if (sz > 0) then
        idx = brvindx(ip+1)
        call psb_rcv(ctxt,valrcv(idx+1:idx+sz),ip)
      end if
    end do

  end subroutine psb_c_simple_a2av

  !
  ! Exchange (value, row index, column index) triads; indices of kind
  ! psb_mpk_. Receives are posted first (non-blocking), then blocking
  ! sends are issued, then the receives are completed.
  !   info  psb_success_ on success, psb_err_invalid_input_ when any of
  !         the size/index arrays has fewer than NP entries.
  !
  subroutine psb_c_m_simple_triad_a2av(valsnd,iasnd,jasnd,sdsz,bsdindx,&
       & valrcv,iarcv,jarcv,rvsz,brvindx,ctxt,info)
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    complex(psb_spk_), intent(in)   :: valsnd(:)
    integer(psb_mpk_), intent(in)   :: iasnd(:), jasnd(:)
    complex(psb_spk_), intent(out)  :: valrcv(:)
    integer(psb_mpk_), intent(out)  :: iarcv(:), jarcv(:)
    integer(psb_mpk_), intent(in)   :: bsdindx(:), brvindx(:), sdsz(:), rvsz(:)
    type(psb_ctxt_type), intent(in) :: ctxt
    integer(psb_ipk_), intent(out)  :: info

    ! Local variables
    integer(psb_ipk_) :: iam, np, ip, idx, sz
    integer(psb_mpk_) :: p2ptag, p2pstat(mpi_status_size), iret, icomm
    integer(psb_mpk_), allocatable :: prcid(:), rvhd(:,:)

    info = psb_success_
    call psb_info(ctxt,iam,np)

    icomm = psb_get_mpi_comm(ctxt)

    if (min(size(bsdindx),size(brvindx),size(sdsz),size(rvsz)) < np) then
      info = psb_err_invalid_input_
      return
    end if

    ! prcid caches the MPI rank of each process (-1: not yet looked up);
    ! rvhd holds the three receive requests posted per process.
    allocate(prcid(np),rvhd(np,3))
    prcid = -1

    ! Post the receives.
    do ip = 0, np-1
      sz = rvsz(ip+1)
      if (sz > 0) then
        prcid(ip+1) = psb_get_mpi_rank(ctxt,ip)
        idx = brvindx(ip+1)
        p2ptag = psb_complex_tag
        call mpi_irecv(valrcv(idx+1:idx+sz),sz,&
             & psb_mpi_c_spk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,1),iret)
        p2ptag = psb_int_swap_tag
        call mpi_irecv(iarcv(idx+1:idx+sz),sz,&
             & psb_mpi_mpk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,2),iret)
        call mpi_irecv(jarcv(idx+1:idx+sz),sz,&
             & psb_mpi_mpk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,3),iret)
      end if
    end do

    ! Issue the sends.
    do ip = 0, np-1
      sz = sdsz(ip+1)
      if (sz > 0) then
        if (prcid(ip+1)<0) prcid(ip+1) = psb_get_mpi_rank(ctxt,ip)
        idx = bsdindx(ip+1)
        p2ptag = psb_complex_tag
        call mpi_send(valsnd(idx+1:idx+sz),sz,&
             & psb_mpi_c_spk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
        p2ptag = psb_int_swap_tag
        call mpi_send(iasnd(idx+1:idx+sz),sz,&
             & psb_mpi_mpk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
        call mpi_send(jasnd(idx+1:idx+sz),sz,&
             & psb_mpi_mpk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
      end if
    end do

    ! Complete the receives.
    do ip = 0, np-1
      sz = rvsz(ip+1)
      if (sz > 0) then
        call mpi_wait(rvhd(ip+1,1),p2pstat,iret)
        call mpi_wait(rvhd(ip+1,2),p2pstat,iret)
        call mpi_wait(rvhd(ip+1,3),p2pstat,iret)
      end if
    end do

  end subroutine psb_c_m_simple_triad_a2av

  !
  ! Exchange (value, row index, column index) triads; indices of kind
  ! psb_epk_. Same protocol as psb_c_m_simple_triad_a2av.
  !   info  psb_success_ on success, psb_err_invalid_input_ when any of
  !         the size/index arrays has fewer than NP entries.
  !
  subroutine psb_c_e_simple_triad_a2av(valsnd,iasnd,jasnd,sdsz,bsdindx,&
       & valrcv,iarcv,jarcv,rvsz,brvindx,ctxt,info)
#ifdef MPI_MOD
    use mpi
#endif
    implicit none
#ifdef MPI_H
    include 'mpif.h'
#endif
    complex(psb_spk_), intent(in)   :: valsnd(:)
    integer(psb_epk_), intent(in)   :: iasnd(:), jasnd(:)
    complex(psb_spk_), intent(out)  :: valrcv(:)
    integer(psb_epk_), intent(out)  :: iarcv(:), jarcv(:)
    integer(psb_mpk_), intent(in)   :: bsdindx(:), brvindx(:), sdsz(:), rvsz(:)
    type(psb_ctxt_type), intent(in) :: ctxt
    integer(psb_ipk_), intent(out)  :: info

    ! Local variables
    integer(psb_ipk_) :: iam, np, ip, idx, sz
    integer(psb_mpk_) :: p2ptag, p2pstat(mpi_status_size), iret, icomm
    integer(psb_mpk_), allocatable :: prcid(:), rvhd(:,:)

    info = psb_success_
    call psb_info(ctxt,iam,np)

    icomm = psb_get_mpi_comm(ctxt)

    if (min(size(bsdindx),size(brvindx),size(sdsz),size(rvsz)) < np) then
      info = psb_err_invalid_input_
      return
    end if

    ! prcid caches the MPI rank of each process (-1: not yet looked up);
    ! rvhd holds the three receive requests posted per process.
    allocate(prcid(np),rvhd(np,3))
    prcid = -1

    ! Post the receives.
    do ip = 0, np-1
      sz = rvsz(ip+1)
      if (sz > 0) then
        prcid(ip+1) = psb_get_mpi_rank(ctxt,ip)
        idx = brvindx(ip+1)
        p2ptag = psb_complex_tag
        call mpi_irecv(valrcv(idx+1:idx+sz),sz,&
             & psb_mpi_c_spk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,1),iret)
        p2ptag = psb_int_swap_tag
        call mpi_irecv(iarcv(idx+1:idx+sz),sz,&
             & psb_mpi_epk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,2),iret)
        call mpi_irecv(jarcv(idx+1:idx+sz),sz,&
             & psb_mpi_epk_,prcid(ip+1),&
             & p2ptag, icomm,rvhd(ip+1,3),iret)
      end if
    end do

    ! Issue the sends.
    do ip = 0, np-1
      sz = sdsz(ip+1)
      if (sz > 0) then
        if (prcid(ip+1)<0) prcid(ip+1) = psb_get_mpi_rank(ctxt,ip)
        idx = bsdindx(ip+1)
        p2ptag = psb_complex_tag
        call mpi_send(valsnd(idx+1:idx+sz),sz,&
             & psb_mpi_c_spk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
        p2ptag = psb_int_swap_tag
        call mpi_send(iasnd(idx+1:idx+sz),sz,&
             & psb_mpi_epk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
        call mpi_send(jasnd(idx+1:idx+sz),sz,&
             & psb_mpi_epk_,prcid(ip+1),&
             & p2ptag, icomm,iret)
      end if
    end do

    ! Complete the receives.
    do ip = 0, np-1
      sz = rvsz(ip+1)
      if (sz > 0) then
        call mpi_wait(rvhd(ip+1,1),p2pstat,iret)
        call mpi_wait(rvhd(ip+1,2),p2pstat,iret)
        call mpi_wait(rvhd(ip+1,3),p2pstat,iret)
      end if
    end do

  end subroutine psb_c_e_simple_triad_a2av

end module psi_c_collective_mod