Fixed in-line docs.

17 years ago · 3297eb7d04
parent 0911703866
commit 3297eb7d04
140 changed files with 990 additions and 197 deletions
--- a/base/comm/psb_dgather.f90
+++ b/base/comm/psb_dgather.f90
@ -33,7 +33,7 @@
 ! Subroutine: psb_dgatherm
 !   This subroutine gathers pieces of a distributed dense matrix into a local one.
 !
-! Parameters:
+! Arguments:
 !   globx     -  real,dimension(:,:).          The local matrix into which gather 
 !                                                the distributed pieces.
 !   locx      -  real,dimension(:,:).          The local piece of the distributed 
@ -204,7 +204,7 @@ end subroutine psb_dgatherm
 ! Subroutine: psb_dgatherv
 !   This subroutine gathers pieces of a distributed dense vector into a local one.
 !
-! Parameters:
+! Arguments:
 !   globx     -  real,dimension(:).            The local vector into which gather the 
 !                                                  distributed pieces.
 !   locx      -  real,dimension(:).            The local piece of the distributed
--- a/base/comm/psb_dhalo.f90
+++ b/base/comm/psb_dhalo.f90
@ -34,7 +34,7 @@
 !   This subroutine performs the exchange of the halo elements in a 
 !   distributed dense matrix between all the processes.
 !
-! Parameters:
+! Arguments:
 !   x         -  real,dimension(:,:).          The local part of the dense matrix.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
 !   info      -  integer.                      Eventually returns an error code.
@ -250,7 +250,7 @@ end subroutine psb_dhalom
 !   This subroutine performs the exchange of the halo elements in a 
 !   distributed dense vector between all the processes.
 !
-! Parameters:
+! Arguments:
 !   x         -  real,dimension(:).            The local part of the dense vector.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
 !   info      -  integer.                      Eventually returns an error code.
--- a/base/comm/psb_dovrl.f90
+++ b/base/comm/psb_dovrl.f90
@ -34,7 +34,7 @@
 !   This subroutine performs the exchange of the overlap elements in a 
 !   distributed dense matrix between all the processes.
 !
-! Parameters:
+! Arguments:
 !   x           -  real,dimension(:,:).         The local part of the dense matrix.
 !   desc_a      -  type(<psb_desc_type>).       The communication descriptor.
 !   info        -  integer.                     A return code.
@ -254,7 +254,7 @@ end subroutine psb_dovrlm
 !   This subroutine performs the exchange of the overlap elements in a 
 !   distributed dense vector between all the processes.
 !
-! Parameters:
+! Arguments:
 !   x           -  real,dimension(:).          The local part of the dense vector.
 !   desc_a      -  type(<psb_desc_type>).        The communication descriptor.
 !   info        -  integer.                      Eventually returns an error code.
--- a/base/comm/psb_dscatter.F90
+++ b/base/comm/psb_dscatter.F90
@ -34,7 +34,7 @@
 !   This subroutine scatters a global matrix locally owned by one process
 !   into pieces that are local to all the processes.
 !
-! Parameters:
+! Arguments:
 !   globx     -  real,dimension(:,:).          The global matrix to scatter.
 !   locx      -  real,dimension(:,:).          The local piece of the distributed matrix.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
@ -263,7 +263,7 @@ end subroutine psb_dscatterm
 !   This subroutine scatters a global vector locally owned by one process
 !   into pieces that are local to all the processes.
 !
-! Parameters:
+! Arguments:
 !   globx     -  real,dimension(:).            The global vector to scatter.
 !   locx      -  real,dimension(:).            The local piece of the distributed vector.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
--- a/base/comm/psb_igather.f90
+++ b/base/comm/psb_igather.f90
@ -33,7 +33,7 @@
 ! Subroutine: psb_igatherm
 !   This subroutine gathers pieces of a distributed dense matrix into a local one.
 !
-! Parameters:
+! Arguments:
 !   globx     -  integer,dimension(:,:).          The local matrix into which gather 
 !                                                the distributed pieces.
 !   locx      -  integer,dimension(:,:).          The local piece of the distributed 
@ -204,7 +204,7 @@ end subroutine psb_igatherm
 ! Subroutine: psb_igatherv
 !   This subroutine gathers pieces of a distributed dense vector into a local one.
 !
-! Parameters:
+! Arguments:
 !   globx     -  integer,dimension(:).            The local vector into which gather the 
 !                                                  distributed pieces.
 !   locx      -  integer,dimension(:).            The local piece of the distributed
--- a/base/comm/psb_ihalo.f90
+++ b/base/comm/psb_ihalo.f90
@ -35,7 +35,7 @@
 !   This subroutine performs the exchange of the halo elements in a 
 !    distributed dense matrix between all the processes.
 !
-! Parameters:
+! Arguments:
 !   x         -  integer,dimension(:,:).       The local part of the dense matrix.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
 !   info      -  integer.                      Eventually returns an error code.
@ -252,7 +252,7 @@ end subroutine psb_ihalom
 !   This subroutine performs the exchange of the halo elements in a 
 !    distributed dense vector between all the processes.
 !
-! Parameters:
+! Arguments:
 !   x         -  integer,dimension(:).         The local part of the dense vector.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
 !   info      -  integer.                      Eventually returns an error code.
--- a/base/comm/psb_iscatter.F90
+++ b/base/comm/psb_iscatter.F90
@ -34,7 +34,7 @@
 !   This subroutine scatters a global matrix locally owned by one process
 !   into pieces that are local to all the processes.
 !
-! Parameters:
+! Arguments:
 !   globx     -  integer,dimension(:,:).          The global matrix to scatter.
 !   locx      -  integer,dimension(:,:).          The local piece of the distributed matrix.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
@ -261,7 +261,7 @@ end subroutine psb_iscatterm
 !   This subroutine scatters a global vector locally owned by one process
 !   into pieces that are local to all the processes.
 !
-! Parameters:
+! Arguments:
 !   globx     -  integer,dimension(:).            The global vector to scatter.
 !   locx      -  integer,dimension(:).            The local piece of the distributed vector.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
--- a/base/comm/psb_zgather.f90
+++ b/base/comm/psb_zgather.f90
@ -33,7 +33,7 @@
 ! Subroutine: psb_zgatherm
 !   This subroutine gathers pieces of a distributed dense matrix into a local one.
 !
-! Parameters:
+! Arguments:
 !   globx     -  cplx,dimension(:,:).          The local matrix into which gather 
 !                                                  the distributed pieces.
 !   locx      -  cplx,dimension(:,:).          The local piece of the distributed 
@ -206,7 +206,7 @@ end subroutine psb_zgatherm
 ! Subroutine: psb_zgatherv
 !   This subroutine gathers pieces of a distributed dense vector into a local one.
 !
-! Parameters:
+! Arguments:
 !   globx     -  cplx,dimension(:).            The local vector into which gather 
 !                                                  the distributed pieces.
 !   locx      -  cplx,dimension(:).            The local piece of the distributed 
--- a/base/comm/psb_zhalo.f90
+++ b/base/comm/psb_zhalo.f90
@ -34,7 +34,7 @@
 !   This subroutine performs the exchange of the halo elements in a 
 !    distributed dense matrix between all the processes.
 !
-! Parameters:
+! Arguments:
 !   x         -  complex,dimension(:,:).       The local part of the dense matrix.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
 !   info      -  integer.                      Eventually returns an error code.
@ -249,7 +249,7 @@ end subroutine psb_zhalom
 !   This subroutine performs the exchange of the halo elements in a 
 !    distributed dense vector between all the processes.
 !
-! Parameters:
+! Arguments:
 !   x         -  complex,dimension(:).         The local part of the dense vector.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
 !   info      -  integer.                      Eventually returns an error code.
--- a/base/comm/psb_zovrl.f90
+++ b/base/comm/psb_zovrl.f90
@ -34,7 +34,7 @@
 !   This subroutine performs the exchange of the overlap elements in a 
 !    distributed dense matrix between all the processes.
 !
-! Parameters:
+! Arguments:
 !   x           -  complex,dimension(:,:).     The local part of the dense matrix.
 !   desc_a      -  type(<psb_desc_type>).      The communication descriptor.
 !   info        -  integer.                    Returns an output  code.
@ -254,7 +254,7 @@ end subroutine psb_zovrlm
 !   This subroutine performs the exchange of the overlap elements in a 
 !    distributed dense vector between all the processes.
 !
-! Parameters:
+! Arguments:
 !   x           -  complex,dimension(:).       The local part of the dense vector.
 !   desc_a      -  type(<psb_desc_type>).        The communication descriptor.
 !   info        -  integer.                      Eventually returns an error code.
--- a/base/comm/psb_zscatter.F90
+++ b/base/comm/psb_zscatter.F90
@ -34,7 +34,7 @@
 !   This subroutine scatters a global matrix locally owned by one process
 !   into pieces that are local to all the processes.
 !
-! Parameters:
+! Arguments:
 !   globx     -  complex,dimension(:,:).          The global matrix to scatter.
 !   locx      -  complex,dimension(:,:).          The local piece of the distributed matrix.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
@ -265,7 +265,7 @@ end subroutine psb_zscatterm
 !   This subroutine scatters a global vector locally owned by one process
 !   into pieces that are local to all the processes.
 !
-! Parameters:
+! Arguments:
 !   globx     -  complex,dimension(:).         The global vector to scatter.
 !   locx      -  complex,dimension(:).         The local piece of the distributed vector.
 !   desc_a    -  type(<psb_desc_type>).        The communication descriptor.
--- a/base/internals/psi_crea_bnd_elem.f90
+++ b/base/internals/psi_crea_bnd_elem.f90
@ -37,7 +37,7 @@
 !    otherwise its size is equal to the number of boundary indices on the 
 !    current (calling) process. 
 ! 
-! Parameters: 
+! Arguments: 
 !    bndel(:) - integer, allocatable      Array containing the output list              
 !    desc_a   - type(<psb_desc_type>).    The communication descriptor.        
 !    info     - integer.                  return code.
--- a/base/internals/psi_crea_index.f90
+++ b/base/internals/psi_crea_index.f90
@ -36,7 +36,7 @@
 !    Converts a list of data exchanges from build format to assembled format. 
 !    See below for a description of the formats.
 !
-! Parameters:
+! Arguments:
 ! desc_a       - type(psb_desc_type)   The descriptor; in this context only the index 
 !                                       mapping parts are used.
 ! index_in(:)  - integer               The index list, build format  
--- a/base/internals/psi_crea_ovr_elem.f90
+++ b/base/internals/psi_crea_ovr_elem.f90
@ -36,7 +36,7 @@
 !   the number of processes sharing it (minimum: 2). List is ended by -1.
 !   See also description in base/modules/psb_desc_type.f90
 ! 
-! Parameters: 
+! Arguments: 
 !    ovr_elem(:) - integer, allocatable      Array containing the output list              
 !    desc_a   - type(<psb_desc_type>).    The communication descriptor.        
 !    info     - integer.                  return code.
--- a/base/internals/psi_dl_check.f90
+++ b/base/internals/psi_dl_check.f90
@ -36,7 +36,7 @@
 !   then process j should depend on i (even if the data to be sent in one of the
 !   directions happens to be empty)
 ! 
-! Parameters: 
+! Arguments: 
 !    dep_list(:,:) - integer             Initial dependency lists
 !    dl_lda        - integer             Allocated size of dep_list
 !    np            - integer             Total number of processes.
--- a/base/internals/psi_dswapdata.F90
+++ b/base/internals/psi_dswapdata.F90
@ -28,6 +28,58 @@
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswapdata.F90
+!
+! Subroutine: psi_Xswapdatam
+!   Does the data exchange among processes. Essentially this is doing 
+!   a variable all-to-all data exchange (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    n        - integer                 Number of columns in Y               
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:,:)   - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
+!
 subroutine psi_dswapdatam(flag,n,beta,y,desc_a,work,info,data)

  use psi_mod, psb_protect_name => psi_dswapdatam
@ -451,6 +503,57 @@ end subroutine psi_dswapdatam
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswapdata.F90
+!
+! Subroutine: psi_Xswapdatav
+!   Does the data exchange among processes. Essentially this is doing 
+!   a variable all-to-all data exchange (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    (There is no n argument in this variant: Y is a rank-1 array.)
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:)     - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
 subroutine psi_dswapdatav(flag,beta,y,desc_a,work,info,data)

  use psi_mod, psb_protect_name => psi_dswapdatav
--- a/base/internals/psi_dswaptran.F90
+++ b/base/internals/psi_dswaptran.F90
@ -28,6 +28,61 @@
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswaptran.F90
+!
+! Subroutine: psi_Xswaptranm
+!   Does the data exchange among processes. This is similar to Xswapdata, but
+!   the list is read "in reverse", i.e. indices that are normally SENT are used 
+!   for the RECEIVE part and vice-versa. This is the basic data exchange operation
+!   for doing the product of a sparse matrix by a vector. 
+!   Essentially this is doing a variable all-to-all data exchange
+!   (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    n        - integer                 Number of columns in Y               
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:,:)   - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
 subroutine psi_dswaptranm(flag,n,beta,y,desc_a,work,info,data)

  use psi_mod, psb_protect_name => psi_dswaptranm
@ -442,6 +497,61 @@ end subroutine psi_dswaptranm
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswaptran.F90
+!
+! Subroutine: psi_Xswaptranv
+!   Does the data exchange among processes. This is similar to Xswapdata, but
+!   the list is read "in reverse", i.e. indices that are normally SENT are used 
+!   for the RECEIVE part and vice-versa. This is the basic data exchange operation
+!   for doing the product of a sparse matrix by a vector. 
+!   Essentially this is doing a variable all-to-all data exchange
+!   (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    (There is no n argument in this variant: Y is a rank-1 array.)
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:)     - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
 subroutine psi_dswaptranv(flag,beta,y,desc_a,work,info,data)

  use psi_mod, psb_protect_name => psi_dswaptranv
--- a/base/internals/psi_fnd_owner.f90
+++ b/base/internals/psi_fnd_owner.f90
@ -27,7 +27,22 @@
 !!$  ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
-!!$  
+!!$ 
+!
+! File: psi_fnd_owner.f90
+!
+! Subroutine: psi_fnd_owner
+!   Figure out which process owns each of the requested global indices. 
+! 
+! Arguments: 
+!    nv       - integer                   Number of indices required on  the calling
+!                                         process 
+!    idx(:)   - integer                   Required indices on the calling process
+!    iprc(:)  - integer, allocatable      Output: process identifiers for the corresponding
+!                                         indices
+!    desc     - type(<psb_desc_type>).    The communication descriptor.        
+!    info     - integer.                  return code.
+! 
 subroutine psi_fnd_owner(nv,idx,iprc,desc,info)
  use psb_descriptor_type
  use psb_serial_mod
@ -80,10 +95,20 @@ subroutine psi_fnd_owner(nv,idx,iprc,desc,info)
    write(0,*) 'Invalid input descriptor in psi_fnd_owner'
  end if

+  !
+  ! The basic idea is very simple. 
+  ! First we figure out the total number of requests.
+  ! Second we build the aggregate list of requests (with psb_amx)
+  ! Third, we figure out locally whether we own the indices (whoever is 
+  ! asking for them) and build our part of the reply (we shift process 
+  !  indices so that they're 1-based)
+  ! Fourth, we do a psb_amx on the replies so that we have everybody's answers
+  ! Fifth, we extract the answers for our local query, and shift back the 
+  ! process indices to 0-based.

  Allocate(hidx(np+1),hsz(np),stat=info)
  if (info /= 0) then 
-    call psb_errpush(4010,name,a_err='Allocate')
+    call psb_errpush(4010,name,a_err='Allocate') 
    goto 9999      
  end if
  hsz       = 0
--- a/base/internals/psi_idx_cnv.f90
+++ b/base/internals/psi_idx_cnv.f90
@ -28,6 +28,20 @@
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_idx_cnv.f90
+!
+! Subroutine: psi_idx_cnv1
+!   Converts a bunch of indices from global to local numbering. 
+!   
+! 
+! Arguments: 
+!    nv       - integer                   Number of indices required 
+!    idxin(:) - integer                   Required indices,   overwritten on output.
+!    desc     - type(<psb_desc_type>).    The communication descriptor.        
+!    info     - integer.                  return code.
+!    mask(:)  - logical, optional         Only do the conversion for specific indices.
+!    owned    - logical,optional          Restrict to local indices, no halo (default false)
 subroutine psi_idx_cnv1(nv,idxin,desc,info,mask,owned)
  use psb_descriptor_type
  use psb_serial_mod
@ -167,7 +181,21 @@ end subroutine psi_idx_cnv1
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
-
+!
+! File: psi_idx_cnv.f90
+!
+! Subroutine: psi_idx_cnv2
+!   Converts a bunch of indices from global to local numbering. 
+!   
+! 
+! Arguments: 
+!    nv        - integer                   Number of indices required 
+!    idxin(:)  - integer                   Required indices
+!    idxout(:) - integer                   Output values, negative for invalid input.
+!    desc      - type(<psb_desc_type>).    The communication descriptor.        
+!    info      - integer.                  return code.
+!    mask(:)   - logical, optional         Only do the conversion for specific indices.
+!    owned     - logical,optional          Restrict to local indices, no halo (default false)
 subroutine psi_idx_cnv2(nv,idxin,idxout,desc,info,mask,owned)
  use psb_descriptor_type
  use psb_serial_mod
@ -251,9 +279,19 @@ subroutine psi_idx_cnv2(nv,idxin,idxout,desc,info,mask,owned)
    owned_ = .false.
  endif

-
+  !
+  ! The input descriptor may be in any state
+  !
  if (psb_is_large_desc(desc)) then 
+    !
+    ! Large descriptor: the size of the index space is such that
+    ! we decided not to allocate the glob_to_loc(:) map.
+    !
    if (psb_is_bld_desc(desc)) then 
+      !
+      ! During the build phase of a large descriptor the indices 
+      ! are kept in an AVL tree.
+      !
      do i = 1, nv
        if (mask_(i)) then 
          ip = idxin(i) 
@ -274,6 +312,12 @@ subroutine psi_idx_cnv2(nv,idxin,idxout,desc,info,mask,owned)
        end if
      enddo
    else if (psb_is_asb_desc(desc)) then 
+      !
+      ! When a large descriptor is assembled the indices 
+      ! are kept in a (hashed) list of ordered lists, 
+      ! hence psi_inner_cnv does the hashing and binary search.
+      !
+
      if (.not.allocated(desc%hashv)) then 
        write(0,*) 'Inconsistent input to inner_cnv'
      end if
@ -283,6 +327,10 @@ subroutine psi_idx_cnv2(nv,idxin,idxout,desc,info,mask,owned)

  else

+    !
+    ! Not a large descriptor, so we have  the glob_to_loc(:) map
+    ! available. 
+    !
    do i = 1, nv
      if (mask_(i)) then 
        ip = idxin(i) 
@ -355,6 +403,20 @@ end subroutine psi_idx_cnv2
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_idx_cnv.f90
+!
+! Subroutine: psi_idx_cnvs
+!   Converts an index from global to local numbering. 
+!   
+! 
+! Arguments: 
+!    idxin     - integer                   Required index   
+!    idxout    - integer                   Output value, negative for invalid input.
+!    desc      - type(<psb_desc_type>).    The communication descriptor.        
+!    info      - integer.                  return code.
+!    mask      - logical, optional         Only do the conversion if true.
+!    owned     - logical,optional          Restrict to local indices, no halo (default false)
 subroutine psi_idx_cnvs(idxin,idxout,desc,info,mask,owned)

  use psi_mod, psb_protect_name => psi_idx_cnvs
--- a/base/internals/psi_idx_ins_cnv.f90
+++ b/base/internals/psi_idx_ins_cnv.f90
@ -28,6 +28,25 @@
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_idx_ins_cnv.f90
+!
+! Subroutine: psi_idx_ins_cnv1
+!   Converts a bunch of indices from global to local numbering. 
+!   This routine is called while the descriptor is in the build state;
+!   the idea is that if an index is not yet marked as local, it is a new 
+!   connection to another process, i.e. a new entry into the halo. 
+!   But we still need the mask, because we have to take out the column indices 
+!   corresponding to row indices we do not own (see psb_cdins for how this is used). 
+! 
+! Arguments: 
+!    nv        - integer                   Number of indices required 
+!    idxin(:)  - integer                   Required indices, overwritten on output
+!                                          output is negative for masked entries
+!    desc      - type(<psb_desc_type>).    The communication descriptor.        
+!    info      - integer.                  return code.
+!    mask(:)   - logical, optional         Only do the conversion for specific indices.
+!    
 subroutine psi_idx_ins_cnv1(nv,idxin,desc,info,mask)
  use psi_mod, psb_protect_name => psi_idx_ins_cnv1
  use psb_descriptor_type
@ -159,7 +178,25 @@ end subroutine psi_idx_ins_cnv1
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
-
+!
+! File: psi_idx_ins_cnv.f90
+!
+! Subroutine: psi_idx_ins_cnv2
+!   Converts a bunch of indices from global to local numbering. 
+!   This routine is called while the descriptor is in the build state;
+!   the idea is that if an index is not yet marked as local, it is a new 
+!   connection to another process, i.e. a new entry into the halo. 
+!   But we still need the mask, because we have to take out the column indices 
+!   corresponding to row indices we do not own (see psb_cdins for how this is used). 
+! 
+! Arguments: 
+!    nv        - integer                   Number of indices required 
+!    idxin(:)  - integer                   Required indices
+!    idxout(:) - integer                   Output values (negative for masked entries)
+!    desc      - type(<psb_desc_type>).    The communication descriptor.        
+!    info      - integer.                  return code.
+!    mask(:)   - logical, optional         Only do the conversion for specific indices.
+!    
 subroutine psi_idx_ins_cnv2(nv,idxin,idxout,desc,info,mask)
  use psi_mod, psb_protect_name => psi_idx_ins_cnv2
  use psb_descriptor_type
@ -399,6 +436,24 @@ end subroutine psi_idx_ins_cnv2
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_idx_ins_cnv.f90
+!
+! Subroutine: psi_idx_ins_cnvs
+!   Converts an index from global to local numbering. 
+!   This routine is called while the descriptor is in the build state;
+!   the idea is that if an index is not yet marked as local, it is a new 
+!   connection to another process, i.e. a new entry into the halo. 
+!   But we still need the mask, because we have to take out the column indices 
+!   corresponding to row indices we do not own (see psb_cdins for how this is used). 
+! 
+! Arguments: 
+!    idxin     - integer                   Required index
+!    idxout    - integer                   Output value (negative for masked entries)
+!    desc      - type(<psb_desc_type>).    The communication descriptor.        
+!    info      - integer.                  return code.
+!    mask      - logical, optional         Only do the conversion for specific indices.
+!    
 subroutine psi_idx_ins_cnvs(idxin,idxout,desc,info,mask)
  use psi_mod, psb_protect_name => psi_idx_ins_cnvs
  use psb_descriptor_type
--- a/base/internals/psi_iswapdata.F90
+++ b/base/internals/psi_iswapdata.F90
@ -28,6 +28,57 @@
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswapdata.F90
+!
+! Subroutine: psi_Xswapdatam
+!   Does the data exchange among processes. Essentially this is doing 
+!   a variable all-to-all data exchange (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    n        - integer                 Number of columns in Y               
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:,:)   - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
 subroutine psi_iswapdatam(flag,n,beta,y,desc_a,work,info,data)

  use psi_mod, psb_protect_name => psi_iswapdatam
@ -451,6 +502,57 @@ end subroutine psi_iswapdatam
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswapdata.F90
+!
+! Subroutine: psi_Xswapdatav
+!   Does the data exchange among processes. Essentially this is doing 
+!   a variable all-to-all data exchange (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    n        - integer                 Number of columns in Y (psi_Xswapdatam only; not an argument here)
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:)     - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
 subroutine psi_iswapdatav(flag,beta,y,desc_a,work,info,data)

  use psi_mod, psb_protect_name => psi_iswapdatav
--- a/base/internals/psi_iswaptran.F90
+++ b/base/internals/psi_iswaptran.F90
@ -28,6 +28,61 @@
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswaptran.F90
+!
+! Subroutine: psi_Xswaptranm
+!   Does the data exchange among processes. This is similar to Xswapdata, but
+!   the list is read "in reverse", i.e. indices that are normally SENT are used 
+!   for the RECEIVE part and vice-versa. This is the basic data exchange operation
+!   for doing the product of a sparse matrix by a vector. 
+!   Essentially this is doing a variable all-to-all data exchange
+!   (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    n        - integer                 Number of columns in Y               
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:,:)   - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
 subroutine psi_iswaptranm(flag,n,beta,y,desc_a,work,info,data)

  use psi_mod, psb_protect_name => psi_iswaptranm
@ -441,6 +496,61 @@ end subroutine psi_iswaptranm
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswaptran.F90
+!
+! Subroutine: psi_Xswaptranv
+!   Does the data exchange among processes. This is similar to Xswapdata, but
+!   the list is read "in reverse", i.e. indices that are normally SENT are used 
+!   for the RECEIVE part and vice-versa. This is the basic data exchange operation
+!   for doing the product of a sparse matrix by a vector. 
+!   Essentially this is doing a variable all-to-all data exchange
+!   (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    n        - integer                 Number of columns in Y (psi_Xswaptranm only; not an argument here)
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:)     - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
 subroutine psi_iswaptranv(flag,beta,y,desc_a,work,info,data)

  use psi_mod, psb_protect_name => psi_iswaptranv
--- a/base/internals/psi_zswapdata.F90
+++ b/base/internals/psi_zswapdata.F90
@ -28,6 +28,57 @@
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswapdata.F90
+!
+! Subroutine: psi_Xswapdatam
+!   Does the data exchange among processes. Essentially this is doing 
+!   a variable all-to-all data exchange (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    n        - integer                 Number of columns in Y               
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:,:)   - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
 subroutine psi_zswapdatam(flag,n,beta,y,desc_a,work,info,data)

  use psi_mod, psb_protect_name => psi_zswapdatam
@ -451,6 +502,57 @@ end subroutine psi_zswapdatam
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswapdata.F90
+!
+! Subroutine: psi_Xswapdatav
+!   Does the data exchange among processes. Essentially this is doing 
+!   a variable all-to-all data exchange (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    n        - integer                 Number of columns in Y (psi_Xswapdatam only; not an argument here)
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:)     - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
 subroutine psi_zswapdatav(flag,beta,y,desc_a,work,info,data)

  use psi_mod, psb_protect_name => psi_zswapdatav
--- a/base/internals/psi_zswaptran.F90
+++ b/base/internals/psi_zswaptran.F90
@ -28,6 +28,61 @@
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswaptran.F90
+!
+! Subroutine: psi_Xswaptranm
+!   Does the data exchange among processes. This is similar to Xswapdata, but
+!   the list is read "in reverse", i.e. indices that are normally SENT are used 
+!   for the RECEIVE part and vice-versa. This is the basic data exchange operation
+!   for doing the product of a sparse matrix by a vector. 
+!   Essentially this is doing a variable all-to-all data exchange
+!   (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    n        - integer                 Number of columns in Y               
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:,:)   - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
 subroutine psi_zswaptranm(flag,n,beta,y,desc_a,work,info,data)

  use psi_mod, psb_protect_name => psi_zswaptranm
@ -442,6 +497,61 @@ end subroutine psi_zswaptranm
 !!$  POSSIBILITY OF SUCH DAMAGE.
 !!$ 
 !!$  
+!
+! File: psi_Xswaptran.F90
+!
+! Subroutine: psi_Xswaptranv
+!   Does the data exchange among processes. This is similar to Xswapdata, but
+!   the list is read "in reverse", i.e. indices that are normally SENT are used 
+!   for the RECEIVE part and vice-versa. This is the basic data exchange operation
+!   for doing the product of a sparse matrix by a vector. 
+!   Essentially this is doing a variable all-to-all data exchange
+!   (ALLTOALLV in MPI parlance), but 
+!   it is capable of pruning empty exchanges, which are very likely in our 
+!   application environment. All the variants have the same structure.
+!   In all these subroutines X may be:    I    Integer
+!                                         D    real(kind(1.d0))
+!                                         Z    complex(kind(1.d0))
+!   Basically the operation is as follows: on each process, we identify 
+!   sections SND(Y) and RCV(Y); then we do a SEND(PACK(SND(Y)));
+!   then we receive, and we do an update with Y = UNPACK(RCV(Y)) + BETA * Y 
+!   but only on the elements involved in the UNPACK operation. 
+!   Thus: for halo data exchange, the receive section is confined in the 
+!   halo indices, and BETA=0, whereas for overlap exchange the receive section 
+!   is scattered in the owned indices, and BETA=1.
+! 
+! Arguments: 
+!    flag     - integer                 Choose the algorithm for data exchange: 
+!                                       this is chosen through bit fields. 
+!                                        swap_mpi  = iand(flag,psb_swap_mpi_)  /= 0
+!                                        swap_sync = iand(flag,psb_swap_sync_) /= 0
+!                                        swap_send = iand(flag,psb_swap_send_) /= 0
+!                                        swap_recv = iand(flag,psb_swap_recv_) /= 0
+!                                       if (swap_mpi):  use underlying MPI_ALLTOALLV.
+!                                       if (swap_sync): use PSB_SND and PSB_RCV in 
+!                                                       synchronized pairs
+!                                       if (swap_send .and. swap_recv): use mpi_irecv 
+!                                                       and mpi_send
+!                                       if (swap_send): use psb_snd (but need another 
+!                                                       call with swap_recv to complete)
+!                                       if (swap_recv): use psb_rcv (completing a 
+!                                                       previous call with swap_send)
+!
+!
+!    n        - integer                 Number of columns in Y (psi_Xswaptranm only; not an argument here)
+!    beta     - X                       Choose overwrite or sum. 
+!    y(:)     - X                       The data area                        
+!    desc_a   - type(<psb_desc_type>).  The communication descriptor.        
+!    work(:)  - X                       Buffer space. If not sufficient, will do 
+!                                       our own internal allocation.
+!    info     - integer.                return code.
+!    data     - integer                 which list is to be used to exchange data
+!                                       default psb_comm_halo_
+!                                       psb_comm_halo_    use halo_index
+!                                       psb_comm_ext_     use ext_index 
+!                                       psb_comm_ovrl_    use ovrl_index
+!
+!
 subroutine psi_zswaptranv(flag,beta,y,desc_a,work,info,data)

  use psb_error_mod
--- a/base/modules/psi_mod.f90
+++ b/base/modules/psi_mod.f90
@ -421,6 +421,14 @@ contains
    integer, intent(inout) :: x(:)

    integer :: i, ih, key, idx,nh,tmp,lb,ub,lm
+    !
+    ! When a large descriptor is assembled the indices 
+    ! are kept in a (hashed) list of ordered lists. 
+    ! Thus we first hash the index, then we do a binary search on the 
+    ! ordered sublist. The hashing is based on the low-order bits 
+    ! for a width of psb_hash_bits 
+    !
+    
    do i=1, n
      key = x(i) 
      ih  = iand(key,hashmask)
@ -460,6 +468,13 @@ contains
    integer, intent(out) :: y(:)

    integer :: i, ih, key, idx,nh,tmp,lb,ub,lm
+    !
+    ! When a large descriptor is assembled the indices 
+    ! are kept in a (hashed) list of ordered lists. 
+    ! Thus we first hash the index, then we do a binary search on the 
+    ! ordered sublist. The hashing is based on the low-order bits 
+    ! for a width of psb_hash_bits 
+    !
    
    do i=1, n
      key = x(i) 
--- a/base/psblas/psb_damax.f90
+++ b/base/psblas/psb_damax.f90
@ -37,7 +37,7 @@
 !
 !    where sub( X ) denotes X(1:N,JX:).
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:,:).       The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -164,7 +164,7 @@ end function psb_damax
 !
 !    normi := max(abs(X(i)))
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:).         The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -285,7 +285,7 @@ end function psb_damaxv
 !
 !    where sub( X ) denotes X(1:N,JX:).
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:,:).       The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
@ -407,7 +407,7 @@ end subroutine psb_damaxvs
 !
 !    normi := max(abs(X(i)))
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:).         The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
--- a/base/psblas/psb_dasum.f90
+++ b/base/psblas/psb_dasum.f90
@ -37,7 +37,7 @@
 !
 !    where sub( X ) denotes X(1:N,JX:).
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:,:).       The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -182,7 +182,7 @@ end function psb_dasum
 !
 !    norm1 := sum(X(i))
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:).       The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -319,7 +319,7 @@ end function psb_dasumv
 !
 !    norm1 := sum(X(i))
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:).         The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
--- a/base/psblas/psb_daxpby.f90
+++ b/base/psblas/psb_daxpby.f90
@ -39,7 +39,7 @@
 !
 !    sub( Y ) denotes Y(:,JY).
 !
-! Parameters:
+! Arguments:
 !    alpha  -  real.                      The scalar used to multiply each component of sub( X ).
 !    x      -  real,dimension(:,:).       The input vector containing the entries of sub( X ).
 !    beta   -  real.                      The scalar used to multiply each component of sub( Y ).
@ -195,7 +195,7 @@ end subroutine psb_daxpby
 !
 !    Y := beta * Y + alpha * X
 !
-! Parameters:
+! Arguments:
 !    alpha  -  real.                      The scalar used to multiply each component of X.
 !    x      -  real,dimension(:).         The input vector containing the entries of X.
 !    beta   -  real.                      The scalar used to multiply each component of Y.
--- a/base/psblas/psb_ddot.f90
+++ b/base/psblas/psb_ddot.f90
@ -39,7 +39,7 @@
 !
 !    sub( Y ) denotes Y(:,JY).
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:,:).       The input vector containing the entries of sub( X ).
 !    y      -  real,dimension(:,:).       The input vector containing the entries of sub( Y ).
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
@ -196,7 +196,7 @@ end function psb_ddot
 !
 !    dot := X**T * Y
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:).         The input vector containing the entries of X.
 !    y      -  real,dimension(:).         The input vector containing the entries of Y.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
@ -333,7 +333,7 @@ end function psb_ddotv
 !
 !    dot := X**T * Y
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:).         The input vector containing the entries of X.
 !    y      -  real,dimension(:).         The input vector containing the entries of Y.
@ -474,7 +474,7 @@ end subroutine psb_ddotvs
 !
 !    sub( Y ) denotes Y(:,JY).
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:,:).       The input vector containing the entries of sub( X ).
 !    y      -  real,dimension(:,:).       The input vector containing the entries of sub( Y ).
--- a/base/psblas/psb_dnrm2.f90
+++ b/base/psblas/psb_dnrm2.f90
@ -37,7 +37,7 @@
 !
 !    where sub( X ) denotes X(:,JX).
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:,:).       The input vector containing the entries of sub( X ).
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -176,7 +176,7 @@ end function psb_dnrm2
 !
 !    norm2 := sqrt ( X**T * X)
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:).         The input vector containing the entries of X.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -310,7 +310,7 @@ end function psb_dnrm2v
 !
 !    norm2 := sqrt ( X**T * X)
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:).         The input vector containing the entries of X.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
--- a/base/psblas/psb_dnrmi.f90
+++ b/base/psblas/psb_dnrmi.f90
@ -35,7 +35,7 @@
 !
 !    normi := max(abs(sum(A(i,j))))                                                                                   
 !
-! Parameters:
+! Arguments:
 !    a      -  type(<psb_dspmat_type>).   The sparse matrix containing A.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
--- a/base/psblas/psb_dspmm.f90
+++ b/base/psblas/psb_dspmm.f90
@ -62,7 +62,7 @@
 !  alpha and beta are scalars, and sub( X ) and sub( Y ) are distributed
 !  vectors and A is a M-by-N distributed matrix.
 !
-! Parameters:   
+! Arguments:   
 !    alpha  -  real.                        The scalar alpha.
 !    a      -  type(<psb_dspmat_type>).     The sparse matrix containing A.
 !    x      -  real,dimension(:,:).         The input vector containing the entries of sub( X ).
@ -402,7 +402,7 @@ end subroutine psb_dspmm
 !  alpha and beta are scalars, and X and Y are distributed
 !  vectors and A is a M-by-N distributed matrix.
 !
-! Parameters:   
+! Arguments:   
 !    alpha  -  real.                        The scalar alpha.
 !    a      -  type(<psb_dspmat_type>).     The sparse matrix containing A.
 !    x      -  real,dimension(:).           The input vector containing the entries of X.
--- a/base/psblas/psb_dspsm.f90
+++ b/base/psblas/psb_dspsm.f90
@ -54,7 +54,7 @@
 !  sub( X ) is a distributed
 !  vector and T is a M-by-M distributed triangular matrix.
 !
-! Parameters:   
+! Arguments:   
 !    alpha  -  real.                        The scalar alpha.
 !    a      -  type(<psb_dspmat_type>).     The sparse matrix containing A.
 !    x      -  real,dimension(:,:).         The input vector containing the entries of sub( X ).
@ -364,7 +364,7 @@ end subroutine psb_dspsm
 !  X is a distributed
 !  vector and T is a M-by-M distributed triangular matrix.
 !
-! Parameters:   
+! Arguments:   
 !    alpha  -  real.                        The scalar alpha.
 !    a      -  type(<psb_dspmat_type>).     The sparse matrix containing A.
 !    x      -  real,dimension(:).           The input vector containing the entries of X.
--- a/base/psblas/psb_zamax.f90
+++ b/base/psblas/psb_zamax.f90
@ -37,7 +37,7 @@
 !
 !    where sub( X ) denotes X(1:N,JX:).
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:,:).       The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -167,7 +167,7 @@ end function psb_zamax
 !
 !    normi := max(abs(X(i)))
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:).         The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -293,7 +293,7 @@ end function psb_zamaxv
 !
 !    where sub( X ) denotes X(1:N,JX:).
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:,:).       The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
@ -419,7 +419,7 @@ end subroutine psb_zamaxvs
 !
 !    normi := max(abs(X(i)))
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:).         The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
--- a/base/psblas/psb_zasum.f90
+++ b/base/psblas/psb_zasum.f90
@ -37,7 +37,7 @@
 !
 !    where sub( X ) denotes X(1:N,JX:).
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:,:).       The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -187,7 +187,7 @@ end function psb_zasum
 !
 !    norm1 := sum(X(i))
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:).       The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -330,7 +330,7 @@ end function psb_zasumv
 !
 !    norm1 := sum(X(i))
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:).         The input vector.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
--- a/base/psblas/psb_zaxpby.f90
+++ b/base/psblas/psb_zaxpby.f90
@ -39,7 +39,7 @@
 !
 !    sub( Y ) denotes Y(:,JY).
 !
-! Parameters:
+! Arguments:
 !    alpha  -  real.                      The scalar used to multiply each component of sub( X ).
 !    x      -  real,dimension(:,:).       The input vector containing the entries of sub( X ).
 !    beta   -  real.                      The scalar used to multiply each component of sub( Y ).
@ -193,7 +193,7 @@ end subroutine psb_zaxpby
 !
 !    Y := beta * Y + alpha * X
 !
-! Parameters:
+! Arguments:
 !    alpha  -  real.                      The scalar used to multiply each component of X.
 !    x      -  real,dimension(:).         The input vector containing the entries of X.
 !    beta   -  real.                      The scalar used to multiply each component of Y.
--- a/base/psblas/psb_zdot.f90
+++ b/base/psblas/psb_zdot.f90
@ -39,7 +39,7 @@
 !
 !    sub( Y ) denotes Y(:,JY).
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:,:).       The input vector containing the entries of sub( X ).
 !    y      -  real,dimension(:,:).       The input vector containing the entries of sub( Y ).
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
@ -195,7 +195,7 @@ end function psb_zdot
 !
 !    dot := X**T * Y
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:).         The input vector containing the entries of X.
 !    y      -  real,dimension(:).         The input vector containing the entries of Y.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
@ -332,7 +332,7 @@ end function psb_zdotv
 !
 !    dot := X**T * Y
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:).         The input vector containing the entries of X.
 !    y      -  real,dimension(:).         The input vector containing the entries of Y.
@ -472,7 +472,7 @@ end subroutine psb_zdotvs
 !
 !    sub( Y ) denotes Y(:,JY).
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:,:).       The input vector containing the entries of sub( X ).
 !    y      -  real,dimension(:,:).       The input vector containing the entries of sub( Y ).
--- a/base/psblas/psb_znrm2.f90
+++ b/base/psblas/psb_znrm2.f90
@ -37,7 +37,7 @@
 !
 !    where sub( X ) denotes X(:,JX).
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:,:).       The input vector containing the entries of sub( X ).
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -175,7 +175,7 @@ end function psb_znrm2
 !
 !    norm2 := sqrt ( X**T * X)
 !
-! Parameters:
+! Arguments:
 !    x      -  real,dimension(:).         The input vector containing the entries of X.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
@ -309,7 +309,7 @@ end function psb_znrm2v
 !
 !    norm2 := sqrt ( X**T * X)
 !
-! Parameters:
+! Arguments:
 !    res    -  real.                      The result.
 !    x      -  real,dimension(:).         The input vector containing the entries of X.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
--- a/base/psblas/psb_znrmi.f90
+++ b/base/psblas/psb_znrmi.f90
@ -35,7 +35,7 @@
 !
 !    normi := max(abs(sum(A(i,j))))                                                                                   
 !
-! Parameters:
+! Arguments:
 !    a      -  type(<psb_zspmat_type>).   The sparse matrix containing A.
 !    desc_a -  type(<psb_desc_type>).     The communication descriptor.
 !    info   -  integer.                   Eventually returns an error code.
--- a/base/psblas/psb_zspmm.f90
+++ b/base/psblas/psb_zspmm.f90
@ -62,7 +62,7 @@
 !  alpha and beta are scalars, and sub( X ) and sub( Y ) are distributed
 !  vectors and A is a M-by-N distributed matrix.
 !
-! Parameters:   
+! Arguments:   
 !    alpha  -  real.                        The scalar alpha.
 !    a      -  type(<psb_zspmat_type>).     The sparse matrix containing A.
 !    x      -  real,dimension(:,:).         The input vector containing the entries of sub( X ).
@ -396,7 +396,7 @@ end subroutine psb_zspmm
 !  alpha and beta are scalars, and X and Y are distributed
 !  vectors and A is a M-by-N distributed matrix.
 !
-! Parameters:   
+! Arguments:   
 !    alpha  -  real.                        The scalar alpha.
 !    a      -  type(<psb_zspmat_type>).     The sparse matrix containing A.
 !    x      -  real,dimension(:).           The input vector containing the entries of X.
--- a/base/psblas/psb_zspsm.f90
+++ b/base/psblas/psb_zspsm.f90
@ -54,7 +54,7 @@
 !  sub( X ) is a distributed
 !  vector and T is a M-by-M distributed triangular matrix.
 !
-! Parameters:   
+! Arguments:   
 !    alpha  -  real.                        The scalar alpha.
 !    a      -  type(<psb_zspmat_type>).     The sparse matrix containing A.
 !    x      -  real,dimension(:,:).         The input vector containing the entries of sub( X ).
@ -367,7 +367,7 @@ end subroutine psb_zspsm
 !  X is a distributed
 !  vector and T is a M-by-M distributed triangular matrix.
 !
-! Parameters:   
+! Arguments:   
 !    alpha  -  real.                        The scalar alpha.
 !    a      -  type(<psb_zspmat_type>).     The sparse matrix containing A.
 !    x      -  real,dimension(:).           The input vector containing the entries of X.
--- a/base/serial/aux/msort_dw.f90
+++ b/base/serial/aux/msort_dw.f90
@ -32,7 +32,7 @@
 ! Subroutine: msort_dw
 !   This subroutine sorts an integer array into ascending order.
 !
-! Parameters:
+! Arguments:
 !   n         -  integer                   Input: size of the array 
 !   k         -  integer(*)                input: array of keys to be sorted
 !   l         -  integer(0:n+1)           output: link list 
--- a/base/serial/aux/msort_up.f90
+++ b/base/serial/aux/msort_up.f90
@ -32,7 +32,7 @@
 ! Subroutine: msort_up
 !   This subroutine sorts an integer array into ascending order.
 !
-! Parameters:
+! Arguments:
 !   n         -  integer                   Input: size of the array 
 !   k         -  integer(*)                input: array of keys to be sorted
 !   l         -  integer(0:n+1)           output: link list 
--- a/base/serial/psb_dcsmm.f90
+++ b/base/serial/psb_dcsmm.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dcsmm.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:
 subroutine psb_dcsmm(alpha,a,b,beta,c,info,trans)
  use psb_spmat_type
  use psb_error_mod
--- a/base/serial/psb_dcsmv.f90
+++ b/base/serial/psb_dcsmv.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dcsmv.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_dcsmv(alpha,a,b,beta,c,info,trans)
  use psb_spmat_type
--- a/base/serial/psb_dcsnmi.f90
+++ b/base/serial/psb_dcsnmi.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dcsnmi.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 real(kind(1.d0)) function psb_dcsnmi(a,info,trans)

--- a/base/serial/psb_dcsprt.f90
+++ b/base/serial/psb_dcsprt.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dcsprt.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 !*****************************************************************************
 !*                                                                           *
--- a/base/serial/psb_dcsrp.f90
+++ b/base/serial/psb_dcsrp.f90
@ -35,7 +35,7 @@
 !    Apply a right permutation to a sparse matrix, i.e. permute the column 
 !    indices. 
 ! 
-! Parameters: 
+! Arguments: 
 !    trans   - character.                       Whether iperm or its transpose 
 !                                               should be applied
 !    iperm   - integer, dimension(:)            A permutation vector; its size 
--- a/base/serial/psb_dcsrws.f90
+++ b/base/serial/psb_dcsrws.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dcsrws.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_dcsrws(rw,a,info,trans)
  use psb_spmat_type
--- a/base/serial/psb_dcssm.f90
+++ b/base/serial/psb_dcssm.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dcssm.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_dcssm(alpha,t,b,beta,c,info,trans,unitd,d)
  use psb_spmat_type
--- a/base/serial/psb_dcssv.f90
+++ b/base/serial/psb_dcssv.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dcssv.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_dcssv(alpha,t,b,beta,c,info,trans,unitd,d)
  use psb_spmat_type
--- a/base/serial/psb_dfixcoo.f90
+++ b/base/serial/psb_dfixcoo.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dfixcoo.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_dfixcoo(a,info,idir)
  use psb_spmat_type
--- a/base/serial/psb_dgelp.f90
+++ b/base/serial/psb_dgelp.f90
@ -34,7 +34,7 @@
 ! Subroutine: psb_dgelp
 !             Apply a left permutation to a dense matrix
 !
-! Parameters:
+! Arguments:
 ! trans    - character. 
 ! iperm    - integer.
 ! x        - real, dimension(:,:).
@ -164,7 +164,7 @@ end subroutine psb_dgelp
 ! Subroutine: psb_dgelpv
 !             Apply a left permutation to a dense matrix
 !
-! Parameters:
+! Arguments:
 ! trans    - character. 
 ! iperm    - integer.
 ! x        - real, dimension(:).
--- a/base/serial/psb_dipcoo2csc.f90
+++ b/base/serial/psb_dipcoo2csc.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dipcoo2csc.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_dipcoo2csc(a,info,clshr)
  use psb_spmat_type
--- a/base/serial/psb_dipcoo2csr.f90
+++ b/base/serial/psb_dipcoo2csr.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dipcoo2csr.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_dipcoo2csr(a,info,rwshr)
  use psb_spmat_type
--- a/base/serial/psb_dipcsr2coo.f90
+++ b/base/serial/psb_dipcsr2coo.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dipcsr2coo.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 Subroutine psb_dipcsr2coo(a,info)
  use psb_spmat_type
--- a/base/serial/psb_dneigh.f90
+++ b/base/serial/psb_dneigh.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dneigh.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_dneigh(a,idx,neigh,n,info,lev)

--- a/base/serial/psb_dnumbmm.f90
+++ b/base/serial/psb_dnumbmm.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dnumbmm.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:
 !
 !
 ! Note: This subroutine performs the numerical product of two sparse matrices.
--- a/base/serial/psb_drwextd.f90
+++ b/base/serial/psb_drwextd.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_drwextd.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:
 !
 ! We have a problem here: 1. How to handle well all the formats? 
 !                         2. What should we do with rowscale? Does it only 
--- a/base/serial/psb_dspclip.f90
+++ b/base/serial/psb_dspclip.f90
@ -31,7 +31,7 @@
 ! File:  psb_dspclip.f90 
 ! Subroutine: psb_dspclip
 !    Creates a "clipped" copy of input matrix A. Output is always in COO. 
-! Parameters:
+! Arguments:

 !*****************************************************************************
 !*                                                                           *
--- a/base/serial/psb_dspcnv.f90
+++ b/base/serial/psb_dspcnv.f90
@ -34,7 +34,7 @@
 !    This subroutine performs the assembly of
 !    the local part of a sparse distributed matrix
 !
-! Parameters:
+! Arguments:
 !   a      -  type(<psb_spmat_type>).         The input matrix to be assembled.
 !   b      -  type(<psb_spmat_type>).         The assembled output matrix.
 !   info   -  integer.                        Eventually returns an error code.
--- a/base/serial/psb_dspgetrow.f90
+++ b/base/serial/psb_dspgetrow.f90
@ -31,7 +31,7 @@
 ! File:  psb_dspgetrow.f90 
 ! Subroutine: psb_dspgetrow
 !    Gets one or more rows from a sparse matrix. 
-! Parameters:
+! Arguments:
 !*****************************************************************************
 !*                                                                           *
 !*                                                                           *
--- a/base/serial/psb_dspgtblk.f90
+++ b/base/serial/psb_dspgtblk.f90
@ -31,7 +31,7 @@
 ! File:  psb_dspgtblk.f90 
 ! Subroutine: psb_dspgtblk
 !    Gets one or more rows from a sparse matrix. 
-! Parameters:
+! Arguments:
 !*****************************************************************************
 !*                                                                           *
 !* Takes a specified row from matrix A and copies into matrix B (possibly    *
--- a/base/serial/psb_dspgtdiag.f90
+++ b/base/serial/psb_dspgtdiag.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dspgtdiag.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 !*****************************************************************************
 !*                                                                           *
--- a/base/serial/psb_dspscal.f90
+++ b/base/serial/psb_dspscal.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dspscal.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 !*****************************************************************************
 !*                                                                           *
--- a/base/serial/psb_dsymbmm.f90
+++ b/base/serial/psb_dsymbmm.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dsymbmm.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:
 !
 !
 ! Note: This subroutine performs the symbolic product of two sparse matrices.
--- a/base/serial/psb_dtransp.f90
+++ b/base/serial/psb_dtransp.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_dtransp.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_dtransp(a,b,c,fmt)
  use psb_spmat_type
--- a/base/serial/psb_zcsmm.f90
+++ b/base/serial/psb_zcsmm.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zcsmm.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:
 subroutine psb_zcsmm(alpha,a,b,beta,c,info,trans)
  use psb_spmat_type
  use psb_error_mod
--- a/base/serial/psb_zcsmv.f90
+++ b/base/serial/psb_zcsmv.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zcsmv.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_zcsmv(alpha,a,b,beta,c,info,trans)
  use psb_spmat_type
--- a/base/serial/psb_zcsnmi.f90
+++ b/base/serial/psb_zcsnmi.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zcsnmi.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 real(kind(1.d0)) function psb_zcsnmi(a,info,trans)

--- a/base/serial/psb_zcsprt.f90
+++ b/base/serial/psb_zcsprt.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zcsprt.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 !*****************************************************************************
 !*                                                                           *
--- a/base/serial/psb_zcsrp.f90
+++ b/base/serial/psb_zcsrp.f90
@ -35,7 +35,7 @@
 !    Apply a right permutation to a sparse matrix, i.e. permute the column 
 !    indices. 
 ! 
-! Parameters: 
+! Arguments: 
 !    trans   - character.                       Whether iperm or its transpose 
 !                                               should be applied
 !    iperm   - integer, dimension(:)            A permutation vector; its size 
--- a/base/serial/psb_zcsrws.f90
+++ b/base/serial/psb_zcsrws.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zcsrws.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_zcsrws(rw,a,info,trans)
  use psb_spmat_type
--- a/base/serial/psb_zcssm.f90
+++ b/base/serial/psb_zcssm.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zcssm.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_zcssm(alpha,t,b,beta,c,info,trans,unitd,d)
  use psb_spmat_type
--- a/base/serial/psb_zcssv.f90
+++ b/base/serial/psb_zcssv.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zcssv.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_zcssv(alpha,t,b,beta,c,info,trans,unitd,d)
  use psb_spmat_type
--- a/base/serial/psb_zfixcoo.f90
+++ b/base/serial/psb_zfixcoo.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zfixcoo.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 Subroutine psb_zfixcoo(a,info,idir)
  use psb_spmat_type
--- a/base/serial/psb_zgelp.f90
+++ b/base/serial/psb_zgelp.f90
@ -34,7 +34,7 @@
 ! Subroutine: psb_zgelp
 !             Apply a left permutation to a dense matrix
 !
-! Parameters:
+! Arguments:
 ! trans    - character. 
 ! iperm    - integer.
 ! x        - real, dimension(:,:).
@ -167,7 +167,7 @@ end subroutine psb_zgelp
 ! Subroutine: psb_zgelpv
 !             Apply a left permutation to a dense matrix
 !
-! Parameters:
+! Arguments:
 ! trans    - character. 
 ! iperm    - integer.
 ! x        - real, dimension(:).
--- a/base/serial/psb_zipcoo2csc.f90
+++ b/base/serial/psb_zipcoo2csc.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zipcoo2csc.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_zipcoo2csc(a,info,clshr)
  use psb_spmat_type
--- a/base/serial/psb_zipcoo2csr.f90
+++ b/base/serial/psb_zipcoo2csr.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zipcoo2csr.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_zipcoo2csr(a,info,rwshr)
  use psb_spmat_type
--- a/base/serial/psb_zipcsr2coo.f90
+++ b/base/serial/psb_zipcsr2coo.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zipcsr2coo.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 Subroutine psb_zipcsr2coo(a,info)
  use psb_spmat_type
--- a/base/serial/psb_zneigh.f90
+++ b/base/serial/psb_zneigh.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zneigh.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_zneigh(a,idx,neigh,n,info,lev)

--- a/base/serial/psb_znumbmm.f90
+++ b/base/serial/psb_znumbmm.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_znumbmm.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:
 !
 !
 ! Note: This subroutine performs the numerical product of two sparse matrices.
--- a/base/serial/psb_zrwextd.f90
+++ b/base/serial/psb_zrwextd.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zrwextd.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:
 !
 ! We have a problem here: 1. How to handle well all the formats? 
 !                         2. What should we do with rowscale? Does it only 
--- a/base/serial/psb_zspclip.f90
+++ b/base/serial/psb_zspclip.f90
@ -31,7 +31,7 @@
 ! File:  psb_zspclip.f90 
 ! Subroutine: psb_zspclip
 !    Creates a "clipped" copy of input matrix A. Output is always in COO. 
-! Parameters:
+! Arguments:

 !*****************************************************************************
 !*                                                                           *
--- a/base/serial/psb_zspcnv.f90
+++ b/base/serial/psb_zspcnv.f90
@ -34,7 +34,7 @@
 !    This subroutine performs the assembly of
 !    the local part of a sparse distributed matrix
 !
-! Parameters:
+! Arguments:
 !   a      -  type(<psb_spmat_type>).         The input matrix to be assembled.
 !   b      -  type(<psb_spmat_type>).         The assembled output matrix.
 !   info   -  integer.                        Eventually returns an error code.
--- a/base/serial/psb_zspgetrow.f90
+++ b/base/serial/psb_zspgetrow.f90
@ -31,7 +31,7 @@
 ! File:  psb_zspgetrow.f90 
 ! Subroutine: psb_zspgetrow
 !    Gets one or more rows from a sparse matrix. 
-! Parameters:
+! Arguments:
 !*****************************************************************************
 !*                                                                           *
 !*                                                                           *
--- a/base/serial/psb_zspgtblk.f90
+++ b/base/serial/psb_zspgtblk.f90
@ -31,7 +31,7 @@
 ! File:  psb_zspgtblk.f90 
 ! Subroutine: psb_zspgtblk
 !    Gets one or more rows from a sparse matrix. 
-! Parameters:
+! Arguments:
 !*****************************************************************************
 !*                                                                           *
 !* Takes a specified row from matrix A and copies into matrix B (possibly    *
--- a/base/serial/psb_zspgtdiag.f90
+++ b/base/serial/psb_zspgtdiag.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zspgtdiag.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 !*****************************************************************************
 !*                                                                           *
--- a/base/serial/psb_zspscal.f90
+++ b/base/serial/psb_zspscal.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zspscal.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 !*****************************************************************************
 !*                                                                           *
--- a/base/serial/psb_zsymbmm.f90
+++ b/base/serial/psb_zsymbmm.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_zsymbmm.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:
 !
 !
 ! Note: This subroutine performs the symbolic product of two sparse matrices.
--- a/base/serial/psb_ztransc.f90
+++ b/base/serial/psb_ztransc.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_ztransc.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_ztransc(a,b,c,fmt)
  use psb_spmat_type
--- a/base/serial/psb_ztransp.f90
+++ b/base/serial/psb_ztransp.f90
@ -30,7 +30,7 @@
 !!$  
 ! File:  psb_ztransp.f90 
 ! Subroutine: 
-! Parameters:
+! Arguments:

 subroutine psb_ztransp(a,b,c,fmt)
  use psb_spmat_type
--- a/base/tools/psb_cd_inloc.f90
+++ b/base/tools/psb_cd_inloc.f90
@ -35,7 +35,7 @@
 !    of indices that are assigned to the current process. The global size 
 !    is equal to the largest index found on any process. 
 ! 
-! Parameters: 
+! Arguments: 
 !    v       - integer, dimension(:).         The array containing the partitioning scheme.
 !    ictxt - integer.                         The communication context.
 !    desc_a  - type(<psb_desc_type>).         The communication descriptor.
--- a/base/tools/psb_cdals.f90
+++ b/base/tools/psb_cdals.f90
@ -34,7 +34,7 @@
 !    Allocate descriptor
 !    and checks correctness of PARTS subroutine
 ! 
-! Parameters: 
+! Arguments: 
 !    m       - integer.                       The number of rows.
 !    n       - integer.                       The number of columns.
 !    parts   - external subroutine.           The routine that contains the 
--- a/base/tools/psb_cdalv.f90
+++ b/base/tools/psb_cdalv.f90
@ -36,7 +36,7 @@
 !    on all calling processes.
 !    
 ! 
-! Parameters: 
+! Arguments: 
 !    v       - integer, dimension(:).         The array containing the partitioning scheme.
 !    ictxt - integer.                         The communication context.
 !    desc_a  - type(<psb_desc_type>).         The communication descriptor.
--- a/base/tools/psb_cdcpy.f90
+++ b/base/tools/psb_cdcpy.f90
@ -33,7 +33,7 @@
 ! Subroutine: psb_cdcpy
 !   Produces a clone of a descriptor.
 ! 
-! Parameters: 
+! Arguments: 
 !    desc_in  - type(<psb_desc_type>).         The communication descriptor to be cloned.
 !    desc_out - type(<psb_desc_type>).         The output communication descriptor.
 !    info     - integer.                       Return code.
--- a/base/tools/psb_cdfree.f90
+++ b/base/tools/psb_cdfree.f90
@ -33,7 +33,7 @@
 ! Subroutine: psb_cdfree
 !   Frees a descriptor data structure.
 ! 
-! Parameters: 
+! Arguments: 
 !    desc_a   - type(<psb_desc_type>).         The communication descriptor to be freed.
 !    info     - integer.                       return code.
 subroutine psb_cdfree(desc_a,info)
--- a/base/tools/psb_cdins.f90
+++ b/base/tools/psb_cdins.f90
@ -33,7 +33,7 @@
 ! Subroutine: psb_cdins
 !   Takes as input a cloud of points and updates the descriptor accordingly.
 ! 
-! Parameters: 
+! Arguments: 
 !    nz       - integer.                       The number of points to insert.
 !    ia       - integer,dimension(:).          The row indices of the points.
 !    ja       - integer,dimension(:).          The column indices of the points.
--- a/base/tools/psb_cdprt.f90
+++ b/base/tools/psb_cdprt.f90
@ -33,7 +33,7 @@
 ! Subroutine: psb_cdprt
 !    Prints the descriptor to an output file
 ! 
-! Parameters: 
+! Arguments: 
 !    iout          - integer.                The output unit to print to.
 !    desc_p        - type(<psb_desc_type>).  The communication descriptor to be printed.
 !    glob          - logical(optional).      Whether to print out global or local data.
--- a/base/tools/psb_cdren.f90
+++ b/base/tools/psb_cdren.f90
@ -35,7 +35,7 @@
 ! Subroutine: psb_cdren
 !    Updates a communication descriptor according to a renumbering scheme.
 ! 
-! Parameters: 
+! Arguments: 
 !    trans    - character.                     Whether iperm or its transpose 
 !                                              should be applied.
 !    iperm    - integer,dimension(:).          The renumbering scheme.
--- a/Show More
+++ b/Show More