|
|
@ -1,7 +1,6 @@
|
|
|
|
#include "MatchBoxPC.h"
|
|
|
|
#include "MatchBoxPC.h"
|
|
|
|
#include <omp.h>
|
|
|
|
#include <omp.h>
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <stdio.h>
|
|
|
|
|
|
|
|
|
|
|
|
// ***********************************************************************
|
|
|
|
// ***********************************************************************
|
|
|
|
//
|
|
|
|
//
|
|
|
|
// MatchboxP: A C++ library for approximate weighted matching
|
|
|
|
// MatchboxP: A C++ library for approximate weighted matching
|
|
|
@ -314,17 +313,17 @@ void dalgoDistEdgeApproxDomEdgesLinearSearchMesgBndlSmallMateCMP(
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
/*
|
|
|
|
* Not parallelizable
|
|
|
|
* Not parallelizable
|
|
|
|
*/
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
|
|
for (i = 0; i < numGhostVertices; i++) { //O(|Ghost Vertices|)
|
|
|
|
for (i = 0; i < numGhostVertices; i++) { //O(|Ghost Vertices|)
|
|
|
|
verGhostPtr[i + 1] = verGhostPtr[i] + Counter[i];
|
|
|
|
verGhostPtr[i + 1] = verGhostPtr[i] + Counter[i];
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
cout<<verGhostPtr[i]<<"\t"; fflush(stdout);
|
|
|
|
cout<<verGhostPtr[i]<<"\t"; fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} // End of single region
|
|
|
|
} // End of single region
|
|
|
|
|
|
|
|
|
|
|
|
#ifdef TIME_TRACKER
|
|
|
|
#ifdef TIME_TRACKER
|
|
|
|
verGhostPtrInitialization = MPI_Wtime() - verGhostPtrInitialization;
|
|
|
|
verGhostPtrInitialization = MPI_Wtime() - verGhostPtrInitialization;
|
|
|
@ -458,41 +457,41 @@ void dalgoDistEdgeApproxDomEdgesLinearSearchMesgBndlSmallMateCMP(
|
|
|
|
*/
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
|
|
#pragma omp for schedule(static)
|
|
|
|
#pragma omp for schedule(static)
|
|
|
|
for ( v=0; v < NLVer; v++ ) {
|
|
|
|
for ( v=0; v < NLVer; v++ ) {
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
cout<<"\n("<<myRank<<")Processing: "<<v+StartIndex<<endl; fflush(stdout);
|
|
|
|
cout<<"\n("<<myRank<<")Processing: "<<v+StartIndex<<endl; fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
//Start: PARALLEL_COMPUTE_CANDIDATE_MATE_B(v)
|
|
|
|
//Start: PARALLEL_COMPUTE_CANDIDATE_MATE_B(v)
|
|
|
|
candidateMate[v] = firstComputeCandidateMate(verLocPtr[v], verLocPtr[v + 1], verLocInd, edgeLocWeight);
|
|
|
|
candidateMate[v] = firstComputeCandidateMate(verLocPtr[v], verLocPtr[v + 1], verLocInd, edgeLocWeight);
|
|
|
|
//End: PARALLEL_COMPUTE_CANDIDATE_MATE_B(v)
|
|
|
|
//End: PARALLEL_COMPUTE_CANDIDATE_MATE_B(v)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
/*
|
|
|
|
* PARALLEL_PROCESS_EXPOSED_VERTEX_B
|
|
|
|
* PARALLEL_PROCESS_EXPOSED_VERTEX_B
|
|
|
|
* The sequential version could be a bit more
|
|
|
|
* The sequential version could be a bit more
|
|
|
|
* efficient.
|
|
|
|
* efficient.
|
|
|
|
*
|
|
|
|
*
|
|
|
|
* TODO: Maybe it is possible to append the values of QLocalVtx, QGhostVtx, QMsgType and QOwner
|
|
|
|
* TODO: Maybe it is possible to append the values of QLocalVtx, QGhostVtx, QMsgType and QOwner
|
|
|
|
* first in a local variable and then, only at the end, append them to the real data structure
|
|
|
|
* first in a local variable and then, only at the end, append them to the real data structure
|
|
|
|
* to remove the critical sections.
|
|
|
|
* to remove the critical sections.
|
|
|
|
*
|
|
|
|
*
|
|
|
|
* TODO: Test when it's more efficient to execute this code
|
|
|
|
* TODO: Test when it's more efficient to execute this code
|
|
|
|
* in parallel.
|
|
|
|
* in parallel.
|
|
|
|
*/
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
|
|
MilanLongInt size = numGhostVertices; //TODO how can I decide a more meaningfull size?
|
|
|
|
MilanLongInt size = numGhostVertices; //TODO how can I decide a more meaningfull size?
|
|
|
|
//Fail messages
|
|
|
|
//Fail messages
|
|
|
|
privateQLocalVtx.~staticQueue();
|
|
|
|
privateQLocalVtx.~staticQueue();
|
|
|
|
privateQGhostVtx.~staticQueue();
|
|
|
|
privateQGhostVtx.~staticQueue();
|
|
|
|
privateQMsgType.~staticQueue();
|
|
|
|
privateQMsgType.~staticQueue();
|
|
|
|
privateQOwner.~staticQueue();
|
|
|
|
privateQOwner.~staticQueue();
|
|
|
|
privateU.~staticQueue();
|
|
|
|
privateU.~staticQueue();
|
|
|
|
|
|
|
|
|
|
|
|
new(&privateU) staticQueue(NLVer + numGhostVertices); //TODO how can I put a meaningfull size?
|
|
|
|
new(&privateU) staticQueue(NLVer + numGhostVertices); //TODO how can I put a meaningfull size?
|
|
|
|
new(&privateQLocalVtx) staticQueue(size);
|
|
|
|
new(&privateQLocalVtx) staticQueue(size);
|
|
|
|
new(&privateQGhostVtx) staticQueue(size);
|
|
|
|
new(&privateQGhostVtx) staticQueue(size);
|
|
|
|
new(&privateQMsgType) staticQueue(size);
|
|
|
|
new(&privateQMsgType) staticQueue(size);
|
|
|
|
new(&privateQOwner) staticQueue(size);
|
|
|
|
new(&privateQOwner) staticQueue(size);
|
|
|
|
|
|
|
|
|
|
|
|
#pragma omp for reduction(+: msgInd, NumMessagesBundled, myCard, PCounter[:numProcs]) schedule(static)
|
|
|
|
#pragma omp for reduction(+: msgInd, NumMessagesBundled, myCard, PCounter[:numProcs]) schedule(static)
|
|
|
|
for (v = 0; v < NLVer; v++) {
|
|
|
|
for (v = 0; v < NLVer; v++) {
|
|
|
@ -574,7 +573,7 @@ void dalgoDistEdgeApproxDomEdgesLinearSearchMesgBndlSmallMateCMP(
|
|
|
|
//Start: PARALLEL_PROCESS_CROSS_EDGE_B(v)
|
|
|
|
//Start: PARALLEL_PROCESS_CROSS_EDGE_B(v)
|
|
|
|
#pragma omp critical
|
|
|
|
#pragma omp critical
|
|
|
|
{
|
|
|
|
{
|
|
|
|
if (Counter[Ghost2LocalMap[w]] > 0) {
|
|
|
|
if (Counter[Ghost2LocalMap[w]] > 0) {
|
|
|
|
|
|
|
|
|
|
|
|
Counter[Ghost2LocalMap[w]] -= 1; //Decrement
|
|
|
|
Counter[Ghost2LocalMap[w]] -= 1; //Decrement
|
|
|
|
if (Counter[Ghost2LocalMap[w]] == 0) {
|
|
|
|
if (Counter[Ghost2LocalMap[w]] == 0) {
|
|
|
@ -614,6 +613,8 @@ void dalgoDistEdgeApproxDomEdgesLinearSearchMesgBndlSmallMateCMP(
|
|
|
|
|
|
|
|
|
|
|
|
} //End of if(w >=0)
|
|
|
|
} //End of if(w >=0)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
//This piece of code is executed a really small amount of times, I will not allocate a
|
|
|
|
|
|
|
|
//huge amount of memory to the private data structures.
|
|
|
|
adj11 = verLocPtr[v];
|
|
|
|
adj11 = verLocPtr[v];
|
|
|
|
adj12 = verLocPtr[v + 1];
|
|
|
|
adj12 = verLocPtr[v + 1];
|
|
|
|
for (k1 = adj11; k1 < adj12; k1++) {
|
|
|
|
for (k1 = adj11; k1 < adj12; k1++) {
|
|
|
@ -632,28 +633,16 @@ void dalgoDistEdgeApproxDomEdgesLinearSearchMesgBndlSmallMateCMP(
|
|
|
|
assert(ghostOwner != -1);
|
|
|
|
assert(ghostOwner != -1);
|
|
|
|
assert(ghostOwner != myRank);
|
|
|
|
assert(ghostOwner != myRank);
|
|
|
|
PCounter[ghostOwner]++;
|
|
|
|
PCounter[ghostOwner]++;
|
|
|
|
privateQLocalVtx.push_back(v + StartIndex);
|
|
|
|
QLocalVtx.push_back(v + StartIndex);
|
|
|
|
privateQGhostVtx.push_back(w);
|
|
|
|
QGhostVtx.push_back(w);
|
|
|
|
privateQMsgType.push_back(FAILURE);
|
|
|
|
QMsgType.push_back(FAILURE);
|
|
|
|
privateQOwner.push_back(ghostOwner);
|
|
|
|
QOwner.push_back(ghostOwner);
|
|
|
|
|
|
|
|
|
|
|
|
} //End of if(GHOST)
|
|
|
|
} //End of if(GHOST)
|
|
|
|
} //End of for loop
|
|
|
|
} //End of for loop
|
|
|
|
//End: PARALLEL_PROCESS_EXPOSED_VERTEX_B(v)
|
|
|
|
//End: PARALLEL_PROCESS_EXPOSED_VERTEX_B(v)
|
|
|
|
} //End of for ( v=0; v < NLVer; v++ )
|
|
|
|
} //End of for ( v=0; v < NLVer; v++ )
|
|
|
|
|
|
|
|
|
|
|
|
#pragma omp critical(privateMsg)
|
|
|
|
|
|
|
|
{
|
|
|
|
|
|
|
|
while (!privateQLocalVtx.empty()) {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
QLocalVtx.push_back(privateQLocalVtx.pop_back());
|
|
|
|
|
|
|
|
QGhostVtx.push_back(privateQGhostVtx.pop_back());
|
|
|
|
|
|
|
|
QMsgType.push_back(privateQMsgType.pop_back());
|
|
|
|
|
|
|
|
QOwner.push_back(privateQOwner.pop_back());
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#pragma omp critical(U)
|
|
|
|
#pragma omp critical(U)
|
|
|
|
{
|
|
|
|
{
|
|
|
|
while (!privateU.empty())
|
|
|
|
while (!privateU.empty())
|
|
|
@ -668,261 +657,258 @@ void dalgoDistEdgeApproxDomEdgesLinearSearchMesgBndlSmallMateCMP(
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
cout<<"\n("<<myRank<<"=========================************==============================="<<endl; fflush(stdout);
|
|
|
|
cout<<"\n("<<myRank<<"=========================************==============================="<<endl; fflush(stdout);
|
|
|
|
fflush(stdout);
|
|
|
|
fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
///////////////////////////////////////////////////////////////////////////////////
|
|
|
|
///////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/////////////////////////// PROCESS MATCHED VERTICES //////////////////////////////
|
|
|
|
/////////////////////////// PROCESS MATCHED VERTICES //////////////////////////////
|
|
|
|
///////////////////////////////////////////////////////////////////////////////////
|
|
|
|
///////////////////////////////////////////////////////////////////////////////////
|
|
|
|
isEmpty = false;
|
|
|
|
isEmpty = false;
|
|
|
|
|
|
|
|
|
|
|
|
#ifdef COUNT_LOCAL_VERTEX
|
|
|
|
#ifdef COUNT_LOCAL_VERTEX
|
|
|
|
MilanLongInt localVertices = 0;
|
|
|
|
MilanLongInt localVertices = 0;
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
|
|
//TODO what would be the optimal UCHUNK
|
|
|
|
//TODO what would be the optimal UCHUNK
|
|
|
|
vector <MilanLongInt> Us;
|
|
|
|
vector <MilanLongInt> Us;
|
|
|
|
Us.reserve(UCHUNK);
|
|
|
|
Us.reserve(UCHUNK);
|
|
|
|
|
|
|
|
|
|
|
|
while( true ) {
|
|
|
|
while( true ) {
|
|
|
|
|
|
|
|
|
|
|
|
Us.clear();
|
|
|
|
Us.clear();
|
|
|
|
#pragma omp critical(U)
|
|
|
|
#pragma omp critical(U)
|
|
|
|
{
|
|
|
|
{
|
|
|
|
//If U is emptu and there are no new node to add to U
|
|
|
|
//If U is emptu and there are no new node to add to U
|
|
|
|
if (U.empty() && privateU.empty())
|
|
|
|
if (U.empty() && privateU.empty())
|
|
|
|
isEmpty = true;
|
|
|
|
isEmpty = true;
|
|
|
|
else {
|
|
|
|
else {
|
|
|
|
if (U.empty() && !privateU.empty()) // If U is empty but there are nodes in private U
|
|
|
|
if (U.empty() && !privateU.empty()) // If U is empty but there are nodes in private U
|
|
|
|
while (!privateU.empty()) {
|
|
|
|
while (!privateU.empty()) {
|
|
|
|
U.push_back(privateU.pop_front());
|
|
|
|
U.push_back(privateU.pop_front());
|
|
|
|
myCard += privateMyCard;
|
|
|
|
myCard += privateMyCard;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
for (int i = 0; i < UCHUNK; i++) { // Pop the new nodes
|
|
|
|
|
|
|
|
if (U.empty()) break;
|
|
|
|
|
|
|
|
Us.push_back(U.pop_front());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
for (int i = 0; i < UCHUNK; i++) { // Pop the new nodes
|
|
|
|
|
|
|
|
if (U.empty()) break;
|
|
|
|
|
|
|
|
Us.push_back(U.pop_front());
|
|
|
|
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} // End of critical U
|
|
|
|
} // End of critical U
|
|
|
|
if (isEmpty) break;
|
|
|
|
if (isEmpty) break;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
for (MilanLongInt u : Us)
|
|
|
|
for (MilanLongInt u : Us)
|
|
|
|
{
|
|
|
|
{
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
cout<<"\n("<<myRank<<")u: "<<u; fflush(stdout);
|
|
|
|
cout<<"\n("<<myRank<<")u: "<<u; fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
if ((u >= StartIndex) && (u <= EndIndex)) { //Process Only the Local Vertices
|
|
|
|
if ((u >= StartIndex) && (u <= EndIndex)) { //Process Only the Local Vertices
|
|
|
|
|
|
|
|
|
|
|
|
#ifdef COUNT_LOCAL_VERTEX
|
|
|
|
#ifdef COUNT_LOCAL_VERTEX
|
|
|
|
localVertices ++;
|
|
|
|
localVertices ++;
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
|
|
//Get the Adjacency list for u
|
|
|
|
//Get the Adjacency list for u
|
|
|
|
adj1 = verLocPtr[u - StartIndex]; //Pointer
|
|
|
|
adj1 = verLocPtr[u - StartIndex]; //Pointer
|
|
|
|
adj2 = verLocPtr[u - StartIndex + 1];
|
|
|
|
adj2 = verLocPtr[u - StartIndex + 1];
|
|
|
|
for (k = adj1; k < adj2; k++) {
|
|
|
|
for (k = adj1; k < adj2; k++) {
|
|
|
|
v = verLocInd[k];
|
|
|
|
v = verLocInd[k];
|
|
|
|
|
|
|
|
|
|
|
|
if ((v >= StartIndex) && (v <= EndIndex)) { //If Local Vertex:
|
|
|
|
|
|
|
|
#pragma omp critical(innerProcessMatched)
|
|
|
|
|
|
|
|
{
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if ((v >= StartIndex) && (v <= EndIndex)) { //If Local Vertex:
|
|
|
|
if ((v >= StartIndex) && (v <= EndIndex)) { //If Local Vertex:
|
|
|
|
|
|
|
|
#pragma omp critical(innerProcessMatched)
|
|
|
|
|
|
|
|
{
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
//If the current vertex is pointing to a matched vertex and is not matched
|
|
|
|
|
|
|
|
//FIXME is there a way to make candidateMate private?
|
|
|
|
|
|
|
|
// for the moment it could generate an error.
|
|
|
|
|
|
|
|
if (not isAlreadyMatched(v, StartIndex, EndIndex, GMate, Mate, Ghost2LocalMap) and
|
|
|
|
|
|
|
|
candidateMate[v - StartIndex] == u) {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
//Start: PARALLEL_PROCESS_EXPOSED_VERTEX_B(v)
|
|
|
|
|
|
|
|
//Start: PARALLEL_COMPUTE_CANDIDATE_MATE_B(v)
|
|
|
|
|
|
|
|
w = computeCandidateMate(verLocPtr[v - StartIndex],
|
|
|
|
|
|
|
|
verLocPtr[v - StartIndex + 1],
|
|
|
|
|
|
|
|
edgeLocWeight, 0,
|
|
|
|
|
|
|
|
verLocInd,
|
|
|
|
|
|
|
|
StartIndex,
|
|
|
|
|
|
|
|
EndIndex,
|
|
|
|
|
|
|
|
GMate,
|
|
|
|
|
|
|
|
Mate,
|
|
|
|
|
|
|
|
Ghost2LocalMap);
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
candidateMate[v - StartIndex] = w;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
//End: PARALLEL_COMPUTE_CANDIDATE_MATE_B(v)
|
|
|
|
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
cout<<"\n("<<myRank<<")"<<v<<" Points to: "<<w; fflush(stdout);
|
|
|
|
cout<<"\n("<<myRank<<")v: "<<v<<" c(v)= "<<candidateMate[v-StartIndex]<<" Mate[v]: "<<Mate[v];
|
|
|
|
|
|
|
|
fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
//If found a dominating edge:
|
|
|
|
|
|
|
|
if (w >= 0) {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
//TODO is it possible to lock without a critical region?
|
|
|
|
|
|
|
|
//TODO there must be a more elegant and efficient way to do this
|
|
|
|
|
|
|
|
while(true) {
|
|
|
|
|
|
|
|
if (omp_test_lock(&MateLock[v - StartIndex])) {
|
|
|
|
|
|
|
|
if (omp_test_lock(&MateLock[w - StartIndex])) break;
|
|
|
|
|
|
|
|
else omp_unset_lock(&MateLock[v - StartIndex]);
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if ((w < StartIndex) || (w > EndIndex)) { //A ghost
|
|
|
|
//If the current vertex is pointing to a matched vertex and is not matched
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
//FIXME is there a way to make candidateMate private?
|
|
|
|
cout<<"\n("<<myRank<<")Sending a request message:";
|
|
|
|
// for the moment it could generate an error.
|
|
|
|
cout<<"\n("<<myRank<<")Ghost is "<<w<<" Owner is: "<<findOwnerOfGhost(w, verDistance, myRank, numProcs);
|
|
|
|
if (not isAlreadyMatched(v, StartIndex, EndIndex, GMate, Mate, Ghost2LocalMap) and
|
|
|
|
#endif
|
|
|
|
candidateMate[v - StartIndex] == u) {
|
|
|
|
|
|
|
|
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
|
|
|
|
cout<<"\n("<<myRank<<")v: "<<v<<" c(v)= "<<candidateMate[v-StartIndex]<<" Mate[v]: "<<Mate[v];
|
|
|
|
|
|
|
|
fflush(stdout);
|
|
|
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
//If the current vertex is pointing to a matched vertex and is not matched
|
|
|
|
|
|
|
|
//FIXME is there a way to make candidateMate private?
|
|
|
|
|
|
|
|
// for the moment it could generate errors.
|
|
|
|
|
|
|
|
if (not isAlreadyMatched(v, StartIndex, EndIndex, GMate, Mate, Ghost2LocalMap) and
|
|
|
|
|
|
|
|
candidateMate[v - StartIndex] == u) {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
//Start: PARALLEL_PROCESS_EXPOSED_VERTEX_B(v)
|
|
|
|
//Start: PARALLEL_PROCESS_EXPOSED_VERTEX_B(v)
|
|
|
|
//Start: PARALLEL_COMPUTE_CANDIDATE_MATE_B(v)
|
|
|
|
//Start: PARALLEL_COMPUTE_CANDIDATE_MATE_B(v)
|
|
|
|
w = computeCandidateMate(verLocPtr[v - StartIndex],
|
|
|
|
w = computeCandidateMate(verLocPtr[v - StartIndex],
|
|
|
|
verLocPtr[v - StartIndex + 1],
|
|
|
|
verLocPtr[v - StartIndex + 1],
|
|
|
|
edgeLocWeight, 0,
|
|
|
|
edgeLocWeight, 0,
|
|
|
|
verLocInd,
|
|
|
|
verLocInd,
|
|
|
|
StartIndex,
|
|
|
|
StartIndex,
|
|
|
|
EndIndex,
|
|
|
|
EndIndex,
|
|
|
|
GMate,
|
|
|
|
GMate,
|
|
|
|
Mate,
|
|
|
|
Mate,
|
|
|
|
Ghost2LocalMap);
|
|
|
|
Ghost2LocalMap);
|
|
|
|
|
|
|
|
|
|
|
|
candidateMate[v - StartIndex] = w;
|
|
|
|
candidateMate[v - StartIndex] = w;
|
|
|
|
|
|
|
|
|
|
|
|
//End: PARALLEL_COMPUTE_CANDIDATE_MATE_B(v)
|
|
|
|
//End: PARALLEL_COMPUTE_CANDIDATE_MATE_B(v)
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
cout<<"\n("<<myRank<<")"<<v<<" Points to: "<<w; fflush(stdout);
|
|
|
|
cout<<"\n("<<myRank<<")"<<v<<" Points to: "<<w; fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
} //End of if(CandidateMate(w) = v
|
|
|
|
//If found a dominating edge:
|
|
|
|
} //End of Else
|
|
|
|
if (w >= 0) {
|
|
|
|
|
|
|
|
|
|
|
|
omp_unset_lock(&MateLock[v - StartIndex]);
|
|
|
|
//TODO is it possible to lock without a critical region?
|
|
|
|
omp_unset_lock(&MateLock[w - StartIndex]);
|
|
|
|
//TODO there must be a more elegant and efficient way to do this
|
|
|
|
|
|
|
|
while(true) {
|
|
|
|
|
|
|
|
if (omp_test_lock(&MateLock[v - StartIndex])) {
|
|
|
|
|
|
|
|
if (omp_test_lock(&MateLock[w - StartIndex])) break;
|
|
|
|
|
|
|
|
else omp_unset_lock(&MateLock[v - StartIndex]);
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
} //End of if(w >=0)
|
|
|
|
|
|
|
|
else {
|
|
|
|
|
|
|
|
adj11 = verLocPtr[v - StartIndex];
|
|
|
|
|
|
|
|
adj12 = verLocPtr[v - StartIndex + 1];
|
|
|
|
|
|
|
|
for (k1 = adj11; k1 < adj12; k1++) {
|
|
|
|
|
|
|
|
w = verLocInd[k1];
|
|
|
|
|
|
|
|
if ((w < StartIndex) || (w > EndIndex)) { //A ghost
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if ((w < StartIndex) || (w > EndIndex)) { //A ghost
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
cout<<"\n("<<myRank<<")Sending a request message:";
|
|
|
|
cout<<"\n("<<myRank<<")Sending a request message:";
|
|
|
|
cout<<"\n("<<myRank<<")Ghost is "<<w<<" Owner is: "<<findOwnerOfGhost(w, verDistance, myRank, numProcs);
|
|
|
|
cout<<"\n("<<myRank<<")Ghost is "<<w<<" Owner is: "<<findOwnerOfGhost(w, verDistance, myRank, numProcs);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
QLocalVtx.push_back(v);
|
|
|
|
ghostOwner = findOwnerOfGhost(w, verDistance, myRank, numProcs);
|
|
|
|
QGhostVtx.push_back(w);
|
|
|
|
assert(ghostOwner != -1);
|
|
|
|
QMsgType.push_back(REQUEST);
|
|
|
|
assert(ghostOwner != myRank);
|
|
|
|
ghostOwner = findOwnerOfGhost(w, verDistance, myRank, numProcs);
|
|
|
|
QOwner.push_back(ghostOwner);
|
|
|
|
assert(ghostOwner != -1);
|
|
|
|
QLocalVtx.push_back(v);
|
|
|
|
assert(ghostOwner != myRank);
|
|
|
|
QGhostVtx.push_back(w);
|
|
|
|
QOwner.push_back(ghostOwner);
|
|
|
|
QMsgType.push_back(REQUEST);
|
|
|
|
PCounter[ghostOwner]++;
|
|
|
|
PCounter[ghostOwner]++;
|
|
|
|
NumMessagesBundled++;
|
|
|
|
NumMessagesBundled++;
|
|
|
|
msgInd++;
|
|
|
|
msgInd++;
|
|
|
|
if (candidateMate[NLVer + Ghost2LocalMap[w]] == v) {
|
|
|
|
} //End of if(GHOST)
|
|
|
|
Mate[v - StartIndex] = w; //v is a local vertex
|
|
|
|
} //End of for loop
|
|
|
|
GMate[Ghost2LocalMap[w]] = v; //w is a ghost vertex
|
|
|
|
} // End of Else: w == -1
|
|
|
|
//Q.push_back(u);
|
|
|
|
//End: PARALLEL_PROCESS_EXPOSED_VERTEX_B(v)
|
|
|
|
privateU.push_back(v);
|
|
|
|
|
|
|
|
privateU.push_back(w);
|
|
|
|
} //End of If (candidateMate[v-StartIndex] == u
|
|
|
|
privateMyCard++;
|
|
|
|
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
|
|
|
|
cout<<"\n("<<myRank<<")MATCH: ("<<v<<","<<w<<") "; fflush(stdout);
|
|
|
|
if (candidateMate[NLVer + Ghost2LocalMap[w]] == v) {
|
|
|
|
#endif
|
|
|
|
Mate[v - StartIndex] = w; //v is a local vertex
|
|
|
|
//Decrement the counter:
|
|
|
|
GMate[Ghost2LocalMap[w]] = v; //w is a ghost vertex
|
|
|
|
//Start: PARALLEL_PROCESS_CROSS_EDGE_B(v,w)
|
|
|
|
//Q.push_back(u);
|
|
|
|
if (Counter[Ghost2LocalMap[w]] > 0) {
|
|
|
|
privateU.push_back(v);
|
|
|
|
Counter[Ghost2LocalMap[w]] = Counter[Ghost2LocalMap[w]] - 1; //Decrement
|
|
|
|
privateU.push_back(w);
|
|
|
|
if (Counter[Ghost2LocalMap[w]] == 0) {
|
|
|
|
privateMyCard++;
|
|
|
|
S--; //Decrement S
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
cout<<"\n("<<myRank<<")MATCH: ("<<v<<","<<w<<") "; fflush(stdout);
|
|
|
|
cout<<"\n("<<myRank<<")Decrementing S: Ghost vertex "<<w<<" has received all its messages";
|
|
|
|
|
|
|
|
fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
//Decrement the counter:
|
|
|
|
}
|
|
|
|
//Start: PARALLEL_PROCESS_CROSS_EDGE_B(v,w)
|
|
|
|
} //End of if Counter[w] > 0
|
|
|
|
if (Counter[Ghost2LocalMap[w]] > 0) {
|
|
|
|
//End: PARALLEL_PROCESS_CROSS_EDGE_B(v,w)
|
|
|
|
Counter[Ghost2LocalMap[w]] = Counter[Ghost2LocalMap[w]] - 1; //Decrement
|
|
|
|
} //End of if CandidateMate[w] = v
|
|
|
|
if (Counter[Ghost2LocalMap[w]] == 0) {
|
|
|
|
} //End of if a Ghost Vertex
|
|
|
|
S--; //Decrement S
|
|
|
|
else { //w is a local vertex
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
if (candidateMate[w - StartIndex] == v) {
|
|
|
|
cout<<"\n("<<myRank<<")Decrementing S: Ghost vertex "<<w<<" has received all its messages";
|
|
|
|
Mate[v - StartIndex] = w; //v is a local vertex
|
|
|
|
fflush(stdout);
|
|
|
|
Mate[w - StartIndex] = v; //w is a local vertex
|
|
|
|
|
|
|
|
//Q.push_back(u);
|
|
|
|
|
|
|
|
privateU.push_back(v);
|
|
|
|
|
|
|
|
privateU.push_back(w);
|
|
|
|
|
|
|
|
privateMyCard++;
|
|
|
|
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
|
|
|
|
cout<<"\n("<<myRank<<")MATCH: ("<<v<<","<<w<<") "; fflush(stdout);
|
|
|
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
} //End of if(CandidateMate(w) = v
|
|
|
|
|
|
|
|
} //End of Else
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
omp_unset_lock(&MateLock[v - StartIndex]);
|
|
|
|
|
|
|
|
omp_unset_lock(&MateLock[w - StartIndex]);
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
} //End of if(w >=0)
|
|
|
|
|
|
|
|
else {
|
|
|
|
|
|
|
|
adj11 = verLocPtr[v - StartIndex];
|
|
|
|
|
|
|
|
adj12 = verLocPtr[v - StartIndex + 1];
|
|
|
|
|
|
|
|
for (k1 = adj11; k1 < adj12; k1++) {
|
|
|
|
|
|
|
|
w = verLocInd[k1];
|
|
|
|
|
|
|
|
if ((w < StartIndex) || (w > EndIndex)) { //A ghost
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
|
|
|
|
cout<<"\n("<<myRank<<")Sending a failure message: ";
|
|
|
|
|
|
|
|
cout<<"\n("<<myRank<<")Ghost is "<<w<<" Owner is: "<<findOwnerOfGhost(w, verDistance, myRank, numProcs);
|
|
|
|
|
|
|
|
fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
/* MPI_Bsend(&Message[0], 3, MPI_INT, inputSubGraph.findOwner(w),
|
|
|
|
} //End of if Counter[w] > 0
|
|
|
|
ComputeTag, comm); */
|
|
|
|
|
|
|
|
QLocalVtx.push_back(v);
|
|
|
|
|
|
|
|
QGhostVtx.push_back(w);
|
|
|
|
|
|
|
|
QMsgType.push_back(FAILURE);
|
|
|
|
|
|
|
|
//ghostOwner = inputSubGraph.findOwner(w);
|
|
|
|
|
|
|
|
ghostOwner = findOwnerOfGhost(w, verDistance, myRank, numProcs);
|
|
|
|
|
|
|
|
assert(ghostOwner != -1);
|
|
|
|
|
|
|
|
assert(ghostOwner != myRank);
|
|
|
|
|
|
|
|
QOwner.push_back(ghostOwner);
|
|
|
|
|
|
|
|
PCounter[ghostOwner]++;
|
|
|
|
|
|
|
|
NumMessagesBundled++;
|
|
|
|
|
|
|
|
msgInd++;
|
|
|
|
|
|
|
|
} //End of if(GHOST)
|
|
|
|
|
|
|
|
} //End of for loop
|
|
|
|
|
|
|
|
} // End of Else: w == -1
|
|
|
|
|
|
|
|
//End: PARALLEL_PROCESS_EXPOSED_VERTEX_B(v)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
} //End of If (candidateMate[v-StartIndex] == u
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
} //End of critical region if
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
} //End of if ( (v >= StartIndex) && (v <= EndIndex) ) //If Local Vertex:
|
|
|
|
|
|
|
|
else { //Neighbor is a ghost vertex
|
|
|
|
|
|
|
|
|
|
|
|
#pragma omp critical(innerProcessMatched)
|
|
|
|
#pragma omp critical(innerProcessMatched)
|
|
|
|
{
|
|
|
|
{
|
|
|
|
|
|
|
|
|
|
|
|
while(!omp_test_lock(&MateLock[u - StartIndex]));
|
|
|
|
while(!omp_test_lock(&MateLock[u - StartIndex]));
|
|
|
|
|
|
|
|
|
|
|
|
if (candidateMate[NLVer + Ghost2LocalMap[v]] == u)
|
|
|
|
if (candidateMate[NLVer + Ghost2LocalMap[v]] == u)
|
|
|
|
candidateMate[NLVer + Ghost2LocalMap[v]] = -1;
|
|
|
|
candidateMate[NLVer + Ghost2LocalMap[v]] = -1;
|
|
|
|
if (v != Mate[u - StartIndex]) { //u is local
|
|
|
|
if (v != Mate[u - StartIndex]) { //u is local
|
|
|
|
//Build the Message Packet:
|
|
|
|
//Build the Message Packet:
|
|
|
|
//Message[0] = u; //LOCAL
|
|
|
|
//Message[0] = u; //LOCAL
|
|
|
|
//Message[1] = v; //GHOST
|
|
|
|
//Message[1] = v; //GHOST
|
|
|
|
//Message[2] = SUCCESS; //TYPE
|
|
|
|
//Message[2] = SUCCESS; //TYPE
|
|
|
|
//Send a Request (Asynchronous)
|
|
|
|
//Send a Request (Asynchronous)
|
|
|
|
|
|
|
|
|
|
|
|
if (candidateMate[w - StartIndex] == v) {
|
|
|
|
|
|
|
|
Mate[v - StartIndex] = w; //v is a local vertex
|
|
|
|
|
|
|
|
Mate[w - StartIndex] = v; //w is a local vertex
|
|
|
|
|
|
|
|
privateU.push_back(v);
|
|
|
|
|
|
|
|
privateU.push_back(w);
|
|
|
|
|
|
|
|
privateMyCard++;
|
|
|
|
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
cout<<"\n("<<myRank<<")MATCH: ("<<v<<","<<w<<") "; fflush(stdout);
|
|
|
|
cout<<"\n("<<myRank<<")Sending a success message: ";
|
|
|
|
|
|
|
|
cout<<"\n("<<myRank<<")Ghost is "<<v<<" Owner is: "<<findOwnerOfGhost(v, verDistance, myRank, numProcs)<<"\n"; fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
} //End of if(CandidateMate(w) = v
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
QLocalVtx.push_back(u);
|
|
|
|
QLocalVtx.push_back(u);
|
|
|
|
QGhostVtx.push_back(v);
|
|
|
|
QGhostVtx.push_back(v);
|
|
|
|
QMsgType.push_back(SUCCESS);
|
|
|
|
QMsgType.push_back(SUCCESS);
|
|
|
|
ghostOwner = findOwnerOfGhost(v, verDistance, myRank, numProcs);
|
|
|
|
ghostOwner = findOwnerOfGhost(v, verDistance, myRank, numProcs);
|
|
|
|
assert(ghostOwner != -1);
|
|
|
|
assert(ghostOwner != -1);
|
|
|
|
assert(ghostOwner != myRank);
|
|
|
|
assert(ghostOwner != myRank);
|
|
|
|
QOwner.push_back(ghostOwner);
|
|
|
|
QOwner.push_back(ghostOwner);
|
|
|
|
PCounter[ghostOwner]++;
|
|
|
|
PCounter[ghostOwner]++;
|
|
|
|
NumMessagesBundled++;
|
|
|
|
NumMessagesBundled++;
|
|
|
|
msgInd++;
|
|
|
|
msgInd++;
|
|
|
|
} //End of If( v != Mate[u] )
|
|
|
|
} //End of If( v != Mate[u] )
|
|
|
|
|
|
|
|
|
|
|
|
omp_unset_lock(&MateLock[u - StartIndex]);
|
|
|
|
omp_unset_lock(&MateLock[u - StartIndex]);
|
|
|
|
|
|
|
|
|
|
|
|
} //End of critical region
|
|
|
|
} //End of critical region
|
|
|
|
} //End of Else //A Ghost Vertex
|
|
|
|
} //End of Else //A Ghost Vertex
|
|
|
|
|
|
|
|
|
|
|
|
} //End of For Loop adj(u)
|
|
|
|
} //End of For Loop adj(u)
|
|
|
|
|
|
|
|
|
|
|
|
} //End of if ( (u >= StartIndex) && (u <= EndIndex) ) //Process Only If a Local Vertex
|
|
|
|
} //End of if ( (u >= StartIndex) && (u <= EndIndex) ) //Process Only If a Local Vertex
|
|
|
|
|
|
|
|
|
|
|
|
//Avoid to ask for the critical section if there is nothing to add
|
|
|
|
//Avoid to ask for the critical section if there is nothing to add
|
|
|
|
if (privateU.size() < UCHUNK && !U.empty()) continue;
|
|
|
|
if (privateU.size() < UCHUNK && !U.empty()) continue;
|
|
|
|
#pragma omp critical(U)
|
|
|
|
#pragma omp critical(U)
|
|
|
|
{
|
|
|
|
{
|
|
|
|
while (!privateU.empty()) {
|
|
|
|
while (!privateU.empty()) {
|
|
|
|
U.push_back(privateU.pop_front());
|
|
|
|
U.push_back(privateU.pop_front());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
myCard += privateMyCard;
|
|
|
|
myCard += privateMyCard;
|
|
|
|
} //End of critical U
|
|
|
|
} //End of critical U
|
|
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} //End of while ( /*!Q.empty()*/ !U.empty() )
|
|
|
|
} //End of while ( /*!Q.empty()*/ !U.empty() )
|
|
|
|
|
|
|
|
|
|
|
|
#pragma omp critical(privateMsg)
|
|
|
|
#pragma omp critical(privateMsg)
|
|
|
|
{
|
|
|
|
{
|
|
|
@ -938,20 +924,20 @@ void dalgoDistEdgeApproxDomEdgesLinearSearchMesgBndlSmallMateCMP(
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#ifdef COUNT_LOCAL_VERTEX
|
|
|
|
#ifdef COUNT_LOCAL_VERTEX
|
|
|
|
printf("Count local vertexes: %ld for thread %d of processor %d\n",
|
|
|
|
printf("Count local vertexes: %ld for thread %d of processor %d\n",
|
|
|
|
localVertices,
|
|
|
|
localVertices,
|
|
|
|
omp_get_thread_num(),
|
|
|
|
omp_get_thread_num(),
|
|
|
|
myRank);
|
|
|
|
myRank);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
///////////////////////// END OF PROCESS MATCHED VERTICES /////////////////////////
|
|
|
|
///////////////////////// END OF PROCESS MATCHED VERTICES /////////////////////////
|
|
|
|
#ifdef DEBUG_HANG_
|
|
|
|
#ifdef DEBUG_HANG_
|
|
|
|
if (myRank == 0) cout<<"\n("<<myRank<<") Send Bundles" <<endl; fflush(stdout);
|
|
|
|
if (myRank == 0) cout<<"\n("<<myRank<<") Send Bundles" <<endl; fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
/////////////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/////////////////////////////////////////////////////////////////////////////////////////
|
|
|
|
///////////////////////////// SEND BUNDLED MESSAGES /////////////////////////////////////
|
|
|
|
///////////////////////////// SEND BUNDLED MESSAGES /////////////////////////////////////
|
|
|
|
/////////////////////////////////////////////////////////////////////////////////////////
|
|
|
|
/////////////////////////////////////////////////////////////////////////////////////////
|
|
|
|
#pragma omp barrier
|
|
|
|
#pragma omp barrier
|
|
|
|
#pragma omp master
|
|
|
|
#pragma omp master
|
|
|
|
{
|
|
|
|
{
|
|
|
@ -980,15 +966,15 @@ void dalgoDistEdgeApproxDomEdgesLinearSearchMesgBndlSmallMateCMP(
|
|
|
|
//Build the Message Bundle packet:
|
|
|
|
//Build the Message Bundle packet:
|
|
|
|
|
|
|
|
|
|
|
|
//OMP Not parallelizable
|
|
|
|
//OMP Not parallelizable
|
|
|
|
for (MilanInt i=0; i<NumMessagesBundled; i++) { // Changed by Fabio to be an integer, addresses needs to be integers!
|
|
|
|
for (MilanInt i=0; i<NumMessagesBundled; i++) { // Changed by Fabio to be an integer, addresses needs to be integers!
|
|
|
|
myIndex = ( PCumulative[QOwner[i]] + PCounter[QOwner[i]] )*3;
|
|
|
|
myIndex = ( PCumulative[QOwner[i]] + PCounter[QOwner[i]] )*3;
|
|
|
|
PMessageBundle[myIndex+0] = QLocalVtx[i];
|
|
|
|
PMessageBundle[myIndex+0] = QLocalVtx[i];
|
|
|
|
PMessageBundle[myIndex+1] = QGhostVtx[i];
|
|
|
|
PMessageBundle[myIndex+1] = QGhostVtx[i];
|
|
|
|
PMessageBundle[myIndex+2] = QMsgType[i];
|
|
|
|
PMessageBundle[myIndex+2] = QMsgType[i];
|
|
|
|
PCounter[QOwner[i]]++;
|
|
|
|
PCounter[QOwner[i]]++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
//Send the Bundled Messages: Use ISend
|
|
|
|
//Send the Bundled Messages: Use ISend
|
|
|
|
|
|
|
|
|
|
|
|
try {
|
|
|
|
try {
|
|
|
|
SRequest.reserve(numProcs * 2); //At most two messages per processor
|
|
|
|
SRequest.reserve(numProcs * 2); //At most two messages per processor
|
|
|
@ -1044,7 +1030,7 @@ void dalgoDistEdgeApproxDomEdgesLinearSearchMesgBndlSmallMateCMP(
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
cout<<"\n("<<myRank<<")Number of Ghost edges = "<<numGhostEdges;
|
|
|
|
cout<<"\n("<<myRank<<")Number of Ghost edges = "<<numGhostEdges;
|
|
|
|
cout<<"\n("<<myRank<<")Total number of potential message X 2 = "<<numGhostEdges*2;
|
|
|
|
cout<<"\n("<<myRank<<")Total number of potential message X 2 = "<<numGhostEdges*2;
|
|
|
|
cout<<"\n("<<myRank<<")Number messages already sent in bundles = "<<NumMessagesBundled;
|
|
|
|
cout<<"\n("<<myRank<<")Number messages already sent in bundles = "<<NumMessagesBundled;
|
|
|
|
if (numGhostEdges>0) {
|
|
|
|
if (numGhostEdges>0) {
|
|
|
@ -1053,21 +1039,21 @@ void dalgoDistEdgeApproxDomEdgesLinearSearchMesgBndlSmallMateCMP(
|
|
|
|
fflush(stdout);
|
|
|
|
fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
|
|
//Allocate memory for MPI Send messages:
|
|
|
|
//Allocate memory for MPI Send messages:
|
|
|
|
/* WILL COME BACK HERE - NO NEED TO STORE ALL THIS MEMORY !! */
|
|
|
|
/* WILL COME BACK HERE - NO NEED TO STORE ALL THIS MEMORY !! */
|
|
|
|
OneMessageSize=0;
|
|
|
|
OneMessageSize=0;
|
|
|
|
MPI_Pack_size(3, TypeMap<MilanLongInt>(), comm, &OneMessageSize); //Size of one message packet
|
|
|
|
MPI_Pack_size(3, TypeMap<MilanLongInt>(), comm, &OneMessageSize); //Size of one message packet
|
|
|
|
//How many messages to send?
|
|
|
|
//How many messages to send?
|
|
|
|
//Potentially three kinds of messages will be sent/received:
|
|
|
|
//Potentially three kinds of messages will be sent/received:
|
|
|
|
//Request, Success, Failure.
|
|
|
|
//Request, Success, Failure.
|
|
|
|
//But only two will be sent from a given processor.
|
|
|
|
//But only two will be sent from a given processor.
|
|
|
|
//Substract the number of messages that have already been sent as bundled messages:
|
|
|
|
//Substract the number of messages that have already been sent as bundled messages:
|
|
|
|
numMessagesToSend = numGhostEdges*2 - NumMessagesBundled;
|
|
|
|
numMessagesToSend = numGhostEdges*2 - NumMessagesBundled;
|
|
|
|
BufferSize = (OneMessageSize+MPI_BSEND_OVERHEAD)*numMessagesToSend;
|
|
|
|
BufferSize = (OneMessageSize+MPI_BSEND_OVERHEAD)*numMessagesToSend;
|
|
|
|
|
|
|
|
|
|
|
|
Buffer=0;
|
|
|
|
Buffer=0;
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
#ifdef PRINT_DEBUG_INFO_
|
|
|
|
cout<<"\n("<<myRank<<")Size of One Message from PACK= "<<OneMessageSize;
|
|
|
|
cout<<"\n("<<myRank<<")Size of One Message from PACK= "<<OneMessageSize;
|
|
|
|
cout<<"\n("<<myRank<<")Size of Message overhead = "<<MPI_BSEND_OVERHEAD;
|
|
|
|
cout<<"\n("<<myRank<<")Size of Message overhead = "<<MPI_BSEND_OVERHEAD;
|
|
|
|
cout<<"\n("<<myRank<<")Number of Ghost edges = "<<numGhostEdges;
|
|
|
|
cout<<"\n("<<myRank<<")Number of Ghost edges = "<<numGhostEdges;
|
|
|
|
cout<<"\n("<<myRank<<")Number of remaining message = "<<numMessagesToSend;
|
|
|
|
cout<<"\n("<<myRank<<")Number of remaining message = "<<numMessagesToSend;
|
|
|
@ -1075,15 +1061,15 @@ void dalgoDistEdgeApproxDomEdgesLinearSearchMesgBndlSmallMateCMP(
|
|
|
|
cout<<"\n("<<myRank<<")Attaching Buffer on.. ";
|
|
|
|
cout<<"\n("<<myRank<<")Attaching Buffer on.. ";
|
|
|
|
fflush(stdout);
|
|
|
|
fflush(stdout);
|
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
if ( BufferSize > 0 ) {
|
|
|
|
if ( BufferSize > 0 ) {
|
|
|
|
Buffer = (MilanLongInt *) malloc(BufferSize); //Allocate memory
|
|
|
|
Buffer = (MilanLongInt *) malloc(BufferSize); //Allocate memory
|
|
|
|
if ( Buffer == 0 ) {
|
|
|
|
if ( Buffer == 0 ) {
|
|
|
|
cout<<"Error in function algoDistEdgeApproxDominatingEdgesLinearSearch: \n";
|
|
|
|
cout<<"Error in function algoDistEdgeApproxDominatingEdgesLinearSearch: \n";
|
|
|
|
cout<<"Not enough memory to allocate for send buffer on process "<<myRank<<"\n";
|
|
|
|
cout<<"Not enough memory to allocate for send buffer on process "<<myRank<<"\n";
|
|
|
|
exit(1);
|
|
|
|
exit(1);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
MPI_Buffer_attach(Buffer, BufferSize); //Attach the Buffer
|
|
|
|
MPI_Buffer_attach(Buffer, BufferSize); //Attach the Buffer
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} //End of master
|
|
|
|
} //End of master
|
|
|
|
|
|
|
|
|
|
|
|
} // end of parallel region
|
|
|
|
} // end of parallel region
|
|
|
@ -1707,10 +1693,10 @@ inline MilanInt findOwnerOfGhost(MilanLongInt vtxIndex, MilanLongInt *mVerDistan
|
|
|
|
* @return
|
|
|
|
* @return
|
|
|
|
*/
|
|
|
|
*/
|
|
|
|
inline MilanLongInt firstComputeCandidateMate(MilanLongInt adj1,
|
|
|
|
inline MilanLongInt firstComputeCandidateMate(MilanLongInt adj1,
|
|
|
|
MilanLongInt adj2,
|
|
|
|
MilanLongInt adj2,
|
|
|
|
MilanLongInt* verLocInd,
|
|
|
|
MilanLongInt* verLocInd,
|
|
|
|
MilanReal* edgeLocWeight)
|
|
|
|
MilanReal* edgeLocWeight)
|
|
|
|
{
|
|
|
|
{
|
|
|
|
MilanInt w = -1;
|
|
|
|
MilanInt w = -1;
|
|
|
|
MilanReal heaviestEdgeWt = MilanRealMin; //Assign the smallest Value possible first LDBL_MIN
|
|
|
|
MilanReal heaviestEdgeWt = MilanRealMin; //Assign the smallest Value possible first LDBL_MIN
|
|
|
|
int finalK;
|
|
|
|
int finalK;
|
|
|
@ -1738,12 +1724,12 @@ inline MilanLongInt firstComputeCandidateMate(MilanLongInt adj1,
|
|
|
|
* @return
|
|
|
|
* @return
|
|
|
|
*/
|
|
|
|
*/
|
|
|
|
inline bool isAlreadyMatched(MilanLongInt node,
|
|
|
|
inline bool isAlreadyMatched(MilanLongInt node,
|
|
|
|
MilanLongInt StartIndex,
|
|
|
|
MilanLongInt StartIndex,
|
|
|
|
MilanLongInt EndIndex,
|
|
|
|
MilanLongInt EndIndex,
|
|
|
|
vector <MilanLongInt> &GMate,
|
|
|
|
vector <MilanLongInt> &GMate,
|
|
|
|
MilanLongInt* Mate,
|
|
|
|
MilanLongInt* Mate,
|
|
|
|
map <MilanLongInt, MilanLongInt> &Ghost2LocalMap
|
|
|
|
map <MilanLongInt, MilanLongInt> &Ghost2LocalMap
|
|
|
|
) {
|
|
|
|
) {
|
|
|
|
|
|
|
|
|
|
|
|
bool result = false;
|
|
|
|
bool result = false;
|
|
|
|
#pragma omp critical(Mate)
|
|
|
|
#pragma omp critical(Mate)
|
|
|
@ -1776,15 +1762,15 @@ inline bool isAlreadyMatched(MilanLongInt node,
|
|
|
|
* @return
|
|
|
|
* @return
|
|
|
|
*/
|
|
|
|
*/
|
|
|
|
inline MilanLongInt computeCandidateMate(MilanLongInt adj1,
|
|
|
|
inline MilanLongInt computeCandidateMate(MilanLongInt adj1,
|
|
|
|
MilanLongInt adj2,
|
|
|
|
MilanLongInt adj2,
|
|
|
|
MilanReal* edgeLocWeight,
|
|
|
|
MilanReal* edgeLocWeight,
|
|
|
|
MilanLongInt k,
|
|
|
|
MilanLongInt k,
|
|
|
|
MilanLongInt* verLocInd,
|
|
|
|
MilanLongInt* verLocInd,
|
|
|
|
MilanLongInt StartIndex,
|
|
|
|
MilanLongInt StartIndex,
|
|
|
|
MilanLongInt EndIndex,
|
|
|
|
MilanLongInt EndIndex,
|
|
|
|
vector <MilanLongInt>& GMate,
|
|
|
|
vector <MilanLongInt>& GMate,
|
|
|
|
MilanLongInt* Mate,
|
|
|
|
MilanLongInt* Mate,
|
|
|
|
map <MilanLongInt, MilanLongInt>& Ghost2LocalMap)
|
|
|
|
map <MilanLongInt, MilanLongInt>& Ghost2LocalMap)
|
|
|
|
{
|
|
|
|
{
|
|
|
|
MilanInt w = -1;
|
|
|
|
MilanInt w = -1;
|
|
|
|
MilanReal heaviestEdgeWt = MilanRealMin; //Assign the smallest Value possible first LDBL_MIN
|
|
|
|
MilanReal heaviestEdgeWt = MilanRealMin; //Assign the smallest Value possible first LDBL_MIN
|
|
|
|