Skip to content
Snippets Groups Projects
Commit 1e29ce7a authored by Anna Wellmann's avatar Anna Wellmann
Browse files

Use function to find send and receive neighbors in exchange

parent e00aee75
No related branches found
No related tags found
1 merge request!104Add Communication Hiding to GPU version
......@@ -111,11 +111,8 @@ void exchangeCollDataXGPU27(Parameter *para, vf::gpu::Communicator *comm, CudaMe
void prepareExchangeCollDataYGPU27(Parameter *para, int level, int streamIndex, bool useReducedCommunicationAfterFtoC)
{
cudaStream_t stream = (streamIndex == -1) ? CU_STREAM_LEGACY : para->getStreamManager()->getStream(streamIndex);
std::vector<ProcessNeighbor27> *sendProcessNeighbor;
if (useReducedCommunicationAfterFtoC)
sendProcessNeighbor = &para->getParD(level)->sendProcessNeighborsAfterFtoCY;
else
sendProcessNeighbor = &para->getParD(level)->sendProcessNeighborY;
std::vector<ProcessNeighbor27> *sendProcessNeighbor =
getSendProcessNeighborY(useReducedCommunicationAfterFtoC, para, level);
for (unsigned int i = 0; i < (unsigned int)(para->getNumberOfProcessNeighborsY(level, "send")); i++)
GetSendFsPostDev27(para->getParD(level)->d0SP.f[0],
......@@ -132,9 +129,14 @@ void prepareExchangeCollDataYGPU27(Parameter *para, int level, int streamIndex,
}
void exchangeCollDataYGPU27(Parameter *para, vf::gpu::Communicator *comm, CudaMemoryManager *cudaManager, int level,
int streamIndex)
int streamIndex, bool useReducedCommunicationAfterFtoC)
{
cudaStream_t stream = (streamIndex == -1) ? CU_STREAM_LEGACY : para->getStreamManager()->getStream(streamIndex);
std::vector<ProcessNeighbor27> *sendProcessNeighbor =
getSendProcessNeighborY(useReducedCommunicationAfterFtoC, para, level);
std::vector<ProcessNeighbor27> *recvProcessNeighbor =
getRecvProcessNeighborY(useReducedCommunicationAfterFtoC, para, level);
///////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
//copy Device to Host
for (unsigned int i = 0; i < (unsigned int)(para->getNumberOfProcessNeighborsY(level, "send")); i++)
......@@ -218,6 +220,24 @@ void exchangeCollDataYGPU27(Parameter *para, vf::gpu::Communicator *comm, CudaMe
}
///////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
}
std::vector<ProcessNeighbor27> *getSendProcessNeighborY(bool useReducedCommunicationAfterFtoC, Parameter *para,
int level)
{
if (useReducedCommunicationAfterFtoC)
return &para->getParD(level)->sendProcessNeighborsAfterFtoCY;
else
return &para->getParD(level)->sendProcessNeighborY;
}
std::vector<ProcessNeighbor27> *getRecvProcessNeighborY(bool useReducedCommunicationAfterFtoC, Parameter *para,
int level)
{
if (useReducedCommunicationAfterFtoC)
return &para->getParD(level)->recvProcessNeighborsAfterFtoCY;
else
return &para->getParD(level)->recvProcessNeighborY;
}
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
......
......@@ -17,9 +17,11 @@ extern "C" void exchangePostCollDataGPU27(Parameter* para, vf::gpu::Communicator
extern "C" void prepareExchangeCollDataXGPU27(Parameter *para, int level, int streamIndex);
extern "C" void exchangeCollDataXGPU27(Parameter *para, vf::gpu::Communicator *comm, CudaMemoryManager *cudaManager,
int level, int streamIndex);
extern "C" void prepareExchangeCollDataYGPU27(Parameter *para, int level, int streamIndex, bool useReducedCommunicationAfterFtoC = false);
extern "C" void prepareExchangeCollDataYGPU27(Parameter *para, int level, int streamIndex,
bool useReducedCommunicationAfterFtoC = false);
std::vector<ProcessNeighbor27> *getSendProcessNeighborY(bool useReducedCommunicationAfterFtoC, Parameter *para, int level);
extern "C" void exchangeCollDataYGPU27(Parameter *para, vf::gpu::Communicator *comm, CudaMemoryManager *cudaManager,
int level, int streamIndex);
int level, int streamIndex, bool useReducedCommunicationAfterFtoC = false);
extern "C" void prepareExchangeCollDataZGPU27(Parameter *para, int level, int streamIndex);
extern "C" void exchangeCollDataZGPU27(Parameter *para, vf::gpu::Communicator *comm, CudaMemoryManager *cudaManager,
int level, int streamIndex);
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment