[591] | 1 | #include "xios_spl.hpp" |
---|
[300] | 2 | #include "context_client.hpp" |
---|
| 3 | #include "context_server.hpp" |
---|
| 4 | #include "event_client.hpp" |
---|
| 5 | #include "buffer_out.hpp" |
---|
| 6 | #include "buffer_client.hpp" |
---|
| 7 | #include "type.hpp" |
---|
| 8 | #include "event_client.hpp" |
---|
| 9 | #include "context.hpp" |
---|
[382] | 10 | #include "mpi.hpp" |
---|
[347] | 11 | #include "timer.hpp" |
---|
[401] | 12 | #include "cxios.hpp" |
---|
[300] | 13 | |
---|
[335] | 14 | namespace xios |
---|
[300] | 15 | { |
---|
[512] | 16 | /*! |
---|
| 17 | \param [in] parent Pointer to context on client side |
---|
| 18 | \param [in] intraComm_ communicator of group client |
---|
| 19 | \param [in] interComm_ communicator of group server |
---|
| 20 | \cxtSer [in] cxtSer Pointer to context of server side. (It is only used on case of attached mode) |
---|
| 21 | */ |
---|
[595] | 22 | CContextClient::CContextClient(CContext* parent, MPI_Comm intraComm_, MPI_Comm interComm_, CContext* cxtSer) |
---|
[917] | 23 | : mapBufferSize_(), parentServer(cxtSer), maxBufferedEvents(4) |
---|
[300] | 24 | { |
---|
[595] | 25 | context = parent; |
---|
| 26 | intraComm = intraComm_; |
---|
| 27 | interComm = interComm_; |
---|
| 28 | MPI_Comm_rank(intraComm, &clientRank); |
---|
| 29 | MPI_Comm_size(intraComm, &clientSize); |
---|
[509] | 30 | |
---|
[595] | 31 | int flag; |
---|
| 32 | MPI_Comm_test_inter(interComm, &flag); |
---|
| 33 | if (flag) MPI_Comm_remote_size(interComm, &serverSize); |
---|
| 34 | else MPI_Comm_size(interComm, &serverSize); |
---|
[509] | 35 | |
---|
[595] | 36 | if (clientSize < serverSize) |
---|
| 37 | { |
---|
| 38 | int serverByClient = serverSize / clientSize; |
---|
| 39 | int remain = serverSize % clientSize; |
---|
| 40 | int rankStart = serverByClient * clientRank; |
---|
[300] | 41 | |
---|
[595] | 42 | if (clientRank < remain) |
---|
| 43 | { |
---|
| 44 | serverByClient++; |
---|
| 45 | rankStart += clientRank; |
---|
| 46 | } |
---|
| 47 | else |
---|
| 48 | rankStart += remain; |
---|
| 49 | |
---|
| 50 | for (int i = 0; i < serverByClient; i++) |
---|
| 51 | ranksServerLeader.push_back(rankStart + i); |
---|
[988] | 52 | |
---|
| 53 | ranksServerNotLeader.resize(0); |
---|
[595] | 54 | } |
---|
| 55 | else |
---|
| 56 | { |
---|
| 57 | int clientByServer = clientSize / serverSize; |
---|
| 58 | int remain = clientSize % serverSize; |
---|
| 59 | |
---|
| 60 | if (clientRank < (clientByServer + 1) * remain) |
---|
| 61 | { |
---|
| 62 | if (clientRank % (clientByServer + 1) == 0) |
---|
| 63 | ranksServerLeader.push_back(clientRank / (clientByServer + 1)); |
---|
[988] | 64 | else |
---|
| 65 | ranksServerNotLeader.push_back(clientRank / (clientByServer + 1)); |
---|
[595] | 66 | } |
---|
| 67 | else |
---|
| 68 | { |
---|
| 69 | int rank = clientRank - (clientByServer + 1) * remain; |
---|
| 70 | if (rank % clientByServer == 0) |
---|
| 71 | ranksServerLeader.push_back(remain + rank / clientByServer); |
---|
[988] | 72 | else |
---|
| 73 | ranksServerNotLeader.push_back(remain + rank / clientByServer); |
---|
| 74 | } |
---|
[595] | 75 | } |
---|
| 76 | |
---|
| 77 | timeLine = 0; |
---|
[300] | 78 | } |
---|
| 79 | |
---|
[512] | 80 | /*! |
---|
| 81 | In case of attached mode, the current context must be reset to context for client |
---|
| 82 | \param [in] event Event sent to server |
---|
| 83 | */ |
---|
[300] | 84 | void CContextClient::sendEvent(CEventClient& event) |
---|
| 85 | { |
---|
[731] | 86 | list<int> ranks = event.getRanks(); |
---|
[1033] | 87 | |
---|
[595] | 88 | if (!event.isEmpty()) |
---|
[300] | 89 | { |
---|
[731] | 90 | list<int> sizes = event.getSizes(); |
---|
[300] | 91 | |
---|
[1033] | 92 | // We force the getBuffers call to be non-blocking on the servers |
---|
| 93 | list<CBufferOut*> buffList; |
---|
| 94 | bool couldBuffer = getBuffers(ranks, sizes, buffList, !CXios::isClient); |
---|
[509] | 95 | |
---|
[1033] | 96 | if (couldBuffer) |
---|
| 97 | { |
---|
| 98 | event.send(timeLine, sizes, buffList); |
---|
[731] | 99 | |
---|
[1033] | 100 | checkBuffers(ranks); |
---|
| 101 | |
---|
| 102 | if (isAttachedModeEnabled()) // couldBuffer is always true in attached mode |
---|
| 103 | { |
---|
| 104 | waitEvent(ranks); |
---|
| 105 | CContext::setCurrent(context->getId()); |
---|
| 106 | } |
---|
| 107 | } |
---|
| 108 | else |
---|
| 109 | { |
---|
| 110 | tmpBufferedEvent.ranks = ranks; |
---|
| 111 | tmpBufferedEvent.sizes = sizes; |
---|
| 112 | |
---|
| 113 | for (list<int>::const_iterator it = sizes.begin(); it != sizes.end(); it++) |
---|
| 114 | tmpBufferedEvent.buffers.push_back(new CBufferOut(*it)); |
---|
| 115 | |
---|
| 116 | event.send(timeLine, tmpBufferedEvent.sizes, tmpBufferedEvent.buffers); |
---|
| 117 | } |
---|
[300] | 118 | } |
---|
| 119 | |
---|
[1033] | 120 | timeLine++; |
---|
| 121 | } |
---|
| 122 | |
---|
| 123 | /*! |
---|
| 124 | * Send the temporarily buffered event (if any). |
---|
| 125 | * |
---|
| 126 | * \return true if a temporarily buffered event could be sent, false otherwise |
---|
| 127 | */ |
---|
| 128 | bool CContextClient::sendTemporarilyBufferedEvent() |
---|
| 129 | { |
---|
| 130 | bool couldSendTmpBufferedEvent = false; |
---|
| 131 | |
---|
| 132 | if (hasTemporarilyBufferedEvent()) |
---|
[511] | 133 | { |
---|
[1033] | 134 | list<CBufferOut*> buffList; |
---|
| 135 | if (getBuffers(tmpBufferedEvent.ranks, tmpBufferedEvent.sizes, buffList, true)) // Non-blocking call |
---|
| 136 | { |
---|
| 137 | list<CBufferOut*>::iterator it, itBuffer; |
---|
| 138 | |
---|
| 139 | for (it = tmpBufferedEvent.buffers.begin(), itBuffer = buffList.begin(); it != tmpBufferedEvent.buffers.end(); it++, itBuffer++) |
---|
| 140 | (*itBuffer)->put((char*)(*it)->start(), (*it)->count()); |
---|
| 141 | |
---|
| 142 | checkBuffers(tmpBufferedEvent.ranks); |
---|
| 143 | |
---|
| 144 | tmpBufferedEvent.clear(); |
---|
| 145 | |
---|
| 146 | couldSendTmpBufferedEvent = true; |
---|
| 147 | } |
---|
[511] | 148 | } |
---|
| 149 | |
---|
[1033] | 150 | return couldSendTmpBufferedEvent; |
---|
[300] | 151 | } |
---|
[509] | 152 | |
---|
[512] | 153 | /*! |
---|
| 154 | If client is also server (attached mode), after sending event, it should process right away |
---|
| 155 | the incoming event. |
---|
| 156 | \param [in] ranks list rank of server connected this client |
---|
| 157 | */ |
---|
[300] | 158 | void CContextClient::waitEvent(list<int>& ranks) |
---|
| 159 | { |
---|
[595] | 160 | parentServer->server->setPendingEvent(); |
---|
| 161 | while (checkBuffers(ranks)) |
---|
[300] | 162 | { |
---|
[595] | 163 | parentServer->server->listen(); |
---|
| 164 | parentServer->server->checkPendingRequest(); |
---|
[300] | 165 | } |
---|
[386] | 166 | |
---|
[595] | 167 | while (parentServer->server->hasPendingEvent()) |
---|
[386] | 168 | { |
---|
[595] | 169 | parentServer->server->eventLoop(); |
---|
[386] | 170 | } |
---|
[300] | 171 | } |
---|
| 172 | |
---|
[512] | 173 | /*! |
---|
[1033] | 174 | * Get buffers for each connection to the servers. This function blocks until there is enough room in the buffers unless |
---|
| 175 | * it is explicitly requested to be non-blocking. |
---|
| 176 | * |
---|
| 177 | * \param [in] serverList list of rank of connected server |
---|
| 178 | * \param [in] sizeList size of message corresponding to each connection |
---|
| 179 | * \param [out] retBuffers list of buffers that can be used to store an event |
---|
| 180 | * \param [in] nonBlocking whether this function should be non-blocking |
---|
| 181 | * \return whether the already allocated buffers could be used |
---|
[512] | 182 | */ |
---|
[1033] | 183 | bool CContextClient::getBuffers(const list<int>& serverList, const list<int>& sizeList, list<CBufferOut*>& retBuffers, bool nonBlocking /*= false*/) |
---|
[300] | 184 | { |
---|
[1033] | 185 | list<int>::const_iterator itServer, itSize; |
---|
[595] | 186 | list<CClientBuffer*> bufferList; |
---|
[1033] | 187 | map<int,CClientBuffer*>::const_iterator it; |
---|
[595] | 188 | list<CClientBuffer*>::iterator itBuffer; |
---|
[884] | 189 | bool areBuffersFree; |
---|
[300] | 190 | |
---|
[595] | 191 | for (itServer = serverList.begin(); itServer != serverList.end(); itServer++) |
---|
[300] | 192 | { |
---|
[595] | 193 | it = buffers.find(*itServer); |
---|
| 194 | if (it == buffers.end()) |
---|
[300] | 195 | { |
---|
[595] | 196 | newBuffer(*itServer); |
---|
| 197 | it = buffers.find(*itServer); |
---|
[509] | 198 | } |
---|
[595] | 199 | bufferList.push_back(it->second); |
---|
[300] | 200 | } |
---|
[347] | 201 | |
---|
| 202 | CTimer::get("Blocking time").resume(); |
---|
[884] | 203 | do |
---|
[300] | 204 | { |
---|
[884] | 205 | areBuffersFree = true; |
---|
[595] | 206 | for (itBuffer = bufferList.begin(), itSize = sizeList.begin(); itBuffer != bufferList.end(); itBuffer++, itSize++) |
---|
[884] | 207 | areBuffersFree &= (*itBuffer)->isBufferFree(*itSize); |
---|
| 208 | |
---|
| 209 | if (!areBuffersFree) |
---|
[300] | 210 | { |
---|
[884] | 211 | checkBuffers(); |
---|
| 212 | context->server->listen(); |
---|
[300] | 213 | } |
---|
[1033] | 214 | } while (!areBuffersFree && !nonBlocking); |
---|
[347] | 215 | CTimer::get("Blocking time").suspend(); |
---|
| 216 | |
---|
[1033] | 217 | if (areBuffersFree) |
---|
[300] | 218 | { |
---|
[1033] | 219 | for (itBuffer = bufferList.begin(), itSize = sizeList.begin(); itBuffer != bufferList.end(); itBuffer++, itSize++) |
---|
| 220 | retBuffers.push_back((*itBuffer)->getBuffer(*itSize)); |
---|
[300] | 221 | } |
---|
[1033] | 222 | |
---|
| 223 | return areBuffersFree; |
---|
[300] | 224 | } |
---|
[509] | 225 | |
---|
[512] | 226 | /*! |
---|
| 227 | Make a new buffer for a certain connection to server with specific rank |
---|
| 228 | \param [in] rank rank of connected server |
---|
| 229 | */ |
---|
[300] | 230 | void CContextClient::newBuffer(int rank) |
---|
| 231 | { |
---|
[724] | 232 | if (!mapBufferSize_.count(rank)) |
---|
| 233 | { |
---|
| 234 | error(0) << "WARNING: Unexpected request for buffer to communicate with server " << rank << std::endl; |
---|
| 235 | mapBufferSize_[rank] = CXios::minBufferSize; |
---|
[1192] | 236 | maxEventSizes[rank] = CXios::minBufferSize; |
---|
[724] | 237 | } |
---|
[1192] | 238 | CClientBuffer* buffer = buffers[rank] = new CClientBuffer(interComm, rank, mapBufferSize_[rank], maxEventSizes[rank], maxBufferedEvents); |
---|
[725] | 239 | // Notify the server |
---|
| 240 | CBufferOut* bufOut = buffer->getBuffer(sizeof(StdSize)); |
---|
| 241 | bufOut->put(mapBufferSize_[rank]); // Stupid C++ |
---|
| 242 | buffer->checkBuffer(); |
---|
[509] | 243 | } |
---|
[300] | 244 | |
---|
[512] | 245 | /*! |
---|
| 246 | Verify state of buffers. Buffer is under pending state if there is no message on it |
---|
| 247 | \return state of buffers, pending(true), ready(false) |
---|
| 248 | */ |
---|
[300] | 249 | bool CContextClient::checkBuffers(void) |
---|
| 250 | { |
---|
[595] | 251 | map<int,CClientBuffer*>::iterator itBuff; |
---|
| 252 | bool pending = false; |
---|
| 253 | for (itBuff = buffers.begin(); itBuff != buffers.end(); itBuff++) pending |= itBuff->second->checkBuffer(); |
---|
| 254 | return pending; |
---|
[509] | 255 | } |
---|
[300] | 256 | |
---|
[512] | 257 | //! Release all buffers |
---|
[300] | 258 | void CContextClient::releaseBuffers(void) |
---|
| 259 | { |
---|
[595] | 260 | map<int,CClientBuffer*>::iterator itBuff; |
---|
| 261 | for (itBuff = buffers.begin(); itBuff != buffers.end(); itBuff++) delete itBuff->second; |
---|
[509] | 262 | } |
---|
[300] | 263 | |
---|
[512] | 264 | /*! |
---|
| 265 | Verify state of buffers corresponding to a connection |
---|
| 266 | \param [in] ranks list rank of server to which client connects to |
---|
| 267 | \return state of buffers, pending(true), ready(false) |
---|
| 268 | */ |
---|
[300] | 269 | bool CContextClient::checkBuffers(list<int>& ranks) |
---|
| 270 | { |
---|
[595] | 271 | list<int>::iterator it; |
---|
| 272 | bool pending = false; |
---|
| 273 | for (it = ranks.begin(); it != ranks.end(); it++) pending |= buffers[*it]->checkBuffer(); |
---|
| 274 | return pending; |
---|
[509] | 275 | } |
---|
[300] | 276 | |
---|
[512] | 277 | /*! |
---|
[917] | 278 | * Set the buffer size for each connection. Warning: This function is collective. |
---|
| 279 | * |
---|
| 280 | * \param [in] mapSize maps the rank of the connected servers to the size of the correspoinding buffer |
---|
| 281 | * \param [in] maxEventSize maps the rank of the connected servers to the size of the biggest event |
---|
[512] | 282 | */ |
---|
[917] | 283 | void CContextClient::setBufferSize(const std::map<int,StdSize>& mapSize, const std::map<int,StdSize>& maxEventSize) |
---|
[509] | 284 | { |
---|
| 285 | mapBufferSize_ = mapSize; |
---|
[1192] | 286 | maxEventSizes = maxEventSize; |
---|
[917] | 287 | |
---|
| 288 | // Compute the maximum number of events that can be safely buffered. |
---|
| 289 | double minBufferSizeEventSizeRatio = std::numeric_limits<double>::max(); |
---|
| 290 | for (std::map<int,StdSize>::const_iterator it = mapSize.begin(), ite = mapSize.end(); it != ite; ++it) |
---|
| 291 | { |
---|
[1471] | 292 | double ratio = double(it->second) / maxEventSizes[it->first]; |
---|
[917] | 293 | if (ratio < minBufferSizeEventSizeRatio) minBufferSizeEventSizeRatio = ratio; |
---|
| 294 | } |
---|
| 295 | MPI_Allreduce(MPI_IN_PLACE, &minBufferSizeEventSizeRatio, 1, MPI_DOUBLE, MPI_MIN, intraComm); |
---|
| 296 | |
---|
| 297 | if (minBufferSizeEventSizeRatio < 1.0) |
---|
[1198] | 298 | { |
---|
[917] | 299 | ERROR("void CContextClient::setBufferSize(const std::map<int,StdSize>& mapSize, const std::map<int,StdSize>& maxEventSize)", |
---|
| 300 | << "The buffer sizes and the maximum events sizes are incoherent."); |
---|
[1198] | 301 | } |
---|
[1197] | 302 | else if (minBufferSizeEventSizeRatio == std::numeric_limits<double>::max()) |
---|
| 303 | minBufferSizeEventSizeRatio = 1.0; // In this case, maxBufferedEvents will never be used but we want to avoid any floating point exception |
---|
[917] | 304 | |
---|
| 305 | maxBufferedEvents = size_t(2 * minBufferSizeEventSizeRatio) // there is room for two local buffers on the server |
---|
| 306 | + size_t(minBufferSizeEventSizeRatio) // one local buffer can always be fully used |
---|
| 307 | + 1; // the other local buffer might contain only one event |
---|
[509] | 308 | } |
---|
| 309 | |
---|
[595] | 310 | /*! |
---|
| 311 | Get leading server in the group of connected server |
---|
| 312 | \return ranks of leading servers |
---|
| 313 | */ |
---|
[988] | 314 | const std::list<int>& CContextClient::getRanksServerNotLeader(void) const |
---|
| 315 | { |
---|
| 316 | return ranksServerNotLeader; |
---|
| 317 | } |
---|
| 318 | |
---|
| 319 | /*! |
---|
| 320 | Check if client connects to leading server |
---|
| 321 | \return connected(true), not connected (false) |
---|
| 322 | */ |
---|
| 323 | bool CContextClient::isServerNotLeader(void) const |
---|
| 324 | { |
---|
| 325 | return !ranksServerNotLeader.empty(); |
---|
| 326 | } |
---|
| 327 | |
---|
| 328 | /*! |
---|
| 329 | Get leading server in the group of connected server |
---|
| 330 | \return ranks of leading servers |
---|
| 331 | */ |
---|
[595] | 332 | const std::list<int>& CContextClient::getRanksServerLeader(void) const |
---|
| 333 | { |
---|
| 334 | return ranksServerLeader; |
---|
| 335 | } |
---|
[509] | 336 | |
---|
[595] | 337 | /*! |
---|
| 338 | Check if client connects to leading server |
---|
| 339 | \return connected(true), not connected (false) |
---|
| 340 | */ |
---|
| 341 | bool CContextClient::isServerLeader(void) const |
---|
| 342 | { |
---|
| 343 | return !ranksServerLeader.empty(); |
---|
| 344 | } |
---|
[300] | 345 | |
---|
[704] | 346 | /*! |
---|
| 347 | * Check if the attached mode is used. |
---|
| 348 | * |
---|
| 349 | * \return true if and only if attached mode is used |
---|
| 350 | */ |
---|
| 351 | bool CContextClient::isAttachedModeEnabled() const |
---|
| 352 | { |
---|
| 353 | return (parentServer != 0); |
---|
| 354 | } |
---|
[697] | 355 | |
---|
[512] | 356 | /*! |
---|
| 357 | Finalize context client and do some reports |
---|
| 358 | */ |
---|
[300] | 359 | void CContextClient::finalize(void) |
---|
| 360 | { |
---|
[595] | 361 | map<int,CClientBuffer*>::iterator itBuff; |
---|
[1033] | 362 | bool stop = false; |
---|
[731] | 363 | |
---|
[1033] | 364 | CTimer::get("Blocking time").resume(); |
---|
| 365 | while (hasTemporarilyBufferedEvent()) |
---|
| 366 | { |
---|
| 367 | checkBuffers(); |
---|
| 368 | sendTemporarilyBufferedEvent(); |
---|
| 369 | } |
---|
| 370 | CTimer::get("Blocking time").suspend(); |
---|
| 371 | |
---|
[595] | 372 | CEventClient event(CContext::GetType(), CContext::EVENT_ID_CONTEXT_FINALIZE); |
---|
[300] | 373 | if (isServerLeader()) |
---|
| 374 | { |
---|
[595] | 375 | CMessage msg; |
---|
| 376 | const std::list<int>& ranks = getRanksServerLeader(); |
---|
| 377 | for (std::list<int>::const_iterator itRank = ranks.begin(), itRankEnd = ranks.end(); itRank != itRankEnd; ++itRank) |
---|
| 378 | event.push(*itRank, 1, msg); |
---|
| 379 | sendEvent(event); |
---|
[300] | 380 | } |
---|
[595] | 381 | else sendEvent(event); |
---|
[509] | 382 | |
---|
[347] | 383 | CTimer::get("Blocking time").resume(); |
---|
[1033] | 384 | while (!stop) |
---|
[300] | 385 | { |
---|
[595] | 386 | checkBuffers(); |
---|
[1033] | 387 | if (hasTemporarilyBufferedEvent()) |
---|
| 388 | sendTemporarilyBufferedEvent(); |
---|
| 389 | |
---|
| 390 | stop = true; |
---|
| 391 | for (itBuff = buffers.begin(); itBuff != buffers.end(); itBuff++) stop &= !itBuff->second->hasPendingRequest(); |
---|
[300] | 392 | } |
---|
[347] | 393 | CTimer::get("Blocking time").suspend(); |
---|
[509] | 394 | |
---|
[595] | 395 | std::map<int,StdSize>::const_iterator itbMap = mapBufferSize_.begin(), |
---|
| 396 | iteMap = mapBufferSize_.end(), itMap; |
---|
[511] | 397 | StdSize totalBuf = 0; |
---|
| 398 | for (itMap = itbMap; itMap != iteMap; ++itMap) |
---|
| 399 | { |
---|
[595] | 400 | report(10) << " Memory report : Context <" << context->getId() << "> : client side : memory used for buffer of each connection to server" << endl |
---|
| 401 | << " +) To server with rank " << itMap->first << " : " << itMap->second << " bytes " << endl; |
---|
[511] | 402 | totalBuf += itMap->second; |
---|
| 403 | } |
---|
[595] | 404 | report(0) << " Memory report : Context <" << context->getId() << "> : client side : total memory used for buffer " << totalBuf << " bytes" << endl; |
---|
[511] | 405 | |
---|
[595] | 406 | releaseBuffers(); |
---|
[300] | 407 | } |
---|
[509] | 408 | } |
---|