source: XIOS/dev/dev_olga/src/context_client.cpp @ 1139

Last change on this file since 1139 was 1139, checked in by oabramkina, 7 years ago

Fixing a bug in context finalization. Now context finalization is done in two stages.
Tested on Cure with test_regular and test_xios2_cmip6.

  • Property copyright set to
    Software name : XIOS (Xml I/O Server)
    http://forge.ipsl.jussieu.fr/ioserver
    Creation date : January 2009
    Licence : CeCILL version2
    see license file in root directory : Licence_CeCILL_V2-en.txt
    or http://www.cecill.info/licences/Licence_CeCILL_V2-en.html
    Holder : CEA/LSCE (Laboratoire des Sciences du CLimat et de l'Environnement)
    CNRS/IPSL (Institut Pierre Simon Laplace)
    Project Manager : Yann Meurdesoif
    yann.meurdesoif@cea.fr
  • Property svn:eol-style set to native
File size: 15.1 KB
RevLine 
[591]1#include "xios_spl.hpp"
[300]2#include "context_client.hpp"
3#include "context_server.hpp"
4#include "event_client.hpp"
5#include "buffer_out.hpp"
6#include "buffer_client.hpp"
7#include "type.hpp"
8#include "event_client.hpp"
9#include "context.hpp"
[382]10#include "mpi.hpp"
[347]11#include "timer.hpp"
[401]12#include "cxios.hpp"
[1130]13#include "server.hpp"
[300]14
[335]15namespace xios
[300]16{
[512]17    /*!
18    \param [in] parent Pointer to context on client side
19    \param [in] intraComm_ communicator of group client
20    \param [in] interComm_ communicator of group server
[983]21    \cxtSer [in] cxtSer Pointer to context of server side. (It is only used in case of attached mode).
[512]22    */
[595]23    CContextClient::CContextClient(CContext* parent, MPI_Comm intraComm_, MPI_Comm interComm_, CContext* cxtSer)
[917]24     : mapBufferSize_(), parentServer(cxtSer), maxBufferedEvents(4)
[300]25    {
[595]26      context = parent;
27      intraComm = intraComm_;
28      interComm = interComm_;
29      MPI_Comm_rank(intraComm, &clientRank);
30      MPI_Comm_size(intraComm, &clientSize);
[509]31
[595]32      int flag;
33      MPI_Comm_test_inter(interComm, &flag);
34      if (flag) MPI_Comm_remote_size(interComm, &serverSize);
35      else  MPI_Comm_size(interComm, &serverSize);
[509]36
[595]37      if (clientSize < serverSize)
38      {
39        int serverByClient = serverSize / clientSize;
40        int remain = serverSize % clientSize;
41        int rankStart = serverByClient * clientRank;
[300]42
[595]43        if (clientRank < remain)
44        {
45          serverByClient++;
46          rankStart += clientRank;
47        }
48        else
49          rankStart += remain;
50
51        for (int i = 0; i < serverByClient; i++)
52          ranksServerLeader.push_back(rankStart + i);
[1021]53
54        ranksServerNotLeader.resize(0);      }
[595]55      else
56      {
57        int clientByServer = clientSize / serverSize;
58        int remain = clientSize % serverSize;
59
60        if (clientRank < (clientByServer + 1) * remain)
61        {
62          if (clientRank % (clientByServer + 1) == 0)
63            ranksServerLeader.push_back(clientRank / (clientByServer + 1));
[1021]64          else
65            ranksServerNotLeader.push_back(clientRank / (clientByServer + 1));
[595]66        }
67        else
68        {
69          int rank = clientRank - (clientByServer + 1) * remain;
70          if (rank % clientByServer == 0)
71            ranksServerLeader.push_back(remain + rank / clientByServer);
[1021]72          else
73            ranksServerNotLeader.push_back(remain + rank / clientByServer);
[595]74        }
75      }
76
77      timeLine = 0;
[300]78    }
79
[512]80    /*!
81    In case of attached mode, the current context must be reset to context for client
82    \param [in] event Event sent to server
83    */
[300]84    void CContextClient::sendEvent(CEventClient& event)
85    {
[731]86      list<int> ranks = event.getRanks();
[1054]87
[595]88      if (!event.isEmpty())
[300]89      {
[731]90        list<int> sizes = event.getSizes();
[300]91
[1130]92        // We force the getBuffers call to be non-blocking on classical servers
[1054]93        list<CBufferOut*> buffList;
[1130]94        bool couldBuffer = getBuffers(ranks, sizes, buffList, (!CXios::isClient && (CServer::serverLevel == 0) ));
95        //bool couldBuffer = getBuffers(ranks, sizes, buffList, false );
[509]96
[1054]97        if (couldBuffer)
98        {
99          event.send(timeLine, sizes, buffList);
[731]100
[1054]101          checkBuffers(ranks);
102
103          if (isAttachedModeEnabled()) // couldBuffer is always true in attached mode
104          {
105            waitEvent(ranks);
106            CContext::setCurrent(context->getId());
107          }
108        }
109        else
110        {
111          tmpBufferedEvent.ranks = ranks;
112          tmpBufferedEvent.sizes = sizes;
113
114          for (list<int>::const_iterator it = sizes.begin(); it != sizes.end(); it++)
115            tmpBufferedEvent.buffers.push_back(new CBufferOut(*it));
116
117          event.send(timeLine, tmpBufferedEvent.sizes, tmpBufferedEvent.buffers);
118        }
[300]119      }
120
[1054]121      timeLine++;
122    }
123
124    /*!
125     * Send the temporarily buffered event (if any).
126     *
127     * \return true if a temporarily buffered event could be sent, false otherwise
128     */
129    bool CContextClient::sendTemporarilyBufferedEvent()
130    {
131      bool couldSendTmpBufferedEvent = false;
132
133      if (hasTemporarilyBufferedEvent())
[511]134      {
[1054]135        list<CBufferOut*> buffList;
136        if (getBuffers(tmpBufferedEvent.ranks, tmpBufferedEvent.sizes, buffList, true)) // Non-blocking call
137        {
138          list<CBufferOut*>::iterator it, itBuffer;
139
140          for (it = tmpBufferedEvent.buffers.begin(), itBuffer = buffList.begin(); it != tmpBufferedEvent.buffers.end(); it++, itBuffer++)
141            (*itBuffer)->put((char*)(*it)->start(), (*it)->count());
142
143          checkBuffers(tmpBufferedEvent.ranks);
144
145          tmpBufferedEvent.clear();
146
147          couldSendTmpBufferedEvent = true;
148        }
[511]149      }
150
[1054]151      return couldSendTmpBufferedEvent;
[300]152    }
[509]153
[512]154    /*!
155    If client is also server (attached mode), after sending event, it should process right away
156    the incoming event.
157    \param [in] ranks list rank of server connected this client
158    */
[300]159    void CContextClient::waitEvent(list<int>& ranks)
160    {
[595]161      parentServer->server->setPendingEvent();
162      while (checkBuffers(ranks))
[300]163      {
[595]164        parentServer->server->listen();
165        parentServer->server->checkPendingRequest();
[300]166      }
[386]167
[595]168      while (parentServer->server->hasPendingEvent())
[386]169      {
[595]170       parentServer->server->eventLoop();
[386]171      }
[300]172    }
173
[1054]174
[512]175    /*!
[1054]176     * Get buffers for each connection to the servers. This function blocks until there is enough room in the buffers unless
177     * it is explicitly requested to be non-blocking.
178     *
179     * \param [in] serverList list of rank of connected server
180     * \param [in] sizeList size of message corresponding to each connection
181     * \param [out] retBuffers list of buffers that can be used to store an event
182     * \param [in] nonBlocking whether this function should be non-blocking
183     * \return whether the already allocated buffers could be used
[512]184    */
[1071]185    bool CContextClient::getBuffers(const list<int>& serverList, const list<int>& sizeList, list<CBufferOut*>& retBuffers,
186                                    bool nonBlocking /*= false*/)
[300]187    {
[1054]188      list<int>::const_iterator itServer, itSize;
[595]189      list<CClientBuffer*> bufferList;
[1054]190      map<int,CClientBuffer*>::const_iterator it;
[595]191      list<CClientBuffer*>::iterator itBuffer;
[884]192      bool areBuffersFree;
[300]193
[595]194      for (itServer = serverList.begin(); itServer != serverList.end(); itServer++)
[300]195      {
[595]196        it = buffers.find(*itServer);
197        if (it == buffers.end())
[300]198        {
[595]199          newBuffer(*itServer);
200          it = buffers.find(*itServer);
[509]201        }
[595]202        bufferList.push_back(it->second);
[300]203      }
[347]204
205      CTimer::get("Blocking time").resume();
[884]206      do
[300]207      {
[884]208        areBuffersFree = true;
[595]209        for (itBuffer = bufferList.begin(), itSize = sizeList.begin(); itBuffer != bufferList.end(); itBuffer++, itSize++)
[884]210          areBuffersFree &= (*itBuffer)->isBufferFree(*itSize);
211
212        if (!areBuffersFree)
[300]213        {
[884]214          checkBuffers();
[1130]215          if (CServer::serverLevel == 0)
216            context->server->listen();
[1071]217
[1130]218          else if (CServer::serverLevel == 1)
219          {
220            context->server->listen();
221            for (int i = 0; i < context->serverPrimServer.size(); ++i)
222              context->serverPrimServer[i]->listen();
223          }
224
225          else if (CServer::serverLevel == 2)
226            context->server->listen();
227
[300]228        }
[1054]229      } while (!areBuffersFree && !nonBlocking);
[1130]230
[347]231      CTimer::get("Blocking time").suspend();
232
[1054]233      if (areBuffersFree)
[300]234      {
[1054]235        for (itBuffer = bufferList.begin(), itSize = sizeList.begin(); itBuffer != bufferList.end(); itBuffer++, itSize++)
236          retBuffers.push_back((*itBuffer)->getBuffer(*itSize));
[300]237      }
[1054]238
239      return areBuffersFree;
[300]240   }
[509]241
[512]242   /*!
243   Make a new buffer for a certain connection to server with specific rank
244   \param [in] rank rank of connected server
245   */
[300]246   void CContextClient::newBuffer(int rank)
247   {
[1071]248     if (!mapBufferSize_.count(rank))
249     {
250       error(0) << "WARNING: Unexpected request for buffer to communicate with server " << rank << std::endl;
251       mapBufferSize_[rank] = CXios::minBufferSize;
252     }
253     CClientBuffer* buffer = buffers[rank] = new CClientBuffer(interComm, rank, mapBufferSize_[rank], maxBufferedEvents);
254     // Notify the server
255     CBufferOut* bufOut = buffer->getBuffer(sizeof(StdSize));
256     bufOut->put(mapBufferSize_[rank]); // Stupid C++
257     buffer->checkBuffer();
[509]258   }
[300]259
[512]260   /*!
261   Verify state of buffers. Buffer is under pending state if there is no message on it
262   \return state of buffers, pending(true), ready(false)
263   */
[300]264   bool CContextClient::checkBuffers(void)
265   {
[595]266      map<int,CClientBuffer*>::iterator itBuff;
267      bool pending = false;
[1130]268      for (itBuff = buffers.begin(); itBuff != buffers.end(); itBuff++)
269        pending |= itBuff->second->checkBuffer();
[595]270      return pending;
[509]271   }
[300]272
[512]273   //! Release all buffers
[1071]274   void CContextClient::releaseBuffers()
[300]275   {
[595]276      map<int,CClientBuffer*>::iterator itBuff;
[1077]277      for (itBuff = buffers.begin(); itBuff != buffers.end(); itBuff++)
[1139]278      {
[1077]279          delete itBuff->second;
[1139]280      }
[1077]281      buffers.clear();
[509]282   }
[300]283
[512]284   /*!
285   Verify state of buffers corresponding to a connection
286   \param [in] ranks list rank of server to which client connects to
287   \return state of buffers, pending(true), ready(false)
288   */
[300]289   bool CContextClient::checkBuffers(list<int>& ranks)
290   {
[595]291      list<int>::iterator it;
292      bool pending = false;
293      for (it = ranks.begin(); it != ranks.end(); it++) pending |= buffers[*it]->checkBuffer();
294      return pending;
[509]295   }
[300]296
[512]297   /*!
[917]298    * Set the buffer size for each connection. Warning: This function is collective.
299    *
300    * \param [in] mapSize maps the rank of the connected servers to the size of the correspoinding buffer
301    * \param [in] maxEventSize maps the rank of the connected servers to the size of the biggest event
[512]302   */
[917]303   void CContextClient::setBufferSize(const std::map<int,StdSize>& mapSize, const std::map<int,StdSize>& maxEventSize)
[509]304   {
305     mapBufferSize_ = mapSize;
[917]306
307     // Compute the maximum number of events that can be safely buffered.
308     double minBufferSizeEventSizeRatio = std::numeric_limits<double>::max();
309     for (std::map<int,StdSize>::const_iterator it = mapSize.begin(), ite = mapSize.end(); it != ite; ++it)
310     {
311       double ratio = double(it->second) / maxEventSize.at(it->first);
312       if (ratio < minBufferSizeEventSizeRatio) minBufferSizeEventSizeRatio = ratio;
313     }
314     MPI_Allreduce(MPI_IN_PLACE, &minBufferSizeEventSizeRatio, 1, MPI_DOUBLE, MPI_MIN, intraComm);
315
316     if (minBufferSizeEventSizeRatio < 1.0)
317       ERROR("void CContextClient::setBufferSize(const std::map<int,StdSize>& mapSize, const std::map<int,StdSize>& maxEventSize)",
318             << "The buffer sizes and the maximum events sizes are incoherent.");
319
320     maxBufferedEvents = size_t(2 * minBufferSizeEventSizeRatio) // there is room for two local buffers on the server
321                          + size_t(minBufferSizeEventSizeRatio)  // one local buffer can always be fully used
322                          + 1;                                   // the other local buffer might contain only one event
[509]323   }
324
[1021]325   /*!
326    Get leading server in the group of connected server
327    \return ranks of leading servers
328    */
329    const std::list<int>& CContextClient::getRanksServerNotLeader(void) const
330    {
331      return ranksServerNotLeader;
332    }
333
334    /*!
335    Check if client connects to leading server
336    \return connected(true), not connected (false)
337    */
338    bool CContextClient::isServerNotLeader(void) const
339    {
340      return !ranksServerNotLeader.empty();
341    }
342
[595]343  /*!
344  Get leading server in the group of connected server
345  \return ranks of leading servers
346  */
347  const std::list<int>& CContextClient::getRanksServerLeader(void) const
348  {
349    return ranksServerLeader;
350  }
[509]351
[595]352  /*!
353  Check if client connects to leading server
354  \return connected(true), not connected (false)
355  */
356  bool CContextClient::isServerLeader(void) const
357  {
358    return !ranksServerLeader.empty();
359  }
[300]360
[704]361  /*!
362   * Check if the attached mode is used.
363   *
364   * \return true if and only if attached mode is used
365   */
366  bool CContextClient::isAttachedModeEnabled() const
367  {
368    return (parentServer != 0);
369  }
[697]370
[512]371   /*!
[1130]372   * Finalize context client and do some reports. Function is non-blocking.
[512]373   */
[1130]374  void CContextClient::finalize(void)
[1054]375  {
376    map<int,CClientBuffer*>::iterator itBuff;
377    bool stop = false;
[731]378
[1054]379    CTimer::get("Blocking time").resume();
380    while (hasTemporarilyBufferedEvent())
381    {
382      checkBuffers();
383      sendTemporarilyBufferedEvent();
384    }
385    CTimer::get("Blocking time").suspend();
[509]386
[1054]387    CEventClient event(CContext::GetType(), CContext::EVENT_ID_CONTEXT_FINALIZE);
388    if (isServerLeader())
389    {
390      CMessage msg;
391      const std::list<int>& ranks = getRanksServerLeader();
392      for (std::list<int>::const_iterator itRank = ranks.begin(), itRankEnd = ranks.end(); itRank != itRankEnd; ++itRank)
393        event.push(*itRank, 1, msg);
394      sendEvent(event);
395    }
396    else sendEvent(event);
[509]397
[1054]398    CTimer::get("Blocking time").resume();
[1130]399//    while (!stop)
[1054]400    {
401      checkBuffers();
402      if (hasTemporarilyBufferedEvent())
403        sendTemporarilyBufferedEvent();
[511]404
[1054]405      stop = true;
[1130]406//      for (itBuff = buffers.begin(); itBuff != buffers.end(); itBuff++) stop &= !itBuff->second->hasPendingRequest();
[1054]407    }
408    CTimer::get("Blocking time").suspend();
409
410    std::map<int,StdSize>::const_iterator itbMap = mapBufferSize_.begin(),
411                                          iteMap = mapBufferSize_.end(), itMap;
[1071]412
[1054]413    StdSize totalBuf = 0;
414    for (itMap = itbMap; itMap != iteMap; ++itMap)
415    {
416      report(10) << " Memory report : Context <" << context->getId() << "> : client side : memory used for buffer of each connection to server" << endl
417                 << "  +) To server with rank " << itMap->first << " : " << itMap->second << " bytes " << endl;
418      totalBuf += itMap->second;
419    }
420    report(0) << " Memory report : Context <" << context->getId() << "> : client side : total memory used for buffer " << totalBuf << " bytes" << endl;
421
[1130]422    //releaseBuffers(); // moved to CContext::finalize()
[1054]423  }
[1130]424
425  /*!
[1139]426  * Finalize context client and do some reports. Function is non-blocking.
[1130]427  */
[1139]428 void CContextClient::postFinalize(void)
429 {
430   map<int,CClientBuffer*>::iterator itBuff;
431   bool stop = false;
432
433   CTimer::get("Blocking time").resume();
434   while (hasTemporarilyBufferedEvent())
435   {
436     checkBuffers();
437     sendTemporarilyBufferedEvent();
438   }
439   CTimer::get("Blocking time").suspend();
440
441   CEventClient event(CContext::GetType(), CContext::EVENT_ID_CONTEXT_POST_FINALIZE);
442   if (isServerLeader())
443   {
444     CMessage msg;
445     const std::list<int>& ranks = getRanksServerLeader();
446     for (std::list<int>::const_iterator itRank = ranks.begin(), itRankEnd = ranks.end(); itRank != itRankEnd; ++itRank)
447       event.push(*itRank, 1, msg);
448     sendEvent(event);
449   }
450   else sendEvent(event);
451
452   CTimer::get("Blocking time").resume();
453//    while (!stop)
454   {
455     checkBuffers();
456     if (hasTemporarilyBufferedEvent())
457       sendTemporarilyBufferedEvent();
458
459     stop = true;
460   }
461   CTimer::get("Blocking time").suspend();
462
463 }
464
465  /*!
466  */
[1130]467  bool CContextClient::havePendingRequests(void)
468  {
469    bool pending = false;
470    map<int,CClientBuffer*>::iterator itBuff;
471    for (itBuff = buffers.begin(); itBuff != buffers.end(); itBuff++)
472      pending |= itBuff->second->hasPendingRequest();
473    return pending;
474  }
475
476
[509]477}
Note: See TracBrowser for help on using the repository browser.