/********************************************************************************
 * Copyright (C) 2016-2017 GSI Helmholtzzentrum fuer Schwerionenforschung GmbH  *
 *                                                                              *
 *              This software is distributed under the terms of the             *
 *              GNU Lesser General Public Licence (LGPL) version 3,             *
 *                  copied verbatim in the file "LICENSE"                       *
 ********************************************************************************/

#include "FairMQLogger.h"
#include "FairMQTransportFactorySHM.h"

// NOTE(review): the include targets below were not legible in the reviewed copy of this file;
// they are reconstructed from the names the code uses. Confirm against the build.
#include <fairmq/Tools.h>

#include <zmq.h>

#include <boost/version.hpp>
#include <boost/filesystem.hpp>
#include <boost/date_time/posix_time/posix_time.hpp>
#include <boost/interprocess/ipc/message_queue.hpp>
#include <boost/interprocess/sync/named_mutex.hpp>
#include <boost/interprocess/sync/scoped_lock.hpp>

#include <cerrno>
#include <chrono>
#include <stdexcept>
#include <string>
#include <thread>

#include <cstdlib> // std::system

using namespace std;
using namespace fair::mq::shmem;

namespace bfs = boost::filesystem;
namespace bpt = boost::posix_time;
namespace bipc = boost::interprocess;

FairMQ::Transport FairMQTransportFactorySHM::fTransportType = FairMQ::Transport::SHM;

/// Creates the ZeroMQ context, opens (or creates) the session's named mutex and shared memory
/// segment, registers this device in the segment's device counter and starts the heartbeat thread.
///
/// @param id     identifier forwarded to the FairMQTransportFactory base
/// @param config optional program options; when null, defaults are used for the number of
///               I/O threads (1), the session name ("default") and the segment size (2000000000)
/// @throws std::runtime_error if the shared memory resources cannot be initialized
///
/// Exits the process if the ZeroMQ context cannot be created.
// NOTE(review): template arguments in this file (GetValue<...>, make_unique<...>, find<...>,
// construct<...>, scoped_lock<...>) were not legible in the reviewed copy. named_mutex and
// MonitorStatus follow from other code in this file; Manager and DeviceCounter are assumed to be
// the fair::mq::shmem types behind fManager / fDeviceCounter — confirm against the header.
FairMQTransportFactorySHM::FairMQTransportFactorySHM(const string& id, const FairMQProgOptions* config)
    : FairMQTransportFactory(id)
    , fSessionName("default")
    , fContext(nullptr)
    , fHeartbeatThread()
    , fSendHeartbeats(true)
    , fShMutex(nullptr)
    , fDeviceCounter(nullptr)
    , fManager(nullptr)
{
    int major, minor, patch;
    zmq_version(&major, &minor, &patch);
    LOG(debug) << "Transport: Using ZeroMQ (" << major << "." << minor << "." << patch << ") & "
               << "boost::interprocess (" << (BOOST_VERSION / 100000) << "." << (BOOST_VERSION / 100 % 1000) << "." << (BOOST_VERSION % 100) << ")";

    fContext = zmq_ctx_new();
    if (!fContext)
    {
        LOG(error) << "failed creating context, reason: " << zmq_strerror(errno);
        exit(EXIT_FAILURE);
    }

    int numIoThreads = 1;
    size_t segmentSize = 2000000000;

    if (config)
    {
        numIoThreads = config->GetValue<int>("io-threads");
        fSessionName = config->GetValue<string>("session");
        segmentSize = config->GetValue<size_t>("shm-segment-size");
    }
    else
    {
        LOG(warn) << "FairMQProgOptions not available! Using defaults.";
    }

    fSessionName.resize(8, '_'); // shorten the session name, to accommodate for name size limit on some systems (MacOS)

    try
    {
        fShMutex = fair::mq::tools::make_unique<bipc::named_mutex>(bipc::open_or_create, std::string("fmq_shm_" + fSessionName + "_mutex").c_str());

        if (zmq_ctx_set(fContext, ZMQ_IO_THREADS, numIoThreads) != 0)
        {
            LOG(error) << "failed configuring context, reason: " << zmq_strerror(errno);
        }

        // Set the maximum number of allowed sockets on the context.
        if (zmq_ctx_set(fContext, ZMQ_MAX_SOCKETS, 10000) != 0)
        {
            LOG(error) << "failed configuring context, reason: " << zmq_strerror(errno);
        }

        fManager = fair::mq::tools::make_unique<Manager>(fSessionName, segmentSize);
        LOG(debug) << "created/opened shared memory segment '" << "fmq_shm_" << fSessionName << "_main" << "' of " << segmentSize << " bytes. Available are " << fManager->Segment().get_free_memory() << " bytes.";

        {
            // The device counter lives in the shared segment; updates are guarded by the named mutex.
            bipc::scoped_lock<bipc::named_mutex> lock(*fShMutex);

            fDeviceCounter = fManager->Segment().find<DeviceCounter>(bipc::unique_instance).first;

            if (fDeviceCounter)
            {
                LOG(debug) << "device counter found, with value of " << fDeviceCounter->fCount << ". incrementing.";
                (fDeviceCounter->fCount)++;
                LOG(debug) << "incremented device counter, now: " << fDeviceCounter->fCount;
            }
            else
            {
                LOG(debug) << "no device counter found, creating one and initializing with 1";
                fDeviceCounter = fManager->Segment().construct<DeviceCounter>(bipc::unique_instance)(1);
                LOG(debug) << "initialized device counter with: " << fDeviceCounter->fCount;
            }

            // start shm monitor
            // try
            // {
            //     MonitorStatus* monitorStatus = fManagementSegment.find<MonitorStatus>(bipc::unique_instance).first;
            //     if (monitorStatus == nullptr)
            //     {
            //         LOG(debug) << "no shmmonitor found, starting...";
            //         StartMonitor();
            //     }
            //     else
            //     {
            //         LOG(debug) << "found shmmonitor.";
            //     }
            // }
            // catch (std::exception& e)
            // {
            //     LOG(error) << "Exception during shmmonitor initialization: " << e.what() << ", application will now exit";
            //     exit(EXIT_FAILURE);
            // }
        }
    }
    catch (const bipc::interprocess_exception& e)
    {
        LOG(error) << "Could not initialize shared memory transport: " << e.what();

        // The destructor does not run when the constructor throws, so release the context here.
        // No sockets have been created on it yet, so termination does not wait on anything.
        if (zmq_ctx_term(fContext) != 0)
        {
            LOG(error) << "failed closing context, reason: " << zmq_strerror(errno);
        }
        fContext = nullptr;

        throw runtime_error(string("Could not initialize shared memory transport: ") + e.what());
    }

    fSendHeartbeats = true;
    fHeartbeatThread = thread(&FairMQTransportFactorySHM::SendHeartbeats, this);
}

/// Launches the external `shmmonitor` process in the background and polls the management segment
/// every 10 ms until the monitor's MonitorStatus object appears. Exits the process if the monitor
/// does not show up after more than 100 polls.
void FairMQTransportFactorySHM::StartMonitor()
{
    int numTries = 0;

    // NOTE(review): this tests for a file named "shmmonitor" relative to the current working
    // directory, while the message below refers to PATH — confirm which is intended.
    if (!bfs::exists(bfs::path("shmmonitor")))
    {
        LOG(error) << "Could not find shmmonitor. Is it in the PATH? Monitor not started";
        return;
    }

    // TODO: replace with Boost.Process once boost 1.64 is available
    int r = system("shmmonitor --self-destruct &");
    LOG(debug) << r;

    while (true)
    {
        MonitorStatus* monitorStatus = fManager->ManagementSegment().find<MonitorStatus>(bipc::unique_instance).first;
        if (monitorStatus)
        {
            LOG(debug) << "shmmonitor started";
            break;
        }

        this_thread::sleep_for(std::chrono::milliseconds(10));
        if (++numTries > 100)
        {
            LOG(error) << "Did not get response from shmmonitor after " << 10 * 100 << " milliseconds. Exiting.";
            exit(EXIT_FAILURE);
        }
    }
}

/// Heartbeat thread body: while fSendHeartbeats is set, opens the session's control queue and
/// sends a single `true` flag with a 100 ms send deadline, then sleeps 100 ms. If the queue
/// cannot be opened or used (interprocess_exception), waits 500 ms before trying again.
void FairMQTransportFactorySHM::SendHeartbeats()
{
    string controlQueueName("fmq_shm_" + fSessionName + "_control_queue");

    while (fSendHeartbeats)
    {
        try
        {
            bipc::message_queue mq(bipc::open_only, controlQueueName.c_str());
            bool heartbeat = true;
            bpt::ptime sndTill = bpt::microsec_clock::universal_time() + bpt::milliseconds(100);

            if (mq.timed_send(&heartbeat, sizeof(heartbeat), 0, sndTill))
            {
                this_thread::sleep_for(chrono::milliseconds(100));
            }
            else
            {
                LOG(debug) << "control queue timeout";
            }
        }
        catch (const bipc::interprocess_exception&)
        {
            this_thread::sleep_for(chrono::milliseconds(500));
            // LOG(warn) << "no " << controlQueueName << " found";
        }
    }
}

// NOTE(review): the factory methods below construct their result through the declared return
// alias (FairMQMessagePtr etc.); the explicit unique_ptr template argument was not legible in
// the reviewed copy.

/// Creates an empty shared memory message.
FairMQMessagePtr FairMQTransportFactorySHM::CreateMessage() const
{
    return FairMQMessagePtr(new FairMQMessageSHM(*fManager));
}

/// Creates a shared memory message of the given size.
FairMQMessagePtr FairMQTransportFactorySHM::CreateMessage(const size_t size) const
{
    return FairMQMessagePtr(new FairMQMessageSHM(*fManager, size));
}

/// Creates a shared memory message from a user buffer; `ffn` and `hint` are forwarded to the message.
FairMQMessagePtr FairMQTransportFactorySHM::CreateMessage(void* data, const size_t size, fairmq_free_fn* ffn, void* hint) const
{
    return FairMQMessagePtr(new FairMQMessageSHM(*fManager, data, size, ffn, hint));
}

/// Creates a shared memory message referring to `data` within the given unmanaged region.
FairMQMessagePtr FairMQTransportFactorySHM::CreateMessage(FairMQUnmanagedRegionPtr& region, void* data, const size_t size, void* hint) const
{
    return FairMQMessagePtr(new FairMQMessageSHM(*fManager, region, data, size, hint));
}

/// Creates a socket of the given type and name on this factory's ZeroMQ context.
FairMQSocketPtr FairMQTransportFactorySHM::CreateSocket(const string& type, const string& name) const
{
    assert(fContext);
    return FairMQSocketPtr(new FairMQSocketSHM(*fManager, type, name, GetId(), fContext));
}

// NOTE(review): the element types of the container parameters in the three CreatePoller overloads
// below were not legible in the reviewed copy; they must match the declarations in the header.

/// Creates a poller over the given channels.
FairMQPollerPtr FairMQTransportFactorySHM::CreatePoller(const vector<FairMQChannel>& channels) const
{
    return FairMQPollerPtr(new FairMQPollerSHM(channels));
}

/// Creates a poller over the given channel pointers.
FairMQPollerPtr FairMQTransportFactorySHM::CreatePoller(const std::vector<const FairMQChannel*>& channels) const
{
    return FairMQPollerPtr(new FairMQPollerSHM(channels));
}

/// Creates a poller from a channel map and a list of channel names.
FairMQPollerPtr FairMQTransportFactorySHM::CreatePoller(const unordered_map<string, vector<FairMQChannel>>& channelsMap, const vector<string>& channelList) const
{
    return FairMQPollerPtr(new FairMQPollerSHM(channelsMap, channelList));
}

/// Creates a poller over a command socket and a data socket.
FairMQPollerPtr FairMQTransportFactorySHM::CreatePoller(const FairMQSocket& cmdSocket, const FairMQSocket& dataSocket) const
{
    return FairMQPollerPtr(new FairMQPollerSHM(cmdSocket, dataSocket));
}

/// Creates an unmanaged shared memory region of the given size with the given callback.
FairMQUnmanagedRegionPtr FairMQTransportFactorySHM::CreateUnmanagedRegion(const size_t size, FairMQRegionCallback callback) const
{
    return FairMQUnmanagedRegionPtr(new FairMQUnmanagedRegionSHM(*fManager, size, callback));
}

/// Stops the heartbeat thread, terminates the ZeroMQ context and unregisters this device from the
/// shared device counter. The last device to leave removes the segment and the named mutex.
FairMQTransportFactorySHM::~FairMQTransportFactorySHM()
{
    fSendHeartbeats = false;
    if (fHeartbeatThread.joinable())
    {
        fHeartbeatThread.join();
    }

    if (fContext)
    {
        // zmq_ctx_term may be interrupted by a signal, in which case it can simply be restarted.
        // Any other failure is logged; either way the shared memory cleanup below must still run,
        // otherwise the device counter never reaches zero and the segment is never removed.
        while (zmq_ctx_term(fContext) != 0)
        {
            if (errno == EINTR)
            {
                LOG(debug) << "closing context interrupted by a signal, retrying";
                continue;
            }

            LOG(error) << "failed closing context, reason: " << zmq_strerror(errno);
            break;
        }
        fContext = nullptr;
    }
    else
    {
        LOG(error) << "context not available for shutdown";
    }

    bool lastRemoved = false;

    { // mutex scope
        bipc::scoped_lock<bipc::named_mutex> lock(*fShMutex);

        (fDeviceCounter->fCount)--;

        if (fDeviceCounter->fCount == 0)
        {
            LOG(debug) << "last segment user, removing segment.";
            fManager->RemoveSegment();
            lastRemoved = true;
        }
        else
        {
            LOG(debug) << "other segment users present (" << fDeviceCounter->fCount << "), not removing it.";
        }
    }

    // The mutex itself can only be removed after the lock on it has been released.
    if (lastRemoved)
    {
        boost::interprocess::named_mutex::remove(std::string("fmq_shm_" + fSessionName + "_mutex").c_str());
    }
}

/// Returns the transport type of this factory (FairMQ::Transport::SHM).
FairMQ::Transport FairMQTransportFactorySHM::GetType() const
{
    return fTransportType;
}