From c92181c6b28c4749d9fdcc3ecfa096fdb41c7989 Mon Sep 17 00:00:00 2001 From: Richard Chapman Date: Wed, 2 Oct 2024 13:43:45 +0100 Subject: [PATCH 1/3] HPCC-32781 RoxieSocketQueueManager::run may be blocked by actCrit Avoid need to obtain critsec just to check if a worker thread's packet matches Signed-off-by: Richard Chapman --- roxie/ccd/ccd.hpp | 3 +- roxie/ccd/ccdqueue.cpp | 76 ++++++++++++++++++----------------------- roxie/udplib/udplib.hpp | 3 +- 3 files changed, 38 insertions(+), 44 deletions(-) diff --git a/roxie/ccd/ccd.hpp b/roxie/ccd/ccd.hpp index 53a6c53e338..a8e2252b7e5 100644 --- a/roxie/ccd/ccd.hpp +++ b/roxie/ccd/ccd.hpp @@ -159,7 +159,7 @@ class RoxiePacketHeader unsigned activityId = 0; // identifies the helper factory to be used (activityId in graph) hash64_t queryHash = 0; // identifies the query - ruid_t uid = 0; // unique id + std::atomic uid = 0; // unique id ServerIdentifier serverId; #ifdef SUBCHANNELS_IN_HEADER ServerIdentifier subChannels[MAX_SUBCHANNEL]; @@ -173,6 +173,7 @@ class RoxiePacketHeader static unsigned getSubChannelMask(unsigned subChannel); unsigned priorityHash() const; + void clear(); void copy(const RoxiePacketHeader &oh); bool matchPacket(const RoxiePacketHeader &oh) const; void init(const RemoteActivityId &_remoteId, ruid_t _uid, unsigned _channel, unsigned _overflowSequence); diff --git a/roxie/ccd/ccdqueue.cpp b/roxie/ccd/ccdqueue.cpp index 5d9b47ea209..669c6530180 100644 --- a/roxie/ccd/ccdqueue.cpp +++ b/roxie/ccd/ccdqueue.cpp @@ -56,7 +56,7 @@ RoxiePacketHeader::RoxiePacketHeader(const RoxiePacketHeader &source, unsigned _ { // Used to create the header to send a callback to originating server or an IBYTI to a buddy activityId = _activityId; - uid = source.uid; + uid.store(source.uid); queryHash = source.queryHash; channel = source.channel; overflowSequence = source.overflowSequence; @@ -88,15 +88,21 @@ unsigned RoxiePacketHeader::priorityHash() const void RoxiePacketHeader::copy(const RoxiePacketHeader &oh) { - // used for saving away kill packets for later matching by match - uid = oh.uid; + // used for saving away info for later matching by match, without having to lock overflowSequence = oh.overflowSequence; continueSequence = oh.continueSequence; serverId = oh.serverId; channel = oh.channel; + uid.store(oh.uid); // MORE - would it be safer, maybe even faster to copy the rest too? } +void RoxiePacketHeader::clear() +{ + // used for saving away kill packets for later matching by match + uid = RUID_NONE; // Will never match a queued packet +} + bool RoxiePacketHeader::matchPacket(const RoxiePacketHeader &oh) const { // used when matching up a kill packet against a pending one... @@ -156,7 +162,7 @@ StringBuffer &RoxiePacketHeader::toString(StringBuffer &ret) const ret.appendf(" (fetch part)"); break; } - ret.appendf(" uid=" RUIDF " pri=", uid); + ret.appendf(" uid=" RUIDF " pri=", uid.load()); switch(activityId & ROXIE_PRIORITY_MASK) { case ROXIE_SLA_PRIORITY: ret.append("SLA"); break; @@ -1192,7 +1198,6 @@ class RoxieQueue : public CInterface, implements IThreadFactory virtual IPooledThread *createNew(); - void abortChannel(unsigned channel); void start() { @@ -1389,6 +1394,7 @@ class CRoxieWorker : public CInterface, implements IPooledThread Owned topology; #endif AgentContextLogger logctx; + RoxiePacketHeader packetHeader; public: IMPLEMENT_IINTERFACE; @@ -1417,41 +1423,40 @@ class CRoxieWorker : public CInterface, implements IPooledThread } inline void setActivity(IRoxieAgentActivity *act) { - //Ensure that the activity is released outside of the critical section Owned temp(act); { CriticalBlock b(actCrit); activity.swap(temp); } } - inline bool match(RoxiePacketHeader &h) + inline void setPacket(IRoxieQueryPacket *p) { - // There is a window between getting packet from queue and being able to match it. - // This could cause some deduping to fail, but it does not matter if it does (so long as it is rare!) CriticalBlock b(actCrit); - return packet && packet->queryHeader().matchPacket(h); - } - - void abortChannel(unsigned channel) - { - CriticalBlock b(actCrit); - if (packet && packet->queryHeader().channel==channel) + if (p) { - abortLaunch = true; -#ifndef NEW_IBYTI - if (doIbytiDelay) - ibytiSem.signal(); -#endif - if (activity) - activity->abort(); + packet.setown(p); + packetHeader.copy(p->queryHeader()); } + else + { + packetHeader.clear(); + packet.setown(p); + } + } + inline bool match(RoxiePacketHeader &h) + { + // There is a window between getting packet from queue and being able to match it. + // This could cause some deduping to fail, but it does not matter if it does (so long as it is rare!) + return packetHeader.matchPacket(h); } bool checkAbort(RoxiePacketHeader &h, bool checkRank, bool &queryFound, bool &preActivity) { - CriticalBlock b(actCrit); - if (packet && packet->queryHeader().matchPacket(h)) + if (packetHeader.matchPacket(h)) { + CriticalBlock b(actCrit); + if (!packetHeader.matchPacket(h)) + return false; queryFound = true; abortLaunch = true; #ifndef NEW_IBYTI @@ -1772,7 +1777,7 @@ class CRoxieWorker : public CInterface, implements IPooledThread #ifdef NEW_IBYTI logctx.setStatistic(StTimeIBYTIDelay, next->queryIBYTIDelayTime()); #endif - packet.setown(next->deserialize()); + setPacket(next->deserialize()); next.clear(); RoxiePacketHeader &header = packet->queryHeader(); #ifndef SUBCHANNELS_IN_HEADER @@ -1804,8 +1809,7 @@ class CRoxieWorker : public CInterface, implements IPooledThread } workerThreadBusy = false; { - CriticalBlock b(actCrit); - packet.clear(); + setPacket(nullptr); #ifndef SUBCHANNELS_IN_HEADER topology.clear(); #endif @@ -1815,12 +1819,11 @@ class CRoxieWorker : public CInterface, implements IPooledThread } catch(IException *E) { - CriticalBlock b(actCrit); EXCLOG(E); if (packet) { throwRemoteException(E, NULL, packet, false); - packet.clear(); + setPacket(nullptr); } else E->Release(); @@ -1830,13 +1833,12 @@ class CRoxieWorker : public CInterface, implements IPooledThread } catch(...) { - CriticalBlock b(actCrit); Owned E = MakeStringException(ROXIE_INTERNAL_ERROR, "Unexpected exception in Roxie worker thread"); EXCLOG(E); if (packet) { throwRemoteException(E.getClear(), NULL, packet, false); - packet.clear(); + setPacket(nullptr); } #ifndef SUBCHANNELS_IN_HEADER topology.clear(); @@ -1851,16 +1853,6 @@ IPooledThread *RoxieQueue::createNew() return new CRoxieWorker; } -void RoxieQueue::abortChannel(unsigned channel) -{ - Owned wi = workers->running(); - ForEach(*wi) - { - CRoxieWorker &w = (CRoxieWorker &) wi->query(); - w.abortChannel(channel); - } -} - //================================================================================= class CallbackEntry : implements IPendingCallback, public CInterface diff --git a/roxie/udplib/udplib.hpp b/roxie/udplib/udplib.hpp index 89190424dd2..ebd674376df 100644 --- a/roxie/udplib/udplib.hpp +++ b/roxie/udplib/udplib.hpp @@ -33,7 +33,8 @@ typedef unsigned ruid_t; // at 1000/sec recycle every 49 days #define RUIDF "0x%.8x" #define RUID_PING 0 #define RUID_DISCARD 1 -#define RUID_FIRST 2 +#define RUID_NONE 2 +#define RUID_FIRST 3 typedef unsigned RecordLengthType; #define MAX_RECORD_LENGTH 0xffffffff From bf856dd879c7b4e777b391e81204886ae607ca4f Mon Sep 17 00:00:00 2001 From: Richard Chapman Date: Wed, 2 Oct 2024 14:47:29 +0100 Subject: [PATCH 2/3] HPCC-32783 Add option to avoid too many workers waiting on semaphore Signed-off-by: Richard Chapman --- roxie/ccd/ccd.hpp | 1 + roxie/ccd/ccdmain.cpp | 2 ++ roxie/ccd/ccdqueue.cpp | 11 ++++++++--- 3 files changed, 11 insertions(+), 3 deletions(-) diff --git a/roxie/ccd/ccd.hpp b/roxie/ccd/ccd.hpp index a8e2252b7e5..9bac5d78eda 100644 --- a/roxie/ccd/ccd.hpp +++ b/roxie/ccd/ccd.hpp @@ -390,6 +390,7 @@ extern bool ignoreFileDateMismatches; extern bool ignoreFileSizeMismatches; extern int fileTimeFuzzySeconds; extern SinkMode defaultSinkMode; +extern bool limitWaitingWorkers; #if defined(_CONTAINERIZED) || defined(SUBCHANNELS_IN_HEADER) static constexpr bool roxieMulticastEnabled = false; diff --git a/roxie/ccd/ccdmain.cpp b/roxie/ccd/ccdmain.cpp index 9d2680aa8ee..3eca077f7d9 100644 --- a/roxie/ccd/ccdmain.cpp +++ b/roxie/ccd/ccdmain.cpp @@ -203,6 +203,7 @@ unsigned maxGraphLoopIterations; bool steppingEnabled = true; bool simpleLocalKeyedJoins = true; bool adhocRoxie = false; +bool limitWaitingWorkers = false; unsigned __int64 minFreeDiskSpace = 1024 * 0x100000; // default to 1 GB unsigned socketCheckInterval = 5000; @@ -1279,6 +1280,7 @@ int CCD_API roxie_main(int argc, const char *argv[], const char * defaultYaml) const char *sinkModeText = topology->queryProp("@sinkMode"); if (sinkModeText) defaultSinkMode = getSinkMode(sinkModeText); + limitWaitingWorkers = topology->getPropBool("@limitWaitingWorkers", limitWaitingWorkers); cacheReportPeriodSeconds = topology->getPropInt("@cacheReportPeriodSeconds", 5*60); setLegacyAES(topology->getPropBool("expert/@useLegacyAES", false)); diff --git a/roxie/ccd/ccdqueue.cpp b/roxie/ccd/ccdqueue.cpp index 669c6530180..be77b7a5896 100644 --- a/roxie/ccd/ccdqueue.cpp +++ b/roxie/ccd/ccdqueue.cpp @@ -1157,6 +1157,7 @@ class RoxieQueue : public CInterface, implements IThreadFactory Owned workers; QueueOf waiting; Semaphore available; + CriticalSection availCrit; // Semaphore post may be slow with a lot of waiters - this crit may be used to limit to a single waiter CriticalSection qcrit; unsigned headRegionSize; unsigned numWorkers; @@ -1324,7 +1325,10 @@ class RoxieQueue : public CInterface, implements IThreadFactory void wait() { idle++; - available.wait(); + { + CLeavableCriticalBlock b(availCrit, limitWaitingWorkers); + available.wait(); + } idle--; } @@ -1431,16 +1435,17 @@ class CRoxieWorker : public CInterface, implements IPooledThread } inline void setPacket(IRoxieQueryPacket *p) { + Owned temp(p); CriticalBlock b(actCrit); if (p) { - packet.setown(p); + packet.swap(temp); packetHeader.copy(p->queryHeader()); } else { packetHeader.clear(); - packet.setown(p); + packet.swap(temp); } } inline bool match(RoxiePacketHeader &h) From 32402f5a2d683f559e69ad25bcb4bd036cf907f0 Mon Sep 17 00:00:00 2001 From: Richard Chapman Date: Wed, 2 Oct 2024 14:57:28 +0100 Subject: [PATCH 3/3] HPCC-32782 Remove headRegionSize option and associated code This was not used (I hope!) and was desiged to solve an issue that was better managed by the IBYTI delay logic. Signed-off-by: Richard Chapman --- roxie/ccd/ccd.hpp | 1 - roxie/ccd/ccdmain.cpp | 3 --- roxie/ccd/ccdqueue.cpp | 44 +++-------------------------------------- roxie/udplib/udplib.hpp | 3 --- 4 files changed, 3 insertions(+), 48 deletions(-) diff --git a/roxie/ccd/ccd.hpp b/roxie/ccd/ccd.hpp index 9bac5d78eda..86a901a7c71 100644 --- a/roxie/ccd/ccd.hpp +++ b/roxie/ccd/ccd.hpp @@ -296,7 +296,6 @@ extern unsigned callbackTimeout; extern unsigned lowTimeout; extern unsigned highTimeout; extern unsigned slaTimeout; -extern unsigned headRegionSize; extern unsigned ccdMulticastPort; extern IPropertyTree *topology; extern MapStringTo *preferredClusters; diff --git a/roxie/ccd/ccdmain.cpp b/roxie/ccd/ccdmain.cpp index 3eca077f7d9..d0af342b917 100644 --- a/roxie/ccd/ccdmain.cpp +++ b/roxie/ccd/ccdmain.cpp @@ -75,7 +75,6 @@ unsigned numRequestArrayThreads = 5; bool blockedLocalAgent = true; bool acknowledgeAllRequests = true; unsigned packetAcknowledgeTimeout = 100; -unsigned headRegionSize; unsigned ccdMulticastPort; bool enableHeartBeat = true; unsigned parallelLoopFlowLimit = 100; @@ -1000,7 +999,6 @@ int CCD_API roxie_main(int argc, const char *argv[], const char * defaultYaml) minPayloadSize = topology->getPropInt("@minPayloadSize", minPayloadSize); blockedLocalAgent = topology->getPropBool("@blockedLocalAgent", blockedLocalAgent); acknowledgeAllRequests = topology->getPropBool("@acknowledgeAllRequests", acknowledgeAllRequests); - headRegionSize = topology->getPropInt("@headRegionSize", 0); packetAcknowledgeTimeout = topology->getPropInt("@packetAcknowledgeTimeout", packetAcknowledgeTimeout); ccdMulticastPort = topology->getPropInt("@multicastPort", CCD_MULTICAST_PORT); statsExpiryTime = topology->getPropInt("@statsExpiryTime", 3600); @@ -1450,7 +1448,6 @@ int CCD_API roxie_main(int argc, const char *argv[], const char * defaultYaml) DBGLOG("Loading all packages took %ums", loadPackageTimer.elapsedMs()); ROQ = createOutputQueueManager(numAgentThreads, encryptInTransit); - ROQ->setHeadRegionSize(headRegionSize); ROQ->start(); Owned packetDiscarder = createPacketDiscarder(); #if defined(WIN32) && defined(_DEBUG) && defined(_DEBUG_HEAP_FULL) diff --git a/roxie/ccd/ccdqueue.cpp b/roxie/ccd/ccdqueue.cpp index be77b7a5896..e0ad44803d8 100644 --- a/roxie/ccd/ccdqueue.cpp +++ b/roxie/ccd/ccdqueue.cpp @@ -1159,7 +1159,6 @@ class RoxieQueue : public CInterface, implements IThreadFactory Semaphore available; CriticalSection availCrit; // Semaphore post may be slow with a lot of waiters - this crit may be used to limit to a single waiter CriticalSection qcrit; - unsigned headRegionSize; unsigned numWorkers; RelaxedAtomic started; std::atomic idle; @@ -1181,9 +1180,8 @@ class RoxieQueue : public CInterface, implements IThreadFactory public: IMPLEMENT_IINTERFACE; - RoxieQueue(unsigned _headRegionSize, unsigned _numWorkers) + RoxieQueue(unsigned _numWorkers) { - headRegionSize = _headRegionSize; numWorkers = _numWorkers; workers.setown(createThreadPool("RoxieWorkers", this, false, nullptr, numWorkers)); started = 0; @@ -1340,31 +1338,7 @@ class RoxieQueue : public CInterface, implements IThreadFactory ISerializedRoxieQueryPacket *dequeue() { CriticalBlock qc(qcrit); - unsigned lim = waiting.ordinality(); - if (lim) - { - if (headRegionSize) - { - if (lim > headRegionSize) - lim = headRegionSize; - return waiting.dequeue(fastRand() % lim); - } - return waiting.dequeue(); - } - else - return NULL; - } - - unsigned getHeadRegionSize() const - { - return headRegionSize; - } - - unsigned setHeadRegionSize(unsigned newsize) - { - unsigned ret = headRegionSize; - headRegionSize = newsize; - return ret; + return waiting.dequeue(); } void noteOrphanIBYTI(const RoxiePacketHeader &hdr) @@ -1914,20 +1888,8 @@ class RoxieReceiverBase : implements IRoxieOutputQueueManager, public CInterface public: IMPLEMENT_IINTERFACE; - RoxieReceiverBase(unsigned _numWorkers) : slaQueue(headRegionSize, _numWorkers), hiQueue(headRegionSize, _numWorkers), loQueue(headRegionSize, _numWorkers), numWorkers(_numWorkers) - { - } - - virtual unsigned getHeadRegionSize() const - { - return loQueue.getHeadRegionSize(); - } - - virtual void setHeadRegionSize(unsigned newSize) + RoxieReceiverBase(unsigned _numWorkers) : slaQueue(_numWorkers), hiQueue(_numWorkers), loQueue(_numWorkers), numWorkers(_numWorkers) { - slaQueue.setHeadRegionSize(newSize); - hiQueue.setHeadRegionSize(newSize); - loQueue.setHeadRegionSize(newSize); } virtual void start() diff --git a/roxie/udplib/udplib.hpp b/roxie/udplib/udplib.hpp index ebd674376df..56d75c36d35 100644 --- a/roxie/udplib/udplib.hpp +++ b/roxie/udplib/udplib.hpp @@ -177,9 +177,6 @@ interface IRoxieOutputQueueManager : public IInterface virtual bool replyPending(RoxiePacketHeader &x) = 0; virtual bool abortCompleted(RoxiePacketHeader &x) = 0; - virtual unsigned getHeadRegionSize() const = 0; - virtual void setHeadRegionSize(unsigned newsize) = 0; - virtual void start() = 0; virtual void stop() = 0; virtual void join() = 0;