From: Victor Julien Date: Fri, 23 Oct 2015 16:29:10 +0000 (+0200) Subject: threading: avoid autofp deadlock X-Git-Tag: suricata-3.0RC1~34 X-Git-Url: http://git.ipfire.org/cgi-bin/gitweb.cgi?a=commitdiff_plain;h=refs%2Fpull%2F1716%2Fhead;p=thirdparty%2Fsuricata.git threading: avoid autofp deadlock When there are many threads and/or the packet pool (max-pending-packets) is small, a potential dead lock exists between the packet pool return pool logic and the capture threads. The autofp workers together can have all the packets in their return pools, while the capture thread(s) are waiting at an empty pool. A race between the worker threads and the capture thread, where the latter signals the former, is lost by the capture thread. Now everyone is waiting. To avoid this scenario, this patch makes the previously hardcoded 'return pool' threshold dynamic based on the number of threads and the packet pool size. It sets the threshold to the max pending packets value, divided by the number of lister threads. The max value hasn't changed. Normally, in the autofp runmode these are the stream/detect/log worker threads. The max_pending_return_packets value needs to stay below the packet pool size of the 'producers' (normally pkt capture threads but also flow timeout injection) to avoid the deadlock. As it's quite impossible at this time to learn how many threads will be created before starting the runmodes, and thus spawning the threads and already initializing the packet pools, this code sets a global variable after runmode setup, but before the threads are 'unpaused'. --- diff --git a/src/suricata.c b/src/suricata.c index 6c45c57e99..8ddd79fd7a 100644 --- a/src/suricata.c +++ b/src/suricata.c @@ -2367,6 +2367,7 @@ int main(int argc, char **argv) } (void) SC_ATOMIC_CAS(&engine_stage, SURICATA_INIT, SURICATA_RUNTIME); + PacketPoolPostRunmodes(); /* Un-pause all the paused threads */ TmThreadContinueThreads(); diff --git a/src/tmqh-packetpool.c b/src/tmqh-packetpool.c index a1f19dca46..75139254ee 100644 --- a/src/tmqh-packetpool.c +++ b/src/tmqh-packetpool.c @@ -38,6 +38,8 @@ #include "stream-tcp-reassemble.h" #include "tm-queuehandlers.h" +#include "tm-threads.h" +#include "tm-modules.h" #include "pkt-var.h" @@ -50,6 +52,7 @@ /* Number of freed packet to save for one pool before freeing them. */ #define MAX_PENDING_RETURN_PACKETS 32 +static uint32_t max_pending_return_packets = MAX_PENDING_RETURN_PACKETS; #ifdef TLS __thread PktPool thread_pkt_pool; @@ -313,7 +316,7 @@ void PacketPoolReturnPacket(Packet *p) p->next = my_pool->pending_head; my_pool->pending_head = p; my_pool->pending_count++; - if (SC_ATOMIC_GET(pool->return_stack.sync_now) || my_pool->pending_count > MAX_PENDING_RETURN_PACKETS) { + if (SC_ATOMIC_GET(pool->return_stack.sync_now) || my_pool->pending_count > max_pending_return_packets) { /* Return the entire list of pending packets. */ SCMutexLock(&pool->return_stack.mutex); my_pool->pending_tail->next = pool->return_stack.head; @@ -563,3 +566,34 @@ void TmqhReleasePacketsToPacketPool(PacketQueue *pq) return; } + +/** + * \brief Set the max_pending_return_packets value + * + * Set it to the max pending packets value, devided by the number + * of lister threads. Normally, in autofp these are the stream/detect/log + * worker threads. + * + * The max_pending_return_packets value needs to stay below the packet + * pool size of the 'producers' (normally pkt capture threads but also + * flow timeout injection ) to avoid a deadlock where all the 'workers' + * keep packets in their return pools, while the capture thread can't + * continue because its pool is empty. + */ +void PacketPoolPostRunmodes(void) +{ + extern intmax_t max_pending_packets; + + uint32_t threads = TmThreadCountThreadsByTmmFlags(TM_FLAG_DETECT_TM); + if (threads == 0) + return; + if (threads > max_pending_packets) + return; + + uint32_t packets = (max_pending_packets / threads) - 1; + if (packets < max_pending_return_packets) + max_pending_return_packets = packets; + + SCLogDebug("detect threads %u, max packets %u, max_pending_return_packets %u", + threads, (uint)threads, max_pending_return_packets); +} diff --git a/src/tmqh-packetpool.h b/src/tmqh-packetpool.h index ab45184c65..2b6b90b04e 100644 --- a/src/tmqh-packetpool.h +++ b/src/tmqh-packetpool.h @@ -78,5 +78,6 @@ void PacketPoolReturnPacket(Packet *p); void PacketPoolInit(void); void PacketPoolInitEmpty(void); void PacketPoolDestroy(void); +void PacketPoolPostRunmodes(void); #endif /* __TMQH_PACKETPOOL_H__ */