From: Stefan Eissing Date: Wed, 25 May 2022 12:09:36 +0000 (+0000) Subject: Merge /httpd/httpd/trunk:r1899858,1899865,1899884,1900991 X-Git-Tag: 2.4.54-rc1-candidate~39 X-Git-Url: http://git.ipfire.org/cgi-bin/gitweb.cgi?a=commitdiff_plain;h=5f3010a643ac7c67b733484797d41366e328ecdb;p=thirdparty%2Fapache%2Fhttpd.git Merge /httpd/httpd/trunk:r1899858,1899865,1899884,1900991 *) mpm_event, mpm_worker: Handle children killed pathologically. git-svn-id: https://svn.apache.org/repos/asf/httpd/httpd/branches/2.4.x@1901234 13f79535-47bb-0310-9956-ffa450edef68 --- diff --git a/changes-entries/event_early_killed_children.txt b/changes-entries/event_early_killed_children.txt new file mode 100644 index 00000000000..db968c69775 --- /dev/null +++ b/changes-entries/event_early_killed_children.txt @@ -0,0 +1,2 @@ + *) MPM event: Restart children processes killed before idle maintenance. + PR 65769. [Yann Ylavic, Ruediger Pluem] diff --git a/server/mpm/event/event.c b/server/mpm/event/event.c index ff260ef9489..3672f449634 100644 --- a/server/mpm/event/event.c +++ b/server/mpm/event/event.c @@ -3058,6 +3058,7 @@ static void server_main_loop(int remaining_children_to_start) { int num_buckets = retained->mpm->num_buckets; int max_daemon_used = 0; + int successive_kills = 0; int child_slot; apr_exit_why_e exitwhy; int status, processed_status; @@ -3136,11 +3137,30 @@ static void server_main_loop(int remaining_children_to_start) /* Don't perform idle maintenance when a child dies, * only do it when there's a timeout. Remember only a * finite number of children can die, and it's pretty - * pathological for a lot to die suddenly. + * pathological for a lot to die suddenly. If a child is + * killed by a signal (faulting) we want to restart it ASAP + * though, up to 3 successive faults or we stop this until + * a timeout happens again (to avoid the flood of fork()ed + * processes that keep being killed early). 
*/ - continue; + if (child_slot < 0 || !APR_PROC_CHECK_SIGNALED(exitwhy)) { + continue; + } + if (++successive_kills >= 3) { + if (successive_kills % 10 == 3) { + ap_log_error(APLOG_MARK, APLOG_WARNING, 0, + ap_server_conf, APLOGNO(10392) + "children are killed successively!"); + } + continue; + } + ++remaining_children_to_start; + } + else { + successive_kills = 0; } - else if (remaining_children_to_start) { + + if (remaining_children_to_start) { /* we hit a 1 second timeout in which none of the previous * generation of children needed to be reaped... so assume * they're all done, and pick up the slack if any is left. diff --git a/server/mpm/worker/worker.c b/server/mpm/worker/worker.c index 7e3a5542406..0907db3281c 100644 --- a/server/mpm/worker/worker.c +++ b/server/mpm/worker/worker.c @@ -1590,6 +1590,7 @@ static void perform_idle_server_maintenance(int child_bucket) static void server_main_loop(int remaining_children_to_start) { int num_buckets = retained->mpm->num_buckets; + int successive_kills = 0; ap_generation_t old_gen; int child_slot; apr_exit_why_e exitwhy; @@ -1684,11 +1685,30 @@ static void server_main_loop(int remaining_children_to_start) /* Don't perform idle maintenance when a child dies, * only do it when there's a timeout. Remember only a * finite number of children can die, and it's pretty - * pathological for a lot to die suddenly. + * pathological for a lot to die suddenly. If a child is + * killed by a signal (faulting) we want to restart it ASAP + * though, up to 3 successive faults or we stop this until + * a timeout happens again (to avoid the flood of fork()ed + * processes that keep being killed early). 
*/ - continue; + if (child_slot < 0 || !APR_PROC_CHECK_SIGNALED(exitwhy)) { + continue; + } + if (++successive_kills >= 3) { + if (successive_kills % 10 == 3) { + ap_log_error(APLOG_MARK, APLOG_WARNING, 0, + ap_server_conf, APLOGNO(10392) + "children are killed successively!"); + } + continue; + } + ++remaining_children_to_start; + } + else { + successive_kills = 0; } - else if (remaining_children_to_start) { + + if (remaining_children_to_start) { /* we hit a 1 second timeout in which none of the previous * generation of children needed to be reaped... so assume * they're all done, and pick up the slack if any is left.