MEDIUM: hlua: take nbthread into account in hlua_get_nb_instruction()

author Aurelien DARRAGON <adarragon@haproxy.com>

Wed, 15 May 2024 08:02:27 +0000 (10:02 +0200)

committer Aurelien DARRAGON <adarragon@haproxy.com>

Wed, 15 May 2024 09:59:44 +0000 (11:59 +0200)
author Aurelien DARRAGON <adarragon@haproxy.com>
Wed, 15 May 2024 08:02:27 +0000 (10:02 +0200)
committer Aurelien DARRAGON <adarragon@haproxy.com>
Wed, 15 May 2024 09:59:44 +0000 (11:59 +0200)
diff --git a/doc/configuration.txt b/doc/configuration.txt

index 7732843427beaf386a512b00bd89b5f9f5779f67..27a616e6ba91dc57538d4a6a3c0365997960aabd 100644 (file)
--- a/doc/configuration.txt
+++ b/doc/configuration.txt
@@ -3456,10 +3456,17 @@ tune.lua.forced-yield <number>
    This directive forces the Lua engine to execute a yield each <number> of
    instructions executed. This permits interrupting a long script and allows the
    HAProxy scheduler to process other tasks like accepting connections or
-  forwarding traffic. The default value is 10000 instructions. If HAProxy often
-  executes some Lua code but more responsiveness is required, this value can be
-  lowered. If the Lua code is quite long and its result is absolutely required
-  to process the data, the <number> can be increased.
+  forwarding traffic. The default value is 10000 instructions for scripts loaded
+  using "lua-load-per-thread" and MAX(500, 10000 / nbthread) instructions for
+  scripts loaded using "lua-load" (it was found to be an optimal value for
+  performance while taking care of not creating thread contention with multiple
+  threads competing for the global lua lock).
+
+  If HAProxy often executes some Lua code but more responsiveness is required,
+  this value can be lowered. If the Lua code is quite long and its result is
+  absolutely required to process the data, the <number> can be increased, but
+  the value should be set wisely as in multithreading context it could increase
+  contention.
  
  tune.lua.maxmem <number>
    Sets the maximum amount of RAM in megabytes per process usable by Lua. By
diff --git a/src/hlua.c b/src/hlua.c

index 6fe64be85abae7e492170e3afb8b99253d629f27..098107f7aea35c6053b404cb0c703b87b8fc4117 100644 (file)
--- a/src/hlua.c
+++ b/src/hlua.c
@@ -516,7 +516,15 @@ static inline int hlua_timer_check(const struct hlua_timer *timer)
  
  /* Interrupts the Lua processing each "hlua_nb_instruction" instructions.
   * it is used for preventing infinite loops.
+ */
+static unsigned int hlua_nb_instruction = 0;
+
+/* Wrapper to retrieve the number of instructions between two interrupts
+ * depending on user settings and current hlua context. If not already
+ * explicitly set, we compute the ideal value using hard limits releaved
+ * by Thierry Fournier's work, whose original notes may be found below:
   *
+ * --
   * I test the scheer with an infinite loop containing one incrementation
   * and one test. I run this loop between 10 seconds, I raise a ceil of
   * 710M loops from one interrupt each 9000 instructions, so I fix the value
@@ -537,16 +545,41 @@ static inline int hlua_timer_check(const struct hlua_timer *timer)
   *  10000         | 710
   *  100000        | 710
   *  1000000       | 710
+ * --
   *
- */
-static unsigned int hlua_nb_instruction = 10000;
-
-/* Wrapper to retrieve the number of instructions between two interrupts
- * depending on user settings and current hlua context.
+ * Thanks to his work, we know we can safely use values between 500 and 10000
+ * without a significant impact on performance.
   */
  static inline unsigned int hlua_get_nb_instruction(struct hlua *hlua)
  {
-       return hlua_nb_instruction;
+       int ceil = 10000; /* above 10k, no significant performance gain */
+       int floor = 500;  /* below 500, significant performance loss */
+
+       if (hlua_nb_instruction) {
+               /* value enforced by user */
+               return hlua_nb_instruction;
+       }
+
+       /* not set, assign automatic value */
+       if (hlua->state_id == 0) {
+               /* this function is expected to be called during runtime (after config
+                * parsing), thus global.nb_thread is expected to be set.
+                */
+               BUG_ON(global.nbthread == 0);
+
+               /* main lua stack (shared global lock), take number of threads into
+                * account in an attempt to reduce thread contention
+                */
+               return MAX(floor, ceil / global.nbthread);
+       }
+       else {
+               /* per-thread lua stack, less contention is expected (no global lock),
+                * allow up to the maximum number of instructions and hope that the
+                * user manually yields after heavy (lock dependent) work from lua
+                * script (e.g.: map manipulation).
+                */
+               return ceil;
+       }
  }
  
  /* Descriptor for the memory allocation state. The limit is pre-initialised to
author	Aurelien DARRAGON <adarragon@haproxy.com>
	Wed, 15 May 2024 08:02:27 +0000 (10:02 +0200)
committer	Aurelien DARRAGON <adarragon@haproxy.com>
	Wed, 15 May 2024 09:59:44 +0000 (11:59 +0200)
doc/configuration.txt		patch \| blob \| blame \| history
src/hlua.c		patch \| blob \| blame \| history