#define MALLOC_DEBUG 0
#endif
+#define USE_TCACHE 1
+
+#if USE_TCACHE
+/* We want 64 entries.  MAX_TCACHE_SIZE is the largest request size we
+   cache; TCACHE_IDX is the number of bins, one per multiple of
+   MALLOC_ALIGNMENT.  */
+#define MAX_TCACHE_SIZE (MALLOC_ALIGNMENT * 63)
+#define TCACHE_IDX ((MAX_TCACHE_SIZE / MALLOC_ALIGNMENT) + 1)
+#define size2tidx(bytes) (((bytes) + MALLOC_ALIGNMENT - 1) / MALLOC_ALIGNMENT)
+
+/* size2tidx rounds up, so (assuming MALLOC_ALIGNMENT == 8)...
+   idx 0   bytes 0
+   idx 1   bytes 1..8
+   idx 2   bytes 9..16
+   etc.  */
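+/* For example, with MALLOC_ALIGNMENT == 8 (illustrative; the real
+   value is platform dependent): size2tidx (24) == 3 and
+   size2tidx (25) == 4.  */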
+
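+/* Default cap on the number of chunks cached in each bin; adjustable
+   at run time via mallopt (M_TCACHE_COUNT).  */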
+#define TCACHE_FILL_COUNT 7
+#endif
+
#ifdef NDEBUG
# define assert(expr) ((void) 0)
#else
/* First address handed out by MORECORE/sbrk. */
char *sbrk_base;
+
+#if USE_TCACHE
+  /* Maximum bin index (inclusive) to use. */
+ int tcache_max;
+ /* Maximum number of chunks in each bucket. */
+ int tcache_count;
+#endif
};
/* There are several instances of this struct ("arenas") in this
.trim_threshold = DEFAULT_TRIM_THRESHOLD,
#define NARENAS_FROM_NCORES(n) ((n) * (sizeof (long) == 4 ? 2 : 8))
.arena_test = NARENAS_FROM_NCORES (1)
+#if USE_TCACHE
+ ,
+ .tcache_count = TCACHE_FILL_COUNT,
+  .tcache_max = TCACHE_IDX - 1
+#endif
};
/* Non public mallopt parameters. */
#define M_ARENA_TEST -7
#define M_ARENA_MAX -8
+#define M_TCACHE_COUNT -9
+#define M_TCACHE_MAX -10
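+/* For example, mallopt (M_TCACHE_COUNT, 16) allows up to 16 cached
+   chunks per bin, and mallopt (M_TCACHE_MAX, 128) caches requests of
+   up to 128 bytes.  */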
/* Maximum size of memory handled in fastbins. */
/*------------------------ Public wrappers. --------------------------------*/
-#define USE_TCACHE 1
-
#if USE_TCACHE
-/* we want 64 entries */
-#define MAX_TCACHE_SIZE (MALLOC_ALIGNMENT * 63)
-#define TCACHE_IDX ((MAX_TCACHE_SIZE / MALLOC_ALIGNMENT) + 1)
-#define size2tidx(bytes) (((bytes) + MALLOC_ALIGNMENT - 1) / MALLOC_ALIGNMENT)
-
-/* Rounds up, so...
- idx 0 bytes 0
- idx 1 bytes 1..8
- idx 2 bytes 9..16
- etc
-*/
-
-#define TCACHE_FILL_COUNT 7
typedef struct TCacheEntry {
struct TCacheEntry *next;
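  /* Chunks in the cache are linked through their own user-data area,
     so an idle cached chunk consumes no memory beyond itself.  */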
__MTB_TRACE_ENTRY (MALLOC,bytes,NULL);
#if USE_TCACHE
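+  /* First consult the per-thread cache; a hit returns immediately,
+     without taking any arena lock.  */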
- if (tbytes < MAX_TCACHE_SIZE
+  if (tc_idx <= mp_.tcache_max
&& tcache.entries[tc_idx] != NULL
&& tcache.initted == 1)
{
/* This is fast but causes internal fragmentation, as it always pulls
   large chunks out of the cache but puts small chunks back in, leading
   to a large backlog of small chunks.  */
- if (tbytes < MAX_TCACHE_SIZE
+  if (tc_idx <= mp_.tcache_max
&& tcache.initted == 1)
{
void *ent;
tc_bytes = 2 * SIZE_SZ;
tc_ibytes = tc_bytes + 2*SIZE_SZ;
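  /* tc_bytes is the usable size of each cached chunk; tc_ibytes adds
     the chunk header overhead and is the stride from one carved-out
     chunk to the next.  */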
- total_bytes = tc_bytes + tc_ibytes * TCACHE_FILL_COUNT;
+ total_bytes = tc_bytes + tc_ibytes * mp_.tcache_count;
__MTB_TRACE_PATH (thread_cache);
__MTB_TRACE_PATH (cpu_cache);
m->size = tc_ibytes | flags;
flags |= PREV_INUSE;
- for (i = 0; i < TCACHE_FILL_COUNT; i++)
+ for (i = 0; i < mp_.tcache_count; i++)
{
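      /* The header of the i-th carved chunk is at m; e is
	 chunk2mem (m), the chunk's user data, where the free-list
	 link is stored.  */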
m = (mchunkptr) (ent + i * tc_ibytes + tc_bytes);
e = (TCacheEntry *) (ent + i * tc_ibytes + tc_ibytes);
int tc_idx = size2tidx (original_nb - SIZE_SZ);
int bits = chunk->size & SIZE_BITS;
- if (original_nb-SIZE_SZ > MAX_TCACHE_SIZE)
+ if (tc_idx > mp_.tcache_max)
return chunk;
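/* If DESIRED_SIZE is too big for the tcache, return it unchanged;
   otherwise round ACTUAL_SIZE down to a whole multiple of
   DESIRED_SIZE, capped at tcache_count chunks.  For example, with
   desired 32, actual 200, count 7: 200 - 200 % 32 = 192, and
   192 < 32 * 7 = 224, so 192 is returned.  */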
static int
_tcache_maxsize (INTERNAL_SIZE_T desired_size, INTERNAL_SIZE_T actual_size)
{
- if (desired_size-SIZE_SZ > MAX_TCACHE_SIZE)
+  if (size2tidx (desired_size - SIZE_SZ) > mp_.tcache_max)
return desired_size;
actual_size -= actual_size % desired_size;
- if (actual_size > desired_size * TCACHE_FILL_COUNT)
- actual_size = desired_size * TCACHE_FILL_COUNT;
+ if (actual_size > desired_size * mp_.tcache_count)
+ actual_size = desired_size * mp_.tcache_count;
return actual_size;
}
#endif
#if USE_TCACHE
/* While we're here, if we see other chunks of the same size,
   stash them in the tcache.  */
-    if (nb-SIZE_SZ < MAX_TCACHE_SIZE)
+    int tc_idx = size2tidx (nb - SIZE_SZ);
+    if (tc_idx <= mp_.tcache_max)
{
- int tc_idx = size2tidx (nb-SIZE_SZ);
mchunkptr tc_victim;
int found = 0;
/* While bin not empty and tcache not full, copy chunks over. */
- while (tcache.counts[tc_idx] < TCACHE_FILL_COUNT
+ while (tcache.counts[tc_idx] < mp_.tcache_count
&& (pp = *fb) != NULL)
{
do
#if USE_TCACHE
/* While we're here, if we see other chunks of the same size,
   stash them in the tcache.  */
-    if (nb-SIZE_SZ < MAX_TCACHE_SIZE)
+    int tc_idx = size2tidx (nb - SIZE_SZ);
+    if (tc_idx <= mp_.tcache_max)
{
- int tc_idx = size2tidx (nb-SIZE_SZ);
mchunkptr tc_victim;
int found = 0;
/* While bin not empty and tcache not full, copy chunks over. */
- while (tcache.counts[tc_idx] < TCACHE_FILL_COUNT
+ while (tcache.counts[tc_idx] < mp_.tcache_count
&& (tc_victim = last(bin)) != bin)
{
if (tc_victim != 0)
#if USE_TCACHE
INTERNAL_SIZE_T tcache_nb = 0;
//INTERNAL_SIZE_T tcache_max = 0;
- if (nb-SIZE_SZ <= MAX_TCACHE_SIZE)
+  if (size2tidx (nb - SIZE_SZ) <= mp_.tcache_max)
{
//int tc_idx = size2tidx (bytes);
tcache_nb = nb;
- //tcache_max = nb * (TCACHE_FILL_COUNT - tcache.counts[tc_idx]);
+ //tcache_max = nb * (mp_.tcache_count - tcache.counts[tc_idx]);
}
int tc_idx = size2tidx (nb-SIZE_SZ);
int return_cached = 0;
#if 0 && USE_TCACHE
/* This forces us to split up bigger chunks later */
&& tcache_nb
- && tcache.counts[tc_idx] < TCACHE_FILL_COUNT
+ && tcache.counts[tc_idx] < mp_.tcache_count
#endif
)
{
/* Fill cache first, return to user only if cache fills.
We may return one of these chunks later. */
if (tcache_nb
- && tcache.counts[tc_idx] < TCACHE_FILL_COUNT)
+ && tcache.counts[tc_idx] < mp_.tcache_count)
{
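	  /* Cache it: push the chunk onto the head of its bin's
	     list.  */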
TCacheEntry *e = (TCacheEntry *) chunk2mem(victim);
e->next = tcache.entries[tc_idx];
{
int tc_idx = size2tidx (size - SIZE_SZ);
- if (size - SIZE_SZ < MAX_TCACHE_SIZE
- && tcache.counts[tc_idx] < TCACHE_FILL_COUNT
+  if (tc_idx <= mp_.tcache_max
+ && tcache.counts[tc_idx] < mp_.tcache_count
&& tcache.initted == 1)
{
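      /* Eligible frees go straight into the thread cache; a later
	 malloc of the same size class can be served from here without
	 touching the arena.  */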
TCacheEntry *e = (TCacheEntry *) chunk2mem (p);
mp_.arena_max = value;
}
break;
+#if USE_TCACHE
+ case M_TCACHE_COUNT:
+ if (value >= 0)
+ {
+ LIBC_PROBE (memory_mallopt_tcache_count, 2, value, mp_.tcache_count);
+ mp_.tcache_count = value;
+ }
+ break;
+ case M_TCACHE_MAX:
+ if (value >= 0)
+ {
+ value = size2tidx (value);
+ if (value < TCACHE_IDX)
+ {
+ LIBC_PROBE (memory_mallopt_tcache_max, 2, value, mp_.tcache_max);
+ mp_.tcache_max = value;
+ }
+ }
+ break;
+#endif
}
(void) mutex_unlock (&av->mutex);
return res;