debugobjects: Add percpu free pools

author Waiman Long <longman@redhat.com>

Mon, 20 May 2019 14:14:46 +0000 (10:14 -0400)

committer Thomas Gleixner <tglx@linutronix.de>

Fri, 14 Jun 2019 12:51:14 +0000 (14:51 +0200)
author Waiman Long <longman@redhat.com>
Mon, 20 May 2019 14:14:46 +0000 (10:14 -0400)
committer Thomas Gleixner <tglx@linutronix.de>
Fri, 14 Jun 2019 12:51:14 +0000 (14:51 +0200)
diff --git a/lib/debugobjects.c b/lib/debugobjects.c

index 2ac4228..38c23b5 100644 (file)
--- a/lib/debugobjects.c
+++ b/lib/debugobjects.c
@@ -25,6 +25,7 @@
  
  #define ODEBUG_POOL_SIZE       1024
  #define ODEBUG_POOL_MIN_LEVEL  256
  
  #define ODEBUG_POOL_SIZE       1024
  #define ODEBUG_POOL_MIN_LEVEL  256
+#define ODEBUG_POOL_PERCPU_SIZE        64
  
  #define ODEBUG_CHUNK_SHIFT     PAGE_SHIFT
  #define ODEBUG_CHUNK_SIZE      (1 << ODEBUG_CHUNK_SHIFT)
  
  #define ODEBUG_CHUNK_SHIFT     PAGE_SHIFT
  #define ODEBUG_CHUNK_SIZE      (1 << ODEBUG_CHUNK_SHIFT)
@@ -35,6 +36,17 @@ struct debug_bucket {
         raw_spinlock_t          lock;
  };
  
         raw_spinlock_t          lock;
  };
  
+/*
+ * Debug object percpu free list
+ * Access is protected by disabling irq
+ */
+struct debug_percpu_free {
+       struct hlist_head       free_objs;      /* free objects cached on this CPU */
+       int                     obj_free;       /* number of objects on free_objs */
+};
+
+static DEFINE_PER_CPU(struct debug_percpu_free, percpu_obj_pool);
+
  static struct debug_bucket     obj_hash[ODEBUG_HASH_SIZE];
  
  static struct debug_obj                obj_static_pool[ODEBUG_POOL_SIZE] __initdata;
  static struct debug_bucket     obj_hash[ODEBUG_HASH_SIZE];
  
  static struct debug_obj                obj_static_pool[ODEBUG_POOL_SIZE] __initdata;
@@ -44,13 +56,19 @@ static DEFINE_RAW_SPINLOCK(pool_lock);
  static HLIST_HEAD(obj_pool);
  static HLIST_HEAD(obj_to_free);
  
  static HLIST_HEAD(obj_pool);
  static HLIST_HEAD(obj_to_free);
  
+/*
+ * Because of the presence of percpu free pools, obj_pool_free will
+ * under-count the objects held in the percpu free pools. Similarly,
+ * obj_pool_used will over-count them. Both values are adjusted in
+ * debug_stats_show(). obj_pool_min_free and obj_pool_max_used are not
+ * adjusted and can therefore be off.
+ */
  static int                     obj_pool_min_free = ODEBUG_POOL_SIZE;
  static int                     obj_pool_free = ODEBUG_POOL_SIZE;
  static int                     obj_pool_used;
  static int                     obj_pool_max_used;
  /* The number of objs on the global free list */
  static int                     obj_nr_tofree;
  static int                     obj_pool_min_free = ODEBUG_POOL_SIZE;
  static int                     obj_pool_free = ODEBUG_POOL_SIZE;
  static int                     obj_pool_used;
  static int                     obj_pool_max_used;
  /* The number of objs on the global free list */
  static int                     obj_nr_tofree;
-static struct kmem_cache       *obj_cache;
  
  static int                     debug_objects_maxchain __read_mostly;
  static int __maybe_unused      debug_objects_maxchecked __read_mostly;
  
  static int                     debug_objects_maxchain __read_mostly;
  static int __maybe_unused      debug_objects_maxchecked __read_mostly;
@@ -63,6 +81,7 @@ static int                    debug_objects_pool_size __read_mostly
  static int                     debug_objects_pool_min_level __read_mostly
                                 = ODEBUG_POOL_MIN_LEVEL;
  static struct debug_obj_descr  *descr_test  __read_mostly;
  static int                     debug_objects_pool_min_level __read_mostly
                                 = ODEBUG_POOL_MIN_LEVEL;
  static struct debug_obj_descr  *descr_test  __read_mostly;
+static struct kmem_cache       *obj_cache __read_mostly;
  
  /*
   * Track numbers of kmem_cache_alloc()/free() calls done.
  
  /*
   * Track numbers of kmem_cache_alloc()/free() calls done.
@@ -163,26 +182,42 @@ static struct debug_obj *lookup_object(void *addr, struct debug_bucket *b)
  }
  
  /*
  }
  
  /*
+ * Detach and return the first object on @list, or NULL if it is empty.
+ */
+static struct debug_obj *__alloc_object(struct hlist_head *list)
+{
+       struct debug_obj *obj = NULL;
+
+       if (list->first) {
+               obj = hlist_entry(list->first, typeof(*obj), node);
+               hlist_del(&obj->node);  /* unlink it from @list */
+       }
+
+       return obj;
+}
+
+/*
   * Allocate a new object. If the pool is empty, switch off the debugger.
   * Must be called with interrupts disabled.
   */
  static struct debug_obj *
  alloc_object(void *addr, struct debug_bucket *b, struct debug_obj_descr *descr)
  {
   * Allocate a new object. If the pool is empty, switch off the debugger.
   * Must be called with interrupts disabled.
   */
  static struct debug_obj *
  alloc_object(void *addr, struct debug_bucket *b, struct debug_obj_descr *descr)
  {
-       struct debug_obj *obj = NULL;
-
-       raw_spin_lock(&pool_lock);
-       if (obj_pool.first) {
-               obj         = hlist_entry(obj_pool.first, typeof(*obj), node);
-
-               obj->object = addr;
-               obj->descr  = descr;
-               obj->state  = ODEBUG_STATE_NONE;
-               obj->astate = 0;
-               hlist_del(&obj->node);
+       struct debug_percpu_free *percpu_pool;
+       struct debug_obj *obj;
  
  
-               hlist_add_head(&obj->node, &b->list);
+       if (likely(obj_cache)) {
+               percpu_pool = this_cpu_ptr(&percpu_obj_pool);
+               obj = __alloc_object(&percpu_pool->free_objs);
+               if (obj) {
+                       percpu_pool->obj_free--;
+                       goto init_obj;
+               }
+       }
  
  
+       raw_spin_lock(&pool_lock);
+       obj = __alloc_object(&obj_pool);
+       if (obj) {
                 obj_pool_used++;
                 if (obj_pool_used > obj_pool_max_used)
                         obj_pool_max_used = obj_pool_used;
                 obj_pool_used++;
                 if (obj_pool_used > obj_pool_max_used)
                         obj_pool_max_used = obj_pool_used;
@@ -193,6 +228,14 @@ alloc_object(void *addr, struct debug_bucket *b, struct debug_obj_descr *descr)
         }
         raw_spin_unlock(&pool_lock);
  
         }
         raw_spin_unlock(&pool_lock);
  
+init_obj:
+       if (obj) {
+               obj->object = addr;
+               obj->descr  = descr;
+               obj->state  = ODEBUG_STATE_NONE;
+               obj->astate = 0;
+               hlist_add_head(&obj->node, &b->list);
+       }
         return obj;
  }
  
         return obj;
  }
  
@@ -247,8 +290,21 @@ static bool __free_object(struct debug_obj *obj)
  {
         unsigned long flags;
         bool work;
  {
         unsigned long flags;
         bool work;
+       struct debug_percpu_free *percpu_pool;
  
  
-       raw_spin_lock_irqsave(&pool_lock, flags);
+       local_irq_save(flags);
+       /*
+        * Try to free it into the percpu pool first.
+        */
+       percpu_pool = this_cpu_ptr(&percpu_obj_pool);
+       if (obj_cache && percpu_pool->obj_free < ODEBUG_POOL_PERCPU_SIZE) {
+               hlist_add_head(&obj->node, &percpu_pool->free_objs);
+               percpu_pool->obj_free++;
+               local_irq_restore(flags);
+               return false;
+       }
+
+       raw_spin_lock(&pool_lock);
         work = (obj_pool_free > debug_objects_pool_size) && obj_cache;
         obj_pool_used--;
  
         work = (obj_pool_free > debug_objects_pool_size) && obj_cache;
         obj_pool_used--;
  
@@ -259,7 +315,8 @@ static bool __free_object(struct debug_obj *obj)
                 obj_pool_free++;
                 hlist_add_head(&obj->node, &obj_pool);
         }
                 obj_pool_free++;
                 hlist_add_head(&obj->node, &obj_pool);
         }
-       raw_spin_unlock_irqrestore(&pool_lock, flags);
+       raw_spin_unlock(&pool_lock);
+       local_irq_restore(flags);
         return work;
  }
  
         return work;
  }
  
@@ -822,13 +879,19 @@ void debug_check_no_obj_freed(const void *address, unsigned long size)
  
  static int debug_stats_show(struct seq_file *m, void *v)
  {
  
  static int debug_stats_show(struct seq_file *m, void *v)
  {
+       int cpu, obj_percpu_free = 0;
+
+       for_each_possible_cpu(cpu)
+               obj_percpu_free += per_cpu(percpu_obj_pool.obj_free, cpu);
+
         seq_printf(m, "max_chain     :%d\n", debug_objects_maxchain);
         seq_printf(m, "max_checked   :%d\n", debug_objects_maxchecked);
         seq_printf(m, "warnings      :%d\n", debug_objects_warnings);
         seq_printf(m, "fixups        :%d\n", debug_objects_fixups);
         seq_printf(m, "max_chain     :%d\n", debug_objects_maxchain);
         seq_printf(m, "max_checked   :%d\n", debug_objects_maxchecked);
         seq_printf(m, "warnings      :%d\n", debug_objects_warnings);
         seq_printf(m, "fixups        :%d\n", debug_objects_fixups);
-       seq_printf(m, "pool_free     :%d\n", obj_pool_free);
+       seq_printf(m, "pool_free     :%d\n", obj_pool_free + obj_percpu_free);
+       seq_printf(m, "pool_pcp_free :%d\n", obj_percpu_free);
         seq_printf(m, "pool_min_free :%d\n", obj_pool_min_free);
         seq_printf(m, "pool_min_free :%d\n", obj_pool_min_free);
-       seq_printf(m, "pool_used     :%d\n", obj_pool_used);
+       seq_printf(m, "pool_used     :%d\n", obj_pool_used - obj_percpu_free);
         seq_printf(m, "pool_max_used :%d\n", obj_pool_max_used);
         seq_printf(m, "on_free_list  :%d\n", obj_nr_tofree);
         seq_printf(m, "objs_allocated:%d\n", debug_objects_allocated);
         seq_printf(m, "pool_max_used :%d\n", obj_pool_max_used);
         seq_printf(m, "on_free_list  :%d\n", obj_nr_tofree);
         seq_printf(m, "objs_allocated:%d\n", debug_objects_allocated);
@@ -1165,9 +1228,20 @@ free:
   */
  void __init debug_objects_mem_init(void)
  {
   */
  void __init debug_objects_mem_init(void)
  {
+       int cpu;
+
         if (!debug_objects_enabled)
                 return;
  
         if (!debug_objects_enabled)
                 return;
  
+       /*
+        * Initialize the percpu object pools
+        *
+        * Initialization is not strictly necessary, but is done for
+        * completeness.
+        */
+       for_each_possible_cpu(cpu)
+               INIT_HLIST_HEAD(&per_cpu(percpu_obj_pool.free_objs, cpu));
+
         obj_cache = kmem_cache_create("debug_objects_cache",
                                       sizeof (struct debug_obj), 0,
                                       SLAB_DEBUG_OBJECTS | SLAB_NOLEAKTRACE,
         obj_cache = kmem_cache_create("debug_objects_cache",
                                       sizeof (struct debug_obj), 0,
                                       SLAB_DEBUG_OBJECTS | SLAB_NOLEAKTRACE,
@@ -1179,11 +1253,4 @@ void __init debug_objects_mem_init(void)
                 pr_warn("out of memory.\n");
         } else
                 debug_objects_selftest();
                 pr_warn("out of memory.\n");
         } else
                 debug_objects_selftest();
-
-       /*
-        * Increase the thresholds for allocating and freeing objects
-        * according to the number of possible CPUs available in the system.
-        */
-       debug_objects_pool_size += num_possible_cpus() * 32;
-       debug_objects_pool_min_level += num_possible_cpus() * 4;
  }
  }
author	Waiman Long <longman@redhat.com>
	Mon, 20 May 2019 14:14:46 +0000 (10:14 -0400)
committer	Thomas Gleixner <tglx@linutronix.de>
	Fri, 14 Jun 2019 12:51:14 +0000 (14:51 +0200)