mm: have order > 0 compaction start off where it left

[cascardo/linux.git] / mm / slab.c
diff --git a/mm/slab.c b/mm/slab.c

index 105f188..1fcf3ac 100644 (file)
--- a/mm/slab.c
+++ b/mm/slab.c
@@ -68,7 +68,7 @@
   * Further notes from the original documentation:
   *
   * 11 April '97.  Started multi-threading - markhe
- *     The global cache-chain is protected by the mutex 'cache_chain_mutex'.
+ *     The global cache-chain is protected by the mutex 'slab_mutex'.
   *     The sem is only needed when accessing/extending the cache-chain, which
   *     can never happen inside an interrupt (kmem_cache_create(),
   *     kmem_cache_shrink() and kmem_cache_reap()).
@@ -87,6 +87,7 @@
   */
  
  #include       <linux/slab.h>
+#include       "slab.h"
  #include       <linux/mm.h>
  #include       <linux/poison.h>
  #include       <linux/swap.h>
@@ -565,27 +566,6 @@ static struct kmem_cache cache_cache = {
  
  #define BAD_ALIEN_MAGIC 0x01020304ul
  
-/*
- * chicken and egg problem: delay the per-cpu array allocation
- * until the general caches are up.
- */
-static enum {
-       NONE,
-       PARTIAL_AC,
-       PARTIAL_L3,
-       EARLY,
-       LATE,
-       FULL
-} g_cpucache_up;
-
-/*
- * used by boot code to determine if it can use slab based allocator
- */
-int slab_is_available(void)
-{
-       return g_cpucache_up >= EARLY;
-}
-
  #ifdef CONFIG_LOCKDEP
  
  /*
@@ -651,7 +631,7 @@ static void init_node_lock_keys(int q)
  {
         struct cache_sizes *s = malloc_sizes;
  
-       if (g_cpucache_up < LATE)
+       if (slab_state < UP)
                 return;
  
         for (s = malloc_sizes; s->cs_size != ULONG_MAX; s++) {
@@ -691,12 +671,6 @@ static void slab_set_debugobj_lock_classes(struct kmem_cache *cachep)
  }
  #endif
  
-/*
- * Guard access to the cache-chain.
- */
-static DEFINE_MUTEX(cache_chain_mutex);
-static struct list_head cache_chain;
-
  static DEFINE_PER_CPU(struct delayed_work, slab_reap_work);
  
  static inline struct array_cache *cpu_cache_get(struct kmem_cache *cachep)
@@ -1120,7 +1094,7 @@ static inline int cache_free_alien(struct kmem_cache *cachep, void *objp)
   * When hotplugging memory or a cpu, existing nodelists are not replaced if
   * already in use.
   *
- * Must hold cache_chain_mutex.
+ * Must hold slab_mutex.
   */
  static int init_cache_nodelists_node(int node)
  {
@@ -1128,7 +1102,7 @@ static int init_cache_nodelists_node(int node)
         struct kmem_list3 *l3;
         const int memsize = sizeof(struct kmem_list3);
  
-       list_for_each_entry(cachep, &cache_chain, list) {
+       list_for_each_entry(cachep, &slab_caches, list) {
                 /*
                  * Set up the size64 kmemlist for cpu before we can
                  * begin anything. Make sure some other cpu on this
@@ -1144,7 +1118,7 @@ static int init_cache_nodelists_node(int node)
  
                         /*
                          * The l3s don't come and go as CPUs come and
-                        * go.  cache_chain_mutex is sufficient
+                        * go.  slab_mutex is sufficient
                          * protection here.
                          */
                         cachep->nodelists[node] = l3;
@@ -1166,7 +1140,7 @@ static void __cpuinit cpuup_canceled(long cpu)
         int node = cpu_to_mem(cpu);
         const struct cpumask *mask = cpumask_of_node(node);
  
-       list_for_each_entry(cachep, &cache_chain, list) {
+       list_for_each_entry(cachep, &slab_caches, list) {
                 struct array_cache *nc;
                 struct array_cache *shared;
                 struct array_cache **alien;
@@ -1216,7 +1190,7 @@ free_array_cache:
          * the respective cache's slabs,  now we can go ahead and
          * shrink each nodelist to its limit.
          */
-       list_for_each_entry(cachep, &cache_chain, list) {
+       list_for_each_entry(cachep, &slab_caches, list) {
                 l3 = cachep->nodelists[node];
                 if (!l3)
                         continue;
@@ -1245,7 +1219,7 @@ static int __cpuinit cpuup_prepare(long cpu)
          * Now we can go ahead with allocating the shared arrays and
          * array caches
          */
-       list_for_each_entry(cachep, &cache_chain, list) {
+       list_for_each_entry(cachep, &slab_caches, list) {
                 struct array_cache *nc;
                 struct array_cache *shared = NULL;
                 struct array_cache **alien = NULL;
@@ -1313,9 +1287,9 @@ static int __cpuinit cpuup_callback(struct notifier_block *nfb,
         switch (action) {
         case CPU_UP_PREPARE:
         case CPU_UP_PREPARE_FROZEN:
-               mutex_lock(&cache_chain_mutex);
+               mutex_lock(&slab_mutex);
                 err = cpuup_prepare(cpu);
-               mutex_unlock(&cache_chain_mutex);
+               mutex_unlock(&slab_mutex);
                 break;
         case CPU_ONLINE:
         case CPU_ONLINE_FROZEN:
@@ -1325,7 +1299,7 @@ static int __cpuinit cpuup_callback(struct notifier_block *nfb,
         case CPU_DOWN_PREPARE:
         case CPU_DOWN_PREPARE_FROZEN:
                 /*
-                * Shutdown cache reaper. Note that the cache_chain_mutex is
+                * Shutdown cache reaper. Note that the slab_mutex is
                  * held so that if cache_reap() is invoked it cannot do
                  * anything expensive but will only modify reap_work
                  * and reschedule the timer.
@@ -1352,9 +1326,9 @@ static int __cpuinit cpuup_callback(struct notifier_block *nfb,
  #endif
         case CPU_UP_CANCELED:
         case CPU_UP_CANCELED_FROZEN:
-               mutex_lock(&cache_chain_mutex);
+               mutex_lock(&slab_mutex);
                 cpuup_canceled(cpu);
-               mutex_unlock(&cache_chain_mutex);
+               mutex_unlock(&slab_mutex);
                 break;
         }
         return notifier_from_errno(err);
@@ -1370,14 +1344,14 @@ static struct notifier_block __cpuinitdata cpucache_notifier = {
   * Returns -EBUSY if all objects cannot be drained so that the node is not
   * removed.
   *
- * Must hold cache_chain_mutex.
+ * Must hold slab_mutex.
   */
  static int __meminit drain_cache_nodelists_node(int node)
  {
         struct kmem_cache *cachep;
         int ret = 0;
  
-       list_for_each_entry(cachep, &cache_chain, list) {
+       list_for_each_entry(cachep, &slab_caches, list) {
                 struct kmem_list3 *l3;
  
                 l3 = cachep->nodelists[node];
@@ -1408,14 +1382,14 @@ static int __meminit slab_memory_callback(struct notifier_block *self,
  
         switch (action) {
         case MEM_GOING_ONLINE:
-               mutex_lock(&cache_chain_mutex);
+               mutex_lock(&slab_mutex);
                 ret = init_cache_nodelists_node(nid);
-               mutex_unlock(&cache_chain_mutex);
+               mutex_unlock(&slab_mutex);
                 break;
         case MEM_GOING_OFFLINE:
-               mutex_lock(&cache_chain_mutex);
+               mutex_lock(&slab_mutex);
                 ret = drain_cache_nodelists_node(nid);
-               mutex_unlock(&cache_chain_mutex);
+               mutex_unlock(&slab_mutex);
                 break;
         case MEM_ONLINE:
         case MEM_OFFLINE:
@@ -1519,8 +1493,8 @@ void __init kmem_cache_init(void)
         node = numa_mem_id();
  
         /* 1) create the cache_cache */
-       INIT_LIST_HEAD(&cache_chain);
-       list_add(&cache_cache.list, &cache_chain);
+       INIT_LIST_HEAD(&slab_caches);
+       list_add(&cache_cache.list, &slab_caches);
         cache_cache.colour_off = cache_line_size();
         cache_cache.array[smp_processor_id()] = &initarray_cache.cache;
         cache_cache.nodelists[node] = &initkmem_list3[CACHE_CACHE + node];
@@ -1558,7 +1532,7 @@ void __init kmem_cache_init(void)
          * bug.
          */
  
-       sizes[INDEX_AC].cs_cachep = kmem_cache_create(names[INDEX_AC].name,
+       sizes[INDEX_AC].cs_cachep = __kmem_cache_create(names[INDEX_AC].name,
                                         sizes[INDEX_AC].cs_size,
                                         ARCH_KMALLOC_MINALIGN,
                                         ARCH_KMALLOC_FLAGS|SLAB_PANIC,
@@ -1566,7 +1540,7 @@ void __init kmem_cache_init(void)
  
         if (INDEX_AC != INDEX_L3) {
                 sizes[INDEX_L3].cs_cachep =
-                       kmem_cache_create(names[INDEX_L3].name,
+                       __kmem_cache_create(names[INDEX_L3].name,
                                 sizes[INDEX_L3].cs_size,
                                 ARCH_KMALLOC_MINALIGN,
                                 ARCH_KMALLOC_FLAGS|SLAB_PANIC,
@@ -1584,14 +1558,14 @@ void __init kmem_cache_init(void)
                  * allow tighter packing of the smaller caches.
                  */
                 if (!sizes->cs_cachep) {
-                       sizes->cs_cachep = kmem_cache_create(names->name,
+                       sizes->cs_cachep = __kmem_cache_create(names->name,
                                         sizes->cs_size,
                                         ARCH_KMALLOC_MINALIGN,
                                         ARCH_KMALLOC_FLAGS|SLAB_PANIC,
                                         NULL);
                 }
  #ifdef CONFIG_ZONE_DMA
-               sizes->cs_dmacachep = kmem_cache_create(
+               sizes->cs_dmacachep = __kmem_cache_create(
                                         names->name_dma,
                                         sizes->cs_size,
                                         ARCH_KMALLOC_MINALIGN,
@@ -1649,24 +1623,27 @@ void __init kmem_cache_init(void)
                 }
         }
  
-       g_cpucache_up = EARLY;
+       slab_state = UP;
  }
  
  void __init kmem_cache_init_late(void)
  {
         struct kmem_cache *cachep;
  
-       g_cpucache_up = LATE;
+       slab_state = UP;
  
         /* Annotate slab for lockdep -- annotate the malloc caches */
         init_lock_keys();
  
         /* 6) resize the head arrays to their final sizes */
-       mutex_lock(&cache_chain_mutex);
-       list_for_each_entry(cachep, &cache_chain, list)
+       mutex_lock(&slab_mutex);
+       list_for_each_entry(cachep, &slab_caches, list)
                 if (enable_cpucache(cachep, GFP_NOWAIT))
                         BUG();
-       mutex_unlock(&cache_chain_mutex);
+       mutex_unlock(&slab_mutex);
+
+       /* Done! */
+       slab_state = FULL;
  
         /*
          * Register a cpu startup notifier callback that initializes
@@ -1699,7 +1676,7 @@ static int __init cpucache_init(void)
                 start_cpu_timer(cpu);
  
         /* Done! */
-       g_cpucache_up = FULL;
+       slab_state = FULL;
         return 0;
  }
  __initcall(cpucache_init);
@@ -2167,10 +2144,10 @@ static size_t calculate_slab_order(struct kmem_cache *cachep,
  
  static int __init_refok setup_cpu_cache(struct kmem_cache *cachep, gfp_t gfp)
  {
-       if (g_cpucache_up >= LATE)
+       if (slab_state >= FULL)
                 return enable_cpucache(cachep, gfp);
  
-       if (g_cpucache_up == NONE) {
+       if (slab_state == DOWN) {
                 /*
                  * Note: the first kmem_cache_create must create the cache
                  * that's used by kmalloc(24), otherwise the creation of
@@ -2185,16 +2162,16 @@ static int __init_refok setup_cpu_cache(struct kmem_cache *cachep, gfp_t gfp)
                  */
                 set_up_list3s(cachep, SIZE_AC);
                 if (INDEX_AC == INDEX_L3)
-                       g_cpucache_up = PARTIAL_L3;
+                       slab_state = PARTIAL_L3;
                 else
-                       g_cpucache_up = PARTIAL_AC;
+                       slab_state = PARTIAL_ARRAYCACHE;
         } else {
                 cachep->array[smp_processor_id()] =
                         kmalloc(sizeof(struct arraycache_init), gfp);
  
-               if (g_cpucache_up == PARTIAL_AC) {
+               if (slab_state == PARTIAL_ARRAYCACHE) {
                         set_up_list3s(cachep, SIZE_L3);
-                       g_cpucache_up = PARTIAL_L3;
+                       slab_state = PARTIAL_L3;
                 } else {
                         int node;
                         for_each_online_node(node) {
@@ -2220,7 +2197,7 @@ static int __init_refok setup_cpu_cache(struct kmem_cache *cachep, gfp_t gfp)
  }
  
  /**
- * kmem_cache_create - Create a cache.
+ * __kmem_cache_create - Create a cache.
   * @name: A string which is used in /proc/slabinfo to identify this cache.
   * @size: The size of objects to be created in this cache.
   * @align: The required alignment for the objects.
@@ -2247,59 +2224,14 @@ static int __init_refok setup_cpu_cache(struct kmem_cache *cachep, gfp_t gfp)
   * as davem.
   */
  struct kmem_cache *
-kmem_cache_create (const char *name, size_t size, size_t align,
+__kmem_cache_create (const char *name, size_t size, size_t align,
         unsigned long flags, void (*ctor)(void *))
  {
         size_t left_over, slab_size, ralign;
-       struct kmem_cache *cachep = NULL, *pc;
+       struct kmem_cache *cachep = NULL;
         gfp_t gfp;
  
-       /*
-        * Sanity checks... these are all serious usage bugs.
-        */
-       if (!name || in_interrupt() || (size < BYTES_PER_WORD) ||
-           size > KMALLOC_MAX_SIZE) {
-               printk(KERN_ERR "%s: Early error in slab %s\n", __func__,
-                               name);
-               BUG();
-       }
-
-       /*
-        * We use cache_chain_mutex to ensure a consistent view of
-        * cpu_online_mask as well.  Please see cpuup_callback
-        */
-       if (slab_is_available()) {
-               get_online_cpus();
-               mutex_lock(&cache_chain_mutex);
-       }
-
-       list_for_each_entry(pc, &cache_chain, list) {
-               char tmp;
-               int res;
-
-               /*
-                * This happens when the module gets unloaded and doesn't
-                * destroy its slab cache and no-one else reuses the vmalloc
-                * area of the module.  Print a warning.
-                */
-               res = probe_kernel_address(pc->name, tmp);
-               if (res) {
-                       printk(KERN_ERR
-                              "SLAB: cache with size %d has lost its name\n",
-                              pc->size);
-                       continue;
-               }
-
-               if (!strcmp(pc->name, name)) {
-                       printk(KERN_ERR
-                              "kmem_cache_create: duplicate cache %s\n", name);
-                       dump_stack();
-                       goto oops;
-               }
-       }
-
  #if DEBUG
-       WARN_ON(strchr(name, ' '));     /* It confuses parsers */
  #if FORCED_DEBUG
         /*
          * Enable redzoning and last user accounting, except for caches with
@@ -2388,7 +2320,7 @@ kmem_cache_create (const char *name, size_t size, size_t align,
         /* Get cache's description obj. */
         cachep = kmem_cache_zalloc(&cache_cache, gfp);
         if (!cachep)
-               goto oops;
+               return NULL;
  
         cachep->nodelists = (struct kmem_list3 **)&cachep->array[nr_cpu_ids];
         cachep->object_size = size;
@@ -2445,8 +2377,7 @@ kmem_cache_create (const char *name, size_t size, size_t align,
                 printk(KERN_ERR
                        "kmem_cache_create: couldn't create cache %s.\n", name);
                 kmem_cache_free(&cache_cache, cachep);
-               cachep = NULL;
-               goto oops;
+               return NULL;
         }
         slab_size = ALIGN(cachep->num * sizeof(kmem_bufctl_t)
                           + sizeof(struct slab), align);
@@ -2504,8 +2435,7 @@ kmem_cache_create (const char *name, size_t size, size_t align,
  
         if (setup_cpu_cache(cachep, gfp)) {
                 __kmem_cache_destroy(cachep);
-               cachep = NULL;
-               goto oops;
+               return NULL;
         }
  
         if (flags & SLAB_DEBUG_OBJECTS) {
@@ -2519,18 +2449,9 @@ kmem_cache_create (const char *name, size_t size, size_t align,
         }
  
         /* cache setup completed, link it into the list */
-       list_add(&cachep->list, &cache_chain);
-oops:
-       if (!cachep && (flags & SLAB_PANIC))
-               panic("kmem_cache_create(): failed to create slab `%s'\n",
-                     name);
-       if (slab_is_available()) {
-               mutex_unlock(&cache_chain_mutex);
-               put_online_cpus();
-       }
+       list_add(&cachep->list, &slab_caches);
         return cachep;
  }
-EXPORT_SYMBOL(kmem_cache_create);
  
  #if DEBUG
  static void check_irq_off(void)
@@ -2645,7 +2566,7 @@ out:
         return nr_freed;
  }
  
-/* Called with cache_chain_mutex held to protect against cpu hotplug */
+/* Called with slab_mutex held to protect against cpu hotplug */
  static int __cache_shrink(struct kmem_cache *cachep)
  {
         int ret = 0, i = 0;
@@ -2680,9 +2601,9 @@ int kmem_cache_shrink(struct kmem_cache *cachep)
         BUG_ON(!cachep || in_interrupt());
  
         get_online_cpus();
-       mutex_lock(&cache_chain_mutex);
+       mutex_lock(&slab_mutex);
         ret = __cache_shrink(cachep);
-       mutex_unlock(&cache_chain_mutex);
+       mutex_unlock(&slab_mutex);
         put_online_cpus();
         return ret;
  }
@@ -2710,15 +2631,15 @@ void kmem_cache_destroy(struct kmem_cache *cachep)
  
         /* Find the cache in the chain of caches. */
         get_online_cpus();
-       mutex_lock(&cache_chain_mutex);
+       mutex_lock(&slab_mutex);
         /*
          * the chain is never empty, cache_cache is never destroyed
          */
         list_del(&cachep->list);
         if (__cache_shrink(cachep)) {
                 slab_error(cachep, "Can't free all objects");
-               list_add(&cachep->list, &cache_chain);
-               mutex_unlock(&cache_chain_mutex);
+               list_add(&cachep->list, &slab_caches);
+               mutex_unlock(&slab_mutex);
                 put_online_cpus();
                 return;
         }
@@ -2727,7 +2648,7 @@ void kmem_cache_destroy(struct kmem_cache *cachep)
                 rcu_barrier();
  
         __kmem_cache_destroy(cachep);
-       mutex_unlock(&cache_chain_mutex);
+       mutex_unlock(&slab_mutex);
         put_online_cpus();
  }
  EXPORT_SYMBOL(kmem_cache_destroy);
@@ -4040,7 +3961,7 @@ static void do_ccupdate_local(void *info)
         new->new[smp_processor_id()] = old;
  }
  
-/* Always called with the cache_chain_mutex held */
+/* Always called with the slab_mutex held */
  static int do_tune_cpucache(struct kmem_cache *cachep, int limit,
                                 int batchcount, int shared, gfp_t gfp)
  {
@@ -4084,7 +4005,7 @@ static int do_tune_cpucache(struct kmem_cache *cachep, int limit,
         return alloc_kmemlist(cachep, gfp);
  }
  
-/* Called with cache_chain_mutex held always */
+/* Called with slab_mutex held always */
  static int enable_cpucache(struct kmem_cache *cachep, gfp_t gfp)
  {
         int err;
@@ -4186,11 +4107,11 @@ static void cache_reap(struct work_struct *w)
         int node = numa_mem_id();
         struct delayed_work *work = to_delayed_work(w);
  
-       if (!mutex_trylock(&cache_chain_mutex))
+       if (!mutex_trylock(&slab_mutex))
                 /* Give up. Setup the next iteration. */
                 goto out;
  
-       list_for_each_entry(searchp, &cache_chain, list) {
+       list_for_each_entry(searchp, &slab_caches, list) {
                 check_irq_on();
  
                 /*
@@ -4228,7 +4149,7 @@ next:
                 cond_resched();
         }
         check_irq_on();
-       mutex_unlock(&cache_chain_mutex);
+       mutex_unlock(&slab_mutex);
         next_reap_node();
  out:
         /* Set up the next iteration */
@@ -4264,21 +4185,21 @@ static void *s_start(struct seq_file *m, loff_t *pos)
  {
         loff_t n = *pos;
  
-       mutex_lock(&cache_chain_mutex);
+       mutex_lock(&slab_mutex);
         if (!n)
                 print_slabinfo_header(m);
  
-       return seq_list_start(&cache_chain, *pos);
+       return seq_list_start(&slab_caches, *pos);
  }
  
  static void *s_next(struct seq_file *m, void *p, loff_t *pos)
  {
-       return seq_list_next(p, &cache_chain, pos);
+       return seq_list_next(p, &slab_caches, pos);
  }
  
  static void s_stop(struct seq_file *m, void *p)
  {
-       mutex_unlock(&cache_chain_mutex);
+       mutex_unlock(&slab_mutex);
  }
  
  static int s_show(struct seq_file *m, void *p)
@@ -4429,9 +4350,9 @@ static ssize_t slabinfo_write(struct file *file, const char __user *buffer,
                 return -EINVAL;
  
         /* Find the cache in the chain of caches. */
-       mutex_lock(&cache_chain_mutex);
+       mutex_lock(&slab_mutex);
         res = -EINVAL;
-       list_for_each_entry(cachep, &cache_chain, list) {
+       list_for_each_entry(cachep, &slab_caches, list) {
                 if (!strcmp(cachep->name, kbuf)) {
                         if (limit < 1 || batchcount < 1 ||
                                         batchcount > limit || shared < 0) {
@@ -4444,7 +4365,7 @@ static ssize_t slabinfo_write(struct file *file, const char __user *buffer,
                         break;
                 }
         }
-       mutex_unlock(&cache_chain_mutex);
+       mutex_unlock(&slab_mutex);
         if (res >= 0)
                 res = count;
         return res;
@@ -4467,8 +4388,8 @@ static const struct file_operations proc_slabinfo_operations = {
  
  static void *leaks_start(struct seq_file *m, loff_t *pos)
  {
-       mutex_lock(&cache_chain_mutex);
-       return seq_list_start(&cache_chain, *pos);
+       mutex_lock(&slab_mutex);
+       return seq_list_start(&slab_caches, *pos);
  }
  
  static inline int add_caller(unsigned long *n, unsigned long v)
@@ -4567,17 +4488,17 @@ static int leaks_show(struct seq_file *m, void *p)
         name = cachep->name;
         if (n[0] == n[1]) {
                 /* Increase the buffer size */
-               mutex_unlock(&cache_chain_mutex);
+               mutex_unlock(&slab_mutex);
                 m->private = kzalloc(n[0] * 4 * sizeof(unsigned long), GFP_KERNEL);
                 if (!m->private) {
                         /* Too bad, we are really out */
                         m->private = n;
-                       mutex_lock(&cache_chain_mutex);
+                       mutex_lock(&slab_mutex);
                         return -ENOMEM;
                 }
                 *(unsigned long *)m->private = n[0] * 2;
                 kfree(n);
-               mutex_lock(&cache_chain_mutex);
+               mutex_lock(&slab_mutex);
                 /* Now make sure this entry will be retried */
                 m->count = m->size;
                 return 0;