Subject: mm-slab-wrap-functions.patch
From: Thomas Gleixner <tglx@linutronix.de>
Date: Sat, 18 Jun 2011 19:44:43 +0200

Replace the open coded interrupt disabling and the *_irq list lock
operations in the slab allocator with a local lock (slab_lock). On
mainline the local lock maps back to local_irq_*() and spin_*_irq*(),
so behaviour is unchanged; on PREEMPT_RT it becomes a per-CPU lock and
the protected sections stay preemptible. The cross-CPU drain and
cpucache tune operations are decoupled from on_each_cpu(): on
PREEMPT_RT there is no need to run on the remote CPU, taking its
per-CPU lock is sufficient, so slab_on_each_cpu() iterates the online
CPUs instead of sending IPIs.

Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
---
 mm/slab.c |  163 +++++++++++++++++++++++++++++++++++++++++++-------------------
 1 file changed, 114 insertions(+), 49 deletions(-)

--- a/mm/slab.c
+++ b/mm/slab.c
@@ -116,6 +116,7 @@
 #include <linux/kmemcheck.h>
 #include <linux/memory.h>
 #include <linux/prefetch.h>
+#include <linux/locallock.h>
 
 #include <net/sock.h>
 
@@ -696,12 +697,49 @@ static void slab_set_debugobj_lock_class
 #endif
 
 static DEFINE_PER_CPU(struct delayed_work, slab_reap_work);
+static DEFINE_LOCAL_IRQ_LOCK(slab_lock);
+
+#ifndef CONFIG_PREEMPT_RT_BASE
+# define slab_on_each_cpu(func, cp)     on_each_cpu(func, cp, 1)
+#else
+/*
+ * Execute func() for all CPUs. On PREEMPT_RT we don't actually have
+ * to run on the remote CPUs - we only have to take their CPU-locks.
+ * (This is a rare operation, so cacheline bouncing is not an issue.)
+ */
+static void
+slab_on_each_cpu(void (*func)(void *arg, int this_cpu), void *arg)
+{
+        unsigned int i;
+
+        get_cpu_light();
+        for_each_online_cpu(i)
+                func(arg, i);
+        put_cpu_light();
+}
+
+static void lock_slab_on(unsigned int cpu)
+{
+        local_lock_irq_on(slab_lock, cpu);
+}
+
+static void unlock_slab_on(unsigned int cpu)
+{
+        local_unlock_irq_on(slab_lock, cpu);
+}
+#endif
 
 static inline struct array_cache *cpu_cache_get(struct kmem_cache *cachep)
 {
         return cachep->array[smp_processor_id()];
 }
 
+static inline struct array_cache *cpu_cache_get_on_cpu(struct kmem_cache *cachep,
+                                                       int cpu)
+{
+        return cachep->array[cpu];
+}
+
 static inline struct kmem_cache *__find_general_cachep(size_t size,
                                                        gfp_t gfpflags)
 {
@@ -1171,9 +1209,10 @@ static void reap_alien(struct kmem_cache
         if (l3->alien) {
                 struct array_cache *ac = l3->alien[node];
 
-                if (ac && ac->avail && spin_trylock_irq(&ac->lock)) {
+                if (ac && ac->avail &&
+                    local_spin_trylock_irq(slab_lock, &ac->lock)) {
                         __drain_alien_cache(cachep, ac, node);
-                        spin_unlock_irq(&ac->lock);
+                        local_spin_unlock_irq(slab_lock, &ac->lock);
                 }
         }
 }
@@ -1188,9 +1227,9 @@ static void drain_alien_cache(struct kme
         for_each_online_node(i) {
                 ac = alien[i];
                 if (ac) {
-                        spin_lock_irqsave(&ac->lock, flags);
+                        local_spin_lock_irqsave(slab_lock, &ac->lock, flags);
                         __drain_alien_cache(cachep, ac, i);
-                        spin_unlock_irqrestore(&ac->lock, flags);
+                        local_spin_unlock_irqrestore(slab_lock, &ac->lock, flags);
                 }
         }
 }
@@ -1269,11 +1308,11 @@ static int init_cache_nodelists_node(int
                         cachep->nodelists[node] = l3;
                 }
 
-                spin_lock_irq(&cachep->nodelists[node]->list_lock);
+                local_spin_lock_irq(slab_lock, &cachep->nodelists[node]->list_lock);
                 cachep->nodelists[node]->free_limit =
                         (1 + nr_cpus_node(node)) *
                         cachep->batchcount + cachep->num;
-                spin_unlock_irq(&cachep->nodelists[node]->list_lock);
+                local_spin_unlock_irq(slab_lock, &cachep->nodelists[node]->list_lock);
         }
         return 0;
 }
@@ -1298,7 +1337,7 @@ static void __cpuinit cpuup_canceled(lon
                 if (!l3)
                         goto free_array_cache;
 
-                spin_lock_irq(&l3->list_lock);
+                local_spin_lock_irq(slab_lock, &l3->list_lock);
 
                 /* Free limit for this kmem_list3 */
                 l3->free_limit -= cachep->batchcount;
@@ -1306,7 +1345,7 @@ static void __cpuinit cpuup_canceled(lon
                         free_block(cachep, nc->entry, nc->avail, node);
 
                 if (!cpumask_empty(mask)) {
-                        spin_unlock_irq(&l3->list_lock);
+                        local_spin_unlock_irq(slab_lock, &l3->list_lock);
                         goto free_array_cache;
                 }
 
@@ -1320,7 +1359,7 @@ static void __cpuinit cpuup_canceled(lon
                 alien = l3->alien;
                 l3->alien = NULL;
 
-                spin_unlock_irq(&l3->list_lock);
+                local_spin_unlock_irq(slab_lock, &l3->list_lock);
 
                 kfree(shared);
                 if (alien) {
@@ -1394,7 +1433,7 @@ static int __cpuinit cpuup_prepare(long
                 l3 = cachep->nodelists[node];
                 BUG_ON(!l3);
 
-                spin_lock_irq(&l3->list_lock);
+                local_spin_lock_irq(slab_lock, &l3->list_lock);
                 if (!l3->shared) {
                         /*
                          * We are serialised from CPU_DEAD or
@@ -1409,7 +1448,7 @@ static int __cpuinit cpuup_prepare(long
                         alien = NULL;
                 }
 #endif
-                spin_unlock_irq(&l3->list_lock);
+                local_spin_unlock_irq(slab_lock, &l3->list_lock);
                 kfree(shared);
                 free_alien_cache(alien);
                 if (cachep->flags & SLAB_DEBUG_OBJECTS)
@@ -1612,6 +1651,8 @@ void __init kmem_cache_init(void)
         if (num_possible_nodes() == 1)
                 use_alien_caches = 0;
 
+        local_irq_lock_init(slab_lock);
+
         for (i = 0; i < NUM_INIT_LISTS; i++)
                 kmem_list3_init(&initkmem_list3[i]);
@@ -2533,7 +2574,7 @@ __kmem_cache_create (struct kmem_cache *
 #if DEBUG
 static void check_irq_off(void)
 {
-        BUG_ON(!irqs_disabled());
+        BUG_ON_NONRT(!irqs_disabled());
 }
 
 static void check_irq_on(void)
@@ -2568,26 +2609,37 @@ static void drain_array(struct kmem_cach
                         struct array_cache *ac,
                         int force, int node);
 
-static void do_drain(void *arg)
+static void __do_drain(void *arg, unsigned int cpu)
 {
         struct kmem_cache *cachep = arg;
         struct array_cache *ac;
-        int node = numa_mem_id();
+        int node = cpu_to_mem(cpu);
 
-        check_irq_off();
-        ac = cpu_cache_get(cachep);
+        ac = cpu_cache_get_on_cpu(cachep, cpu);
         spin_lock(&cachep->nodelists[node]->list_lock);
         free_block(cachep, ac->entry, ac->avail, node);
         spin_unlock(&cachep->nodelists[node]->list_lock);
         ac->avail = 0;
 }
 
+#ifndef CONFIG_PREEMPT_RT_BASE
+static void do_drain(void *arg)
+{
+        __do_drain(arg, smp_processor_id());
+}
+#else
+static void do_drain(void *arg, int this_cpu)
+{
+        __do_drain(arg, this_cpu);
+}
+#endif
+
 static void drain_cpu_caches(struct kmem_cache *cachep)
 {
         struct kmem_list3 *l3;
         int node;
 
-        on_each_cpu(do_drain, cachep, 1);
+        slab_on_each_cpu(do_drain, cachep);
         check_irq_on();
         for_each_online_node(node) {
                 l3 = cachep->nodelists[node];
@@ -2618,10 +2670,10 @@ static int drain_freelist(struct kmem_ca
         nr_freed = 0;
         while (nr_freed < tofree && !list_empty(&l3->slabs_free)) {
 
-                spin_lock_irq(&l3->list_lock);
+                local_spin_lock_irq(slab_lock, &l3->list_lock);
                 p = l3->slabs_free.prev;
                 if (p == &l3->slabs_free) {
-                        spin_unlock_irq(&l3->list_lock);
+                        local_spin_unlock_irq(slab_lock, &l3->list_lock);
                         goto out;
                 }
 
@@ -2635,7 +2687,7 @@ static int drain_freelist(struct kmem_ca
                  * to the cache.
                  */
                 l3->free_objects -= cache->num;
-                spin_unlock_irq(&l3->list_lock);
+                local_spin_unlock_irq(slab_lock, &l3->list_lock);
                 slab_destroy(cache, slabp);
                 nr_freed++;
         }
@@ -2910,7 +2962,7 @@ static int cache_grow(struct kmem_cache
         offset *= cachep->colour_off;
 
         if (local_flags & __GFP_WAIT)
-                local_irq_enable();
+                local_unlock_irq(slab_lock);
 
         /*
          * The test for missing atomic flag is performed here, rather than
@@ -2940,7 +2992,7 @@ static int cache_grow(struct kmem_cache
         cache_init_objs(cachep, slabp);
 
         if (local_flags & __GFP_WAIT)
-                local_irq_disable();
+                local_lock_irq(slab_lock);
         check_irq_off();
         spin_lock(&l3->list_lock);
 
@@ -2954,7 +3006,7 @@ opps1:
         kmem_freepages(cachep, objp);
 failed:
         if (local_flags & __GFP_WAIT)
-                local_irq_disable();
+                local_lock_irq(slab_lock);
         return 0;
 }
 
@@ -3368,11 +3420,11 @@ retry:
                  * set and go into memory reserves if necessary.
                  */
                 if (local_flags & __GFP_WAIT)
-                        local_irq_enable();
+                        local_unlock_irq(slab_lock);
                 kmem_flagcheck(cache, flags);
                 obj = kmem_getpages(cache, local_flags, numa_mem_id());
                 if (local_flags & __GFP_WAIT)
-                        local_irq_disable();
+                        local_lock_irq(slab_lock);
                 if (obj) {
                         /*
                          * Insert into the appropriate per node queues
@@ -3492,7 +3544,7 @@ slab_alloc_node(struct kmem_cache *cache
         cachep = memcg_kmem_get_cache(cachep, flags);
 
         cache_alloc_debugcheck_before(cachep, flags);
-        local_irq_save(save_flags);
+        local_lock_irqsave(slab_lock, save_flags);
 
         if (nodeid == NUMA_NO_NODE)
                 nodeid = slab_node;
@@ -3517,7 +3569,7 @@ slab_alloc_node(struct kmem_cache *cache
         /* ___cache_alloc_node can fall back to other nodes */
         ptr = ____cache_alloc_node(cachep, flags, nodeid);
   out:
-        local_irq_restore(save_flags);
+        local_unlock_irqrestore(slab_lock, save_flags);
         ptr = cache_alloc_debugcheck_after(cachep, flags, ptr, caller);
         kmemleak_alloc_recursive(ptr, cachep->object_size, 1, cachep->flags,
                                  flags);
@@ -3579,9 +3631,9 @@ slab_alloc(struct kmem_cache *cachep, gf
         cachep = memcg_kmem_get_cache(cachep, flags);
 
         cache_alloc_debugcheck_before(cachep, flags);
-        local_irq_save(save_flags);
+        local_lock_irqsave(slab_lock, save_flags);
         objp = __do_cache_alloc(cachep, flags);
-        local_irq_restore(save_flags);
+        local_unlock_irqrestore(slab_lock, save_flags);
         objp = cache_alloc_debugcheck_after(cachep, flags, objp, caller);
         kmemleak_alloc_recursive(objp, cachep->object_size, 1, cachep->flags,
                                  flags);
@@ -3898,9 +3950,9 @@ void kmem_cache_free(struct kmem_cache *
         debug_check_no_locks_freed(objp, cachep->object_size);
         if (!(cachep->flags & SLAB_DEBUG_OBJECTS))
                 debug_check_no_obj_freed(objp, cachep->object_size);
-        local_irq_save(flags);
+        local_lock_irqsave(slab_lock, flags);
         __cache_free(cachep, objp, _RET_IP_);
-        local_irq_restore(flags);
+        local_unlock_irqrestore(slab_lock, flags);
 
         trace_kmem_cache_free(_RET_IP_, objp);
 }
@@ -3929,9 +3981,9 @@ void kfree(const void *objp)
         debug_check_no_locks_freed(objp, c->object_size);
 
         debug_check_no_obj_freed(objp, c->object_size);
-        local_irq_save(flags);
+        local_lock_irqsave(slab_lock, flags);
         __cache_free(c, (void *)objp, _RET_IP_);
-        local_irq_restore(flags);
+        local_unlock_irqrestore(slab_lock, flags);
 }
 EXPORT_SYMBOL(kfree);
 
@@ -3968,7 +4020,7 @@ static int alloc_kmemlist(struct kmem_ca
                 if (l3) {
                         struct array_cache *shared = l3->shared;
 
-                        spin_lock_irq(&l3->list_lock);
+                        local_spin_lock_irq(slab_lock, &l3->list_lock);
 
                         if (shared)
                                 free_block(cachep, shared->entry,
@@ -3981,7 +4033,7 @@ static int alloc_kmemlist(struct kmem_ca
                         }
                         l3->free_limit = (1 + nr_cpus_node(node)) *
                                         cachep->batchcount + cachep->num;
-                        spin_unlock_irq(&l3->list_lock);
+                        local_spin_unlock_irq(slab_lock, &l3->list_lock);
                         kfree(shared);
                         free_alien_cache(new_alien);
                         continue;
@@ -4028,17 +4080,28 @@ struct ccupdate_struct {
         struct array_cache *new[0];
 };
 
-static void do_ccupdate_local(void *info)
+static void __do_ccupdate_local(void *info, int cpu)
 {
         struct ccupdate_struct *new = info;
         struct array_cache *old;
 
-        check_irq_off();
-        old = cpu_cache_get(new->cachep);
+        old = cpu_cache_get_on_cpu(new->cachep, cpu);
 
-        new->cachep->array[smp_processor_id()] = new->new[smp_processor_id()];
-        new->new[smp_processor_id()] = old;
+        new->cachep->array[cpu] = new->new[cpu];
+        new->new[cpu] = old;
+}
+
+#ifndef CONFIG_PREEMPT_RT_BASE
+static void do_ccupdate_local(void *info)
+{
+        __do_ccupdate_local(info, smp_processor_id());
 }
+#else
+static void do_ccupdate_local(void *info, int cpu)
+{
+        __do_ccupdate_local(info, cpu);
+}
+#endif
 
 /* Always called with the slab_mutex held */
 static int __do_tune_cpucache(struct kmem_cache *cachep, int limit,
@@ -4064,7 +4127,7 @@ static int __do_tune_cpucache(struct kme
         }
         new->cachep = cachep;
 
-        on_each_cpu(do_ccupdate_local, (void *)new, 1);
+        slab_on_each_cpu(do_ccupdate_local, (void *)new);
 
         check_irq_on();
         cachep->batchcount = batchcount;
@@ -4075,9 +4138,11 @@ static int __do_tune_cpucache(struct kme
                 struct array_cache *ccold = new->new[i];
                 if (!ccold)
                         continue;
-                spin_lock_irq(&cachep->nodelists[cpu_to_mem(i)]->list_lock);
+                local_spin_lock_irq(slab_lock,
+                                    &cachep->nodelists[cpu_to_mem(i)]->list_lock);
                 free_block(cachep, ccold->entry, ccold->avail, cpu_to_mem(i));
-                spin_unlock_irq(&cachep->nodelists[cpu_to_mem(i)]->list_lock);
+                local_spin_unlock_irq(slab_lock,
+                                      &cachep->nodelists[cpu_to_mem(i)]->list_lock);
                 kfree(ccold);
         }
         kfree(new);
@@ -4192,7 +4257,7 @@ static void drain_array(struct kmem_cach
         if (ac->touched && !force) {
                 ac->touched = 0;
         } else {
-                spin_lock_irq(&l3->list_lock);
+                local_spin_lock_irq(slab_lock, &l3->list_lock);
                 if (ac->avail) {
                         tofree = force ? ac->avail : (ac->limit + 4) / 5;
                         if (tofree > ac->avail)
@@ -4202,7 +4267,7 @@ static void drain_array(struct kmem_cach
                         memmove(ac->entry, &(ac->entry[tofree]),
                                 sizeof(void *) * ac->avail);
                 }
-                spin_unlock_irq(&l3->list_lock);
+                local_spin_unlock_irq(slab_lock, &l3->list_lock);
         }
 }
 
@@ -4295,7 +4360,7 @@ void get_slabinfo(struct kmem_cache *cac
                         continue;
 
                 check_irq_on();
-                spin_lock_irq(&l3->list_lock);
+                local_spin_lock_irq(slab_lock, &l3->list_lock);
 
                 list_for_each_entry(slabp, &l3->slabs_full, list) {
                         if (slabp->inuse != cachep->num && !error)
@@ -4320,7 +4385,7 @@ void get_slabinfo(struct kmem_cache *cac
                 if (l3->shared)
                         shared_avail += l3->shared->avail;
 
-                spin_unlock_irq(&l3->list_lock);
+                local_spin_unlock_irq(slab_lock, &l3->list_lock);
         }
         num_slabs += active_slabs;
         num_objs = num_slabs * cachep->num;
@@ -4520,13 +4585,13 @@ static int leaks_show(struct seq_file *m
                         continue;
 
                 check_irq_on();
-                spin_lock_irq(&l3->list_lock);
+                local_spin_lock_irq(slab_lock, &l3->list_lock);
 
                 list_for_each_entry(slabp, &l3->slabs_full, list)
                         handle_slab(n, cachep, slabp);
                 list_for_each_entry(slabp, &l3->slabs_partial, list)
                         handle_slab(n, cachep, slabp);
-                spin_unlock_irq(&l3->list_lock);
+                local_spin_unlock_irq(slab_lock, &l3->list_lock);
         }
         name = cachep->name;
         if (n[0] == n[1]) {
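
For reference, the local lock primitives used above come from
<linux/locallock.h>, which is added elsewhere in the -rt queue. The
sketch below is a simplified model of the two flavours -- an assumption
for illustration, not the verbatim header (the real PREEMPT_RT
implementation additionally tracks lock owner and nesting):

#ifndef CONFIG_PREEMPT_RT_BASE

/* !RT: the "local lock" is plain interrupt disabling, as before. */
# define DEFINE_LOCAL_IRQ_LOCK(lvar)            int lvar
# define local_irq_lock_init(lvar)              do { } while (0)
# define local_lock_irq(lvar)                   local_irq_disable()
# define local_unlock_irq(lvar)                 local_irq_enable()
# define local_lock_irqsave(lvar, flags)        local_irq_save(flags)
# define local_unlock_irqrestore(lvar, flags)   local_irq_restore(flags)
# define local_spin_lock_irq(lvar, lock)        spin_lock_irq(lock)
# define local_spin_unlock_irq(lvar, lock)      spin_unlock_irq(lock)
# define local_spin_trylock_irq(lvar, lock)     spin_trylock_irq(lock)

#else

/*
 * RT: a per-CPU rtmutex based spinlock. Interrupts and preemption stay
 * enabled; only migration off the current CPU is prevented while the
 * lock is held.
 */
struct local_irq_lock {
        spinlock_t lock;
};

# define DEFINE_LOCAL_IRQ_LOCK(lvar)                                    \
        DEFINE_PER_CPU(struct local_irq_lock, lvar)

# define local_lock_irq(lvar)                                           \
        do {                                                            \
                migrate_disable();                                      \
                spin_lock(&this_cpu_ptr(&lvar)->lock);                  \
        } while (0)
# define local_unlock_irq(lvar)                                         \
        do {                                                            \
                spin_unlock(&this_cpu_ptr(&lvar)->lock);                \
                migrate_enable();                                       \
        } while (0)

# define local_lock_irqsave(lvar, flags)                                \
        do { (void)(flags); local_lock_irq(lvar); } while (0)
# define local_unlock_irqrestore(lvar, flags)                           \
        do { (void)(flags); local_unlock_irq(lvar); } while (0)

/* Take the local lock of a *remote* CPU: what lock_slab_on() uses. */
# define local_lock_irq_on(lvar, cpu)                                   \
        spin_lock(&per_cpu(lvar, cpu).lock)
# define local_unlock_irq_on(lvar, cpu)                                 \
        spin_unlock(&per_cpu(lvar, cpu).lock)

/* The combined ops nest the embedded spinlock inside the local lock. */
# define local_spin_lock_irq(lvar, lock)                                \
        do { local_lock_irq(lvar); spin_lock(lock); } while (0)
# define local_spin_unlock_irq(lvar, lock)                              \
        do { spin_unlock(lock); local_unlock_irq(lvar); } while (0)

#endif

The point of the conversion is visible here: on PREEMPT_RT none of the
slab paths hard-disable interrupts any more, and a remote CPU's
"IRQ-off" section can be entered by simply acquiring that CPU's lock.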
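
Likewise, get_cpu_light()/put_cpu_light() in slab_on_each_cpu() are RT
queue additions. A minimal sketch of their intent, assuming the
migrate_disable() based definition from the -rt series:

#ifndef CONFIG_PREEMPT_RT_BASE
# define get_cpu_light()        get_cpu()       /* disables preemption */
# define put_cpu_light()        put_cpu()
#else
/* RT: pin the task to its current CPU, but stay fully preemptible. */
# define get_cpu_light()        ({ migrate_disable(); smp_processor_id(); })
# define put_cpu_light()        migrate_enable()
#endif

This is why the RT variant of slab_on_each_cpu() may simply iterate the
online CPUs: the loop itself can be preempted, and serialisation against
a remote CPU's slab fast path is available through that CPU's slab_lock
via lock_slab_on()/unlock_slab_on().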