mm, slub: move disabling/enabling irqs to ___slab_alloc()

Currently __slab_alloc() disables irqs around the whole ___slab_alloc().  This
includes cases where this is not needed, such as when the allocation ends up in
the page allocator and has to awkwardly enable irqs back based on gfp flags.
Also the whole kmem_cache_alloc_bulk() is executed with irqs disabled even when
it hits the __slab_alloc() slow path, and long periods with disabled interrupts
are undesirable.

As a first step towards reducing irq disabled periods, move irq handling into
___slab_alloc(). Callers will instead prevent the s->cpu_slab percpu pointer
from becoming invalid via get_cpu_ptr(), thus preempt_disable(). This does not
protect against modification by an irq handler, which is still done by disabled
irq for most of ___slab_alloc(). As a small immediate benefit,
slab_out_of_memory() from ___slab_alloc() is now called with irqs enabled.

kmem_cache_alloc_bulk() disables irqs for its fastpath and then re-enables them
before calling ___slab_alloc(), which then disables them at its discretion. The
whole kmem_cache_alloc_bulk() operation also disables preemption.

When  ___slab_alloc() calls new_slab() to allocate a new page, re-enable
preemption, because new_slab() will re-enable interrupts in contexts that allow
blocking (this will be improved by later patches).

The patch itself will thus increase overhead a bit due to disabled preemption
(on configs where it matters) and increased disabling/enabling irqs in
kmem_cache_alloc_bulk(), but that will be gradually improved in the following
patches.

Note in __slab_alloc() we need to change the #ifdef CONFIG_PREEMPT guard to
CONFIG_PREEMPT_COUNT to make sure preempt disable/enable is properly paired in
all configurations. On configs without involuntary preemption and debugging
the re-read of kmem_cache_cpu pointer is still compiled out as it was before.

[ Mike Galbraith <efault@gmx.de>: Fix kmem_cache_alloc_bulk() error path ]
Signed-off-by: Vlastimil Babka <vbabka@suse.cz>
This commit is contained in:
Vlastimil Babka 2021-05-07 19:32:31 +02:00
parent 9b4bc85a69
commit e500059ba5

View File

@ -2670,7 +2670,7 @@ static inline void *get_freelist(struct kmem_cache *s, struct page *page)
* we need to allocate a new slab. This is the slowest path since it involves * we need to allocate a new slab. This is the slowest path since it involves
* a call to the page allocator and the setup of a new slab. * a call to the page allocator and the setup of a new slab.
* *
* Version of __slab_alloc to use when we know that interrupts are * Version of __slab_alloc to use when we know that preemption is
* already disabled (which is the case for bulk allocation). * already disabled (which is the case for bulk allocation).
*/ */
static void *___slab_alloc(struct kmem_cache *s, gfp_t gfpflags, int node, static void *___slab_alloc(struct kmem_cache *s, gfp_t gfpflags, int node,
@ -2678,9 +2678,11 @@ static void *___slab_alloc(struct kmem_cache *s, gfp_t gfpflags, int node,
{ {
void *freelist; void *freelist;
struct page *page; struct page *page;
unsigned long flags;
stat(s, ALLOC_SLOWPATH); stat(s, ALLOC_SLOWPATH);
local_irq_save(flags);
page = c->page; page = c->page;
if (!page) { if (!page) {
/* /*
@ -2743,6 +2745,7 @@ load_freelist:
VM_BUG_ON(!c->page->frozen); VM_BUG_ON(!c->page->frozen);
c->freelist = get_freepointer(s, freelist); c->freelist = get_freepointer(s, freelist);
c->tid = next_tid(c->tid); c->tid = next_tid(c->tid);
local_irq_restore(flags);
return freelist; return freelist;
new_slab: new_slab:
@ -2760,14 +2763,16 @@ new_slab:
goto check_new_page; goto check_new_page;
} }
put_cpu_ptr(s->cpu_slab);
page = new_slab(s, gfpflags, node); page = new_slab(s, gfpflags, node);
c = get_cpu_ptr(s->cpu_slab);
if (unlikely(!page)) { if (unlikely(!page)) {
local_irq_restore(flags);
slab_out_of_memory(s, gfpflags, node); slab_out_of_memory(s, gfpflags, node);
return NULL; return NULL;
} }
c = raw_cpu_ptr(s->cpu_slab);
if (c->page) if (c->page)
flush_slab(s, c); flush_slab(s, c);
@ -2807,31 +2812,33 @@ check_new_page:
return_single: return_single:
deactivate_slab(s, page, get_freepointer(s, freelist), c); deactivate_slab(s, page, get_freepointer(s, freelist), c);
local_irq_restore(flags);
return freelist; return freelist;
} }
/* /*
* Another one that disabled interrupt and compensates for possible * A wrapper for ___slab_alloc() for contexts where preemption is not yet
* cpu changes by refetching the per cpu area pointer. * disabled. Compensates for possible cpu changes by refetching the per cpu area
* pointer.
*/ */
static void *__slab_alloc(struct kmem_cache *s, gfp_t gfpflags, int node, static void *__slab_alloc(struct kmem_cache *s, gfp_t gfpflags, int node,
unsigned long addr, struct kmem_cache_cpu *c) unsigned long addr, struct kmem_cache_cpu *c)
{ {
void *p; void *p;
unsigned long flags;
local_irq_save(flags); #ifdef CONFIG_PREEMPT_COUNT
#ifdef CONFIG_PREEMPTION
/* /*
* We may have been preempted and rescheduled on a different * We may have been preempted and rescheduled on a different
* cpu before disabling interrupts. Need to reload cpu area * cpu before disabling preemption. Need to reload cpu area
* pointer. * pointer.
*/ */
c = this_cpu_ptr(s->cpu_slab); c = get_cpu_ptr(s->cpu_slab);
#endif #endif
p = ___slab_alloc(s, gfpflags, node, addr, c); p = ___slab_alloc(s, gfpflags, node, addr, c);
local_irq_restore(flags); #ifdef CONFIG_PREEMPT_COUNT
put_cpu_ptr(s->cpu_slab);
#endif
return p; return p;
} }
@ -3359,8 +3366,8 @@ int kmem_cache_alloc_bulk(struct kmem_cache *s, gfp_t flags, size_t size,
* IRQs, which protects against PREEMPT and interrupts * IRQs, which protects against PREEMPT and interrupts
* handlers invoking normal fastpath. * handlers invoking normal fastpath.
*/ */
c = get_cpu_ptr(s->cpu_slab);
local_irq_disable(); local_irq_disable();
c = this_cpu_ptr(s->cpu_slab);
for (i = 0; i < size; i++) { for (i = 0; i < size; i++) {
void *object = kfence_alloc(s, s->object_size, flags); void *object = kfence_alloc(s, s->object_size, flags);
@ -3381,6 +3388,8 @@ int kmem_cache_alloc_bulk(struct kmem_cache *s, gfp_t flags, size_t size,
*/ */
c->tid = next_tid(c->tid); c->tid = next_tid(c->tid);
local_irq_enable();
/* /*
* Invoking slow path likely have side-effect * Invoking slow path likely have side-effect
* of re-populating per CPU c->freelist * of re-populating per CPU c->freelist
@ -3393,6 +3402,8 @@ int kmem_cache_alloc_bulk(struct kmem_cache *s, gfp_t flags, size_t size,
c = this_cpu_ptr(s->cpu_slab); c = this_cpu_ptr(s->cpu_slab);
maybe_wipe_obj_freeptr(s, p[i]); maybe_wipe_obj_freeptr(s, p[i]);
local_irq_disable();
continue; /* goto for-loop */ continue; /* goto for-loop */
} }
c->freelist = get_freepointer(s, object); c->freelist = get_freepointer(s, object);
@ -3401,6 +3412,7 @@ int kmem_cache_alloc_bulk(struct kmem_cache *s, gfp_t flags, size_t size,
} }
c->tid = next_tid(c->tid); c->tid = next_tid(c->tid);
local_irq_enable(); local_irq_enable();
put_cpu_ptr(s->cpu_slab);
/* /*
* memcg and kmem_cache debug support and memory initialization. * memcg and kmem_cache debug support and memory initialization.
@ -3410,7 +3422,7 @@ int kmem_cache_alloc_bulk(struct kmem_cache *s, gfp_t flags, size_t size,
slab_want_init_on_alloc(flags, s)); slab_want_init_on_alloc(flags, s));
return i; return i;
error: error:
local_irq_enable(); put_cpu_ptr(s->cpu_slab);
slab_post_alloc_hook(s, objcg, flags, i, p, false); slab_post_alloc_hook(s, objcg, flags, i, p, false);
__kmem_cache_free_bulk(s, i, p); __kmem_cache_free_bulk(s, i, p);
return 0; return 0;