From 90db05ab34da60f2c09e69db715f64ddc4196d5a Mon Sep 17 00:00:00 2001 From: Christoph Lameter Date: Fri, 15 Feb 2008 15:22:22 -0800 Subject: [PATCH] slub: Update statistics handling for variable order slabs Change the statistics to consider that slabs of the same slabcache can have different number of objects in them since they may be of different order. Provide a new sysfs field total_objects which shows the total objects that the allocated slabs of a slabcache could hold. Update the description of the objects field in the kmem_cache structure. Its role is now to be the limit of the maximum number of objects per slab if a slab is allocated with the largest possible order. Reviewed-by: Pekka Enberg Signed-off-by: Christoph Lameter --- include/linux/slub_def.h | 3 + mm/slub.c | 83 ++++++++++++++++++++++++++++++++++------------- 2 files changed, 63 insertions(+), 23 deletions(-) Index: linux-2.6/include/linux/slub_def.h =================================================================== --- linux-2.6.orig/include/linux/slub_def.h 2008-02-28 18:39:59.283484392 -0800 +++ linux-2.6/include/linux/slub_def.h 2008-02-28 18:47:28.878128171 -0800 @@ -46,6 +46,7 @@ struct kmem_cache_node { spinlock_t list_lock; /* Protect partial list and nr_partial */ unsigned long nr_partial; atomic_long_t nr_slabs; + atomic_long_t total_objects; struct list_head partial; #ifdef CONFIG_SLUB_DEBUG struct list_head full; @@ -70,7 +71,7 @@ struct kmem_cache { struct kmem_cache_node local_node; /* Allocation and freeing of slabs */ - int objects; /* Number of objects in slab */ + int max_objects; /* Number of objects in a slab of maximum size */ gfp_t allocflags; /* gfp flags to use on each alloc */ int refcount; /* Refcount for slab cache destroy */ void (*ctor)(struct kmem_cache *, void *); Index: linux-2.6/mm/slub.c =================================================================== --- linux-2.6.orig/mm/slub.c 2008-02-28 18:41:17.155960129 -0800 +++ linux-2.6/mm/slub.c 2008-02-28 18:47:28.886128178 -0800 @@ -294,7 +294,7 @@ static inline struct kmem_cache_cpu *get /* Determine the maximum number of objects that a slab page can hold */ static inline unsigned long slab_objects(struct kmem_cache *s, struct page *page) { - return s->objects; + return s->max_objects; } /* Verify that a pointer has an address that is valid within a slab page */ @@ -1087,8 +1087,10 @@ static struct page *new_slab(struct kmem goto out; n = get_node(s, page_to_nid(page)); - if (n) + if (n) { atomic_long_inc(&n->nr_slabs); + atomic_long_add(slab_objects(s, page), &n->total_objects); + } page->slab = s; page->flags |= 1 << PG_slab; if (s->flags & (SLAB_DEBUG_FREE | SLAB_RED_ZONE | SLAB_POISON | @@ -1163,6 +1165,7 @@ static void discard_slab(struct kmem_cac struct kmem_cache_node *n = get_node(s, page_to_nid(page)); atomic_long_dec(&n->nr_slabs); + atomic_long_sub(slab_objects(s, page), &n->total_objects); reset_page_mapcount(page); __ClearPageSlab(page); free_slab(s, page); @@ -2251,9 +2254,9 @@ static int calculate_sizes(struct kmem_c /* * Determine the number of objects per slab */ - s->objects = (PAGE_SIZE << s->order) / size; + s->max_objects = (PAGE_SIZE << s->order) / size; - return !!s->objects; + return !!s->max_objects; } @@ -2673,7 +2676,7 @@ void kfree(const void *x) } EXPORT_SYMBOL(kfree); -static unsigned long count_partial(struct kmem_cache_node *n) +static unsigned long count_partial_inuse(struct kmem_cache_node *n) { unsigned long flags; unsigned long x = 0; @@ -2687,6 +2690,23 @@ static unsigned long count_partial(struc } /* + * Count the total number of objects in the partial list + */ +static unsigned long count_partial_total(struct kmem_cache *s, + struct kmem_cache_node *n) +{ + unsigned long flags; + unsigned long x = 0; + struct page *page; + + spin_lock_irqsave(&n->list_lock, flags); + list_for_each_entry(page, &n->partial, lru) + x += slab_objects(s, page); + spin_unlock_irqrestore(&n->list_lock, flags); + return x; +} + +/* * kmem_cache_shrink removes empty slabs from the partial lists and sorts * the remaining slabs by the number of items in use. The slabs with the * most items in use come first. New allocations will then fill those up @@ -2704,7 +2724,7 @@ int kmem_cache_shrink(struct kmem_cache struct page *page; struct page *t; struct list_head *slabs_by_inuse = - kmalloc(sizeof(struct list_head) * s->objects, GFP_KERNEL); + kmalloc(sizeof(struct list_head) * s->max_objects, GFP_KERNEL); unsigned long flags; if (!slabs_by_inuse) @@ -2717,7 +2737,7 @@ int kmem_cache_shrink(struct kmem_cache if (!n->nr_partial) continue; - for (i = 0; i < s->objects; i++) + for (i = 0; i < s->max_objects; i++) INIT_LIST_HEAD(slabs_by_inuse + i); spin_lock_irqsave(&n->list_lock, flags); @@ -2749,7 +2769,7 @@ int kmem_cache_shrink(struct kmem_cache * Rebuild the partial list with the slabs filled up most * first and the least used slabs at the end. */ - for (i = s->objects - 1; i >= 0; i--) + for (i = s->max_objects - 1; i >= 0; i--) list_splice(slabs_by_inuse + i, n->partial.prev); spin_unlock_irqrestore(&n->list_lock, flags); @@ -3251,7 +3271,7 @@ static long validate_slab_cache(struct k { int node; unsigned long count = 0; - unsigned long *map = kmalloc(BITS_TO_LONGS(s->objects) * + unsigned long *map = kmalloc(BITS_TO_LONGS(s->max_objects) * sizeof(unsigned long), GFP_KERNEL); if (!map) @@ -3555,13 +3575,15 @@ enum slab_stat_type { SL_FULL, SL_PARTIAL, SL_CPU, - SL_OBJECTS + SL_OBJECTS, + SL_TOTAL }; #define SO_FULL (1 << SL_FULL) #define SO_PARTIAL (1 << SL_PARTIAL) #define SO_CPU (1 << SL_CPU) #define SO_OBJECTS (1 << SL_OBJECTS) +#define SO_TOTAL (1 << SL_TOTAL) static unsigned long show_slab_objects(struct kmem_cache *s, char *buf, unsigned long flags) @@ -3589,7 +3611,9 @@ static unsigned long show_slab_objects(s continue; if (page) { if (flags & SO_CPU) { - if (flags & SO_OBJECTS) + if (flags & SO_TOTAL) + x = slab_objects(s, page); + else if (flags & SO_OBJECTS) x = page->inuse; else x = 1; @@ -3604,8 +3628,10 @@ static unsigned long show_slab_objects(s struct kmem_cache_node *n = get_node(s, node); if (flags & SO_PARTIAL) { - if (flags & SO_OBJECTS) - x = count_partial(n); + if (flags & SO_TOTAL) + x = count_partial_total(s, n); + else if (flags & SO_OBJECTS) + x = count_partial_inuse(n); else x = n->nr_partial; total += x; @@ -3616,9 +3642,12 @@ static unsigned long show_slab_objects(s int full_slabs = atomic_long_read(&n->nr_slabs) - per_cpu[node] - n->nr_partial; - - if (flags & SO_OBJECTS) - x = full_slabs * s->objects; + if (flags & SO_TOTAL) + x = atomic_long_read(&n->total_objects); + else if (flags & SO_OBJECTS) + x = atomic_long_read(&n->total_objects) - + (count_partial_total(s, n) - + count_partial_inuse(n)); else x = full_slabs; total += x; @@ -3697,7 +3726,7 @@ SLAB_ATTR_RO(object_size); static ssize_t objs_per_slab_show(struct kmem_cache *s, char *buf) { - return sprintf(buf, "%d\n", s->objects); + return sprintf(buf, "%d\n", s->max_objects); } SLAB_ATTR_RO(objs_per_slab); @@ -3748,6 +3777,12 @@ static ssize_t objects_show(struct kmem_ } SLAB_ATTR_RO(objects); +static ssize_t total_objects_show(struct kmem_cache *s, char *buf) +{ + return show_slab_objects(s, buf, SO_TOTAL|SO_FULL); +} +SLAB_ATTR_RO(total_objects); + static ssize_t sanity_checks_show(struct kmem_cache *s, char *buf) { return sprintf(buf, "%d\n", !!(s->flags & SLAB_DEBUG_FREE)); @@ -4003,6 +4038,7 @@ static struct attribute *slab_attrs[] = &objs_per_slab_attr.attr, &order_attr.attr, &objects_attr.attr, + &total_objects_attr.attr, &slabs_attr.attr, &partial_attr.attr, &cpu_slabs_attr.attr, @@ -4331,7 +4367,9 @@ static int s_show(struct seq_file *m, vo unsigned long nr_partials = 0; unsigned long nr_slabs = 0; unsigned long nr_inuse = 0; - unsigned long nr_objs; + unsigned long nr_objs = 0; + unsigned long nr_partial_inuse = 0; + unsigned long nr_partial_total = 0; struct kmem_cache *s; int node; @@ -4345,14 +4383,15 @@ static int s_show(struct seq_file *m, vo nr_partials += n->nr_partial; nr_slabs += atomic_long_read(&n->nr_slabs); - nr_inuse += count_partial(n); + nr_objs += atomic_long_read(&n->total_objects); + nr_partial_inuse += count_partial_inuse(n); + nr_partial_total += count_partial_total(s, n); } - nr_objs = nr_slabs * s->objects; - nr_inuse += (nr_slabs - nr_partials) * s->objects; + nr_inuse = nr_objs - (nr_partial_total - nr_partial_inuse); seq_printf(m, "%-17s %6lu %6lu %6u %4u %4d", s->name, nr_inuse, - nr_objs, s->size, s->objects, (1 << s->order)); + nr_objs, s->size, s->max_objects, (1 << s->order)); seq_printf(m, " : tunables %4u %4u %4u", 0, 0, 0); seq_printf(m, " : slabdata %6lu %6lu %6lu", nr_slabs, nr_slabs, 0UL);