Blame view

mm/slab_common.c 31.2 KB
039363f38   Christoph Lameter   mm, sl[aou]b: Ext...
1
2
3
4
5
6
7
8
9
10
11
12
13
  /*
   * Slab allocator functions that are independent of the allocator strategy
   *
   * (C) 2012 Christoph Lameter <cl@linux.com>
   */
  #include <linux/slab.h>
  
  #include <linux/mm.h>
  #include <linux/poison.h>
  #include <linux/interrupt.h>
  #include <linux/memory.h>
  #include <linux/compiler.h>
  #include <linux/module.h>
20cea9683   Christoph Lameter   mm, sl[aou]b: Mov...
14
15
  #include <linux/cpu.h>
  #include <linux/uaccess.h>
b7454ad3c   Glauber Costa   mm/sl[au]b: Move ...
16
17
  #include <linux/seq_file.h>
  #include <linux/proc_fs.h>
039363f38   Christoph Lameter   mm, sl[aou]b: Ext...
18
19
20
  #include <asm/cacheflush.h>
  #include <asm/tlbflush.h>
  #include <asm/page.h>
2633d7a02   Glauber Costa   slab/slub: consid...
21
  #include <linux/memcontrol.h>
928cec9cd   Andrey Ryabinin   mm: move slab rel...
22
23
  
  #define CREATE_TRACE_POINTS
f1b6eb6e6   Christoph Lameter   mm/sl[aou]b: Move...
24
  #include <trace/events/kmem.h>
039363f38   Christoph Lameter   mm, sl[aou]b: Ext...
25

97d066091   Christoph Lameter   mm, sl[aou]b: Com...
26
27
28
  #include "slab.h"
  
  enum slab_state slab_state;
18004c5d4   Christoph Lameter   mm, sl[aou]b: Use...
29
30
  LIST_HEAD(slab_caches);
  DEFINE_MUTEX(slab_mutex);
9b030cb86   Christoph Lameter   mm/sl[aou]b: Use ...
31
  struct kmem_cache *kmem_cache;
97d066091   Christoph Lameter   mm, sl[aou]b: Com...
32

07f361b2b   Joonsoo Kim   mm/slab_common: m...
33
  /*
423c929cb   Joonsoo Kim   mm/slab_common: c...
34
35
36
37
   * Set of flags that will prevent slab merging
   */
  #define SLAB_NEVER_MERGE (SLAB_RED_ZONE | SLAB_POISON | SLAB_STORE_USER | \
  		SLAB_TRACE | SLAB_DESTROY_BY_RCU | SLAB_NOLEAKTRACE | \
7ed2f9e66   Alexander Potapenko   mm, kasan: SLAB s...
38
  		SLAB_FAILSLAB | SLAB_KASAN)
423c929cb   Joonsoo Kim   mm/slab_common: c...
39

230e9fc28   Vladimir Davydov   slab: add SLAB_AC...
40
41
  #define SLAB_MERGE_SAME (SLAB_RECLAIM_ACCOUNT | SLAB_CACHE_DMA | \
  			 SLAB_NOTRACK | SLAB_ACCOUNT)
423c929cb   Joonsoo Kim   mm/slab_common: c...
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
  
  /*
   * Merge control. If this is set then no merging of slab caches will occur.
   * (Could be removed. This was introduced to pacify the merge skeptics.)
   */
  static int slab_nomerge;
  
  /*
   * Handler registered below for the "slab_nomerge" (and, under CONFIG_SLUB,
   * "slub_nomerge") boot options.  @str is not looked at: the presence of the
   * option alone switches cache merging off.  Always returns 1.
   */
  static int __init setup_slab_nomerge(char *str)
  {
  	return (slab_nomerge = 1);
  }
  
  #ifdef CONFIG_SLUB
  __setup_param("slub_nomerge", slub_nomerge, setup_slab_nomerge, 0);
  #endif
  
  __setup("slab_nomerge", setup_slab_nomerge);
  
  /*
07f361b2b   Joonsoo Kim   mm/slab_common: m...
62
63
64
65
66
67
68
   * Determine the size of a slab object
   */
  unsigned int kmem_cache_size(struct kmem_cache *s)
  {
  	/* The value reported is the cache's object_size field. */
  	unsigned int object_bytes = s->object_size;

  	return object_bytes;
  }
  EXPORT_SYMBOL(kmem_cache_size);
77be4b136   Shuah Khan   mm/slab: restruct...
69
  #ifdef CONFIG_DEBUG_VM
794b1248b   Vladimir Davydov   memcg, slab: sepa...
70
  /*
   * kmem_cache_sanity_check - validate the arguments of a cache creation request
   * @name: name requested for the new cache
   * @size: object size requested for the new cache
   *
   * Rejects a NULL @name, a call made from interrupt context and a @size
   * outside [sizeof(void *), KMALLOC_MAX_SIZE].  For an accepted request it
   * then walks slab_caches, reporting every cache whose name string can no
   * longer be read, and warns if @name contains a space.
   *
   * Returns 0 if the request is acceptable, -EINVAL otherwise.
   */
  static int kmem_cache_sanity_check(const char *name, size_t size)
  {
  	struct kmem_cache *s = NULL;

  	if (!name || in_interrupt() || size < sizeof(void *) ||
  		size > KMALLOC_MAX_SIZE) {
  		pr_err("kmem_cache_create(%s) integrity check failed\n", name);
  		return -EINVAL;
  	}

  	list_for_each_entry(s, &slab_caches, list) {
  		char tmp;
  		int res;

  		/*
  		 * This happens when the module gets unloaded and doesn't
  		 * destroy its slab cache and no-one else reuses the vmalloc
  		 * area of the module.  Print a warning.
  		 */
  		res = probe_kernel_address(s->name, tmp);
  		if (res) {
  			pr_err("Slab cache with size %d has lost its name\n",
  			       s->object_size);
  			continue;
  		}
  	}

  	WARN_ON(strchr(name, ' '));	/* It confuses parsers */
  	return 0;
  }
  #else
794b1248b   Vladimir Davydov   memcg, slab: sepa...
102
  /* !CONFIG_DEBUG_VM variant: performs no checks and accepts every request. */
  static inline int kmem_cache_sanity_check(const char *name, size_t size)
  {
  	return 0;
  }
20cea9683   Christoph Lameter   mm, sl[aou]b: Mov...
106
  #endif
484748f0b   Christoph Lameter   slab: infrastruct...
107
108
109
  /*
   * __kmem_cache_free_bulk - free an array of objects, one call per object
   * @s: cache the objects are returned to, or NULL to release each with kfree()
   * @nr: number of entries in @p
   * @p: array of object pointers
   */
  void __kmem_cache_free_bulk(struct kmem_cache *s, size_t nr, void **p)
  {
  	size_t i;

  	for (i = 0; i < nr; i++) {
  		if (s)
  			kmem_cache_free(s, p[i]);
  		else
  			kfree(p[i]);
  	}
  }
865762a81   Jesper Dangaard Brouer   slab/slub: adjust...
117
  /*
   * __kmem_cache_alloc_bulk - fill an array with objects, one call per object
   * @s: cache to allocate from
   * @flags: gfp flags passed to every kmem_cache_alloc() call
   * @nr: number of objects wanted
   * @p: array that receives the object pointers
   *
   * All or nothing: when an allocation fails, the objects obtained so far are
   * handed back through __kmem_cache_free_bulk() and 0 is returned.
   *
   * Returns @nr on success, 0 on failure.
   */
  int __kmem_cache_alloc_bulk(struct kmem_cache *s, gfp_t flags, size_t nr,
  								void **p)
  {
  	size_t i;

  	for (i = 0; i < nr; i++) {
  		void *x = p[i] = kmem_cache_alloc(s, flags);
  		if (!x) {
  			/* Only entries [0, i) hold valid objects. */
  			__kmem_cache_free_bulk(s, i, p);
  			return 0;
  		}
  	}
  	return i;
  }
127424c86   Johannes Weiner   mm: memcontrol: m...
131
  #if defined(CONFIG_MEMCG) && !defined(CONFIG_SLOB)
f7ce3190c   Vladimir Davydov   slab: embed memcg...
132
  void slab_init_memcg_params(struct kmem_cache *s)
33a690c45   Vladimir Davydov   memcg: move memcg...
133
  {
f7ce3190c   Vladimir Davydov   slab: embed memcg...
134
  	s->memcg_params.is_root_cache = true;
426589f57   Vladimir Davydov   slab: link memcg ...
135
  	INIT_LIST_HEAD(&s->memcg_params.list);
f7ce3190c   Vladimir Davydov   slab: embed memcg...
136
137
138
139
140
141
142
  	RCU_INIT_POINTER(s->memcg_params.memcg_caches, NULL);
  }
  
  static int init_memcg_params(struct kmem_cache *s,
  		struct mem_cgroup *memcg, struct kmem_cache *root_cache)
  {
  	struct memcg_cache_array *arr;
33a690c45   Vladimir Davydov   memcg: move memcg...
143

f7ce3190c   Vladimir Davydov   slab: embed memcg...
144
145
146
147
  	if (memcg) {
  		s->memcg_params.is_root_cache = false;
  		s->memcg_params.memcg = memcg;
  		s->memcg_params.root_cache = root_cache;
33a690c45   Vladimir Davydov   memcg: move memcg...
148
  		return 0;
f7ce3190c   Vladimir Davydov   slab: embed memcg...
149
  	}
33a690c45   Vladimir Davydov   memcg: move memcg...
150

f7ce3190c   Vladimir Davydov   slab: embed memcg...
151
  	slab_init_memcg_params(s);
33a690c45   Vladimir Davydov   memcg: move memcg...
152

f7ce3190c   Vladimir Davydov   slab: embed memcg...
153
154
  	if (!memcg_nr_cache_ids)
  		return 0;
33a690c45   Vladimir Davydov   memcg: move memcg...
155

f7ce3190c   Vladimir Davydov   slab: embed memcg...
156
157
158
159
160
  	arr = kzalloc(sizeof(struct memcg_cache_array) +
  		      memcg_nr_cache_ids * sizeof(void *),
  		      GFP_KERNEL);
  	if (!arr)
  		return -ENOMEM;
33a690c45   Vladimir Davydov   memcg: move memcg...
161

f7ce3190c   Vladimir Davydov   slab: embed memcg...
162
  	RCU_INIT_POINTER(s->memcg_params.memcg_caches, arr);
33a690c45   Vladimir Davydov   memcg: move memcg...
163
164
  	return 0;
  }
f7ce3190c   Vladimir Davydov   slab: embed memcg...
165
  static void destroy_memcg_params(struct kmem_cache *s)
33a690c45   Vladimir Davydov   memcg: move memcg...
166
  {
f7ce3190c   Vladimir Davydov   slab: embed memcg...
167
168
  	if (is_root_cache(s))
  		kfree(rcu_access_pointer(s->memcg_params.memcg_caches));
33a690c45   Vladimir Davydov   memcg: move memcg...
169
  }
f7ce3190c   Vladimir Davydov   slab: embed memcg...
170
  static int update_memcg_params(struct kmem_cache *s, int new_array_size)
6f817f4cd   Vladimir Davydov   memcg: move memcg...
171
  {
f7ce3190c   Vladimir Davydov   slab: embed memcg...
172
  	struct memcg_cache_array *old, *new;
6f817f4cd   Vladimir Davydov   memcg: move memcg...
173

f7ce3190c   Vladimir Davydov   slab: embed memcg...
174
175
  	if (!is_root_cache(s))
  		return 0;
6f817f4cd   Vladimir Davydov   memcg: move memcg...
176

f7ce3190c   Vladimir Davydov   slab: embed memcg...
177
178
179
  	new = kzalloc(sizeof(struct memcg_cache_array) +
  		      new_array_size * sizeof(void *), GFP_KERNEL);
  	if (!new)
6f817f4cd   Vladimir Davydov   memcg: move memcg...
180
  		return -ENOMEM;
f7ce3190c   Vladimir Davydov   slab: embed memcg...
181
182
183
184
185
  	old = rcu_dereference_protected(s->memcg_params.memcg_caches,
  					lockdep_is_held(&slab_mutex));
  	if (old)
  		memcpy(new->entries, old->entries,
  		       memcg_nr_cache_ids * sizeof(void *));
6f817f4cd   Vladimir Davydov   memcg: move memcg...
186

f7ce3190c   Vladimir Davydov   slab: embed memcg...
187
188
189
  	rcu_assign_pointer(s->memcg_params.memcg_caches, new);
  	if (old)
  		kfree_rcu(old, rcu);
6f817f4cd   Vladimir Davydov   memcg: move memcg...
190
191
  	return 0;
  }
55007d849   Glauber Costa   memcg: allocate m...
192
193
194
195
  int memcg_update_all_caches(int num_memcgs)
  {
  	struct kmem_cache *s;
  	int ret = 0;
55007d849   Glauber Costa   memcg: allocate m...
196

05257a1a3   Vladimir Davydov   memcg: add rwsem ...
197
  	mutex_lock(&slab_mutex);
55007d849   Glauber Costa   memcg: allocate m...
198
  	list_for_each_entry(s, &slab_caches, list) {
f7ce3190c   Vladimir Davydov   slab: embed memcg...
199
  		ret = update_memcg_params(s, num_memcgs);
55007d849   Glauber Costa   memcg: allocate m...
200
  		/*
55007d849   Glauber Costa   memcg: allocate m...
201
202
203
204
  		 * Instead of freeing the memory, we'll just leave the caches
  		 * up to this point in an updated state.
  		 */
  		if (ret)
05257a1a3   Vladimir Davydov   memcg: add rwsem ...
205
  			break;
55007d849   Glauber Costa   memcg: allocate m...
206
  	}
55007d849   Glauber Costa   memcg: allocate m...
207
208
209
  	mutex_unlock(&slab_mutex);
  	return ret;
  }
33a690c45   Vladimir Davydov   memcg: move memcg...
210
  #else
f7ce3190c   Vladimir Davydov   slab: embed memcg...
211
212
  /* Variant for !CONFIG_MEMCG or CONFIG_SLOB: nothing to set up, always 0. */
  static inline int init_memcg_params(struct kmem_cache *s,
  		struct mem_cgroup *memcg, struct kmem_cache *root_cache)
  {
  	return 0;
  }
f7ce3190c   Vladimir Davydov   slab: embed memcg...
216
  /* Variant for !CONFIG_MEMCG or CONFIG_SLOB: nothing to release. */
  static inline void destroy_memcg_params(struct kmem_cache *s)
  {
  }
127424c86   Johannes Weiner   mm: memcontrol: m...
219
  #endif /* CONFIG_MEMCG && !CONFIG_SLOB */
55007d849   Glauber Costa   memcg: allocate m...
220

77be4b136   Shuah Khan   mm/slab: restruct...
221
  /*
423c929cb   Joonsoo Kim   mm/slab_common: c...
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
   * Find a mergeable slab cache
   */
  int slab_unmergeable(struct kmem_cache *s)
  {
  	int unmergeable = 0;

  	if (slab_nomerge || (s->flags & SLAB_NEVER_MERGE)) {
  		/* Merging is off globally, or a flag of @s forbids it. */
  		unmergeable = 1;
  	} else if (!is_root_cache(s)) {
  		/* Only root caches are merge candidates. */
  		unmergeable = 1;
  	} else if (s->ctor) {
  		/* Caches with a constructor are never shared. */
  		unmergeable = 1;
  	} else if (s->refcount < 0) {
  		/*
  		 * A negative refcount marks a cache that was made
  		 * unmergeable during bootstrap.
  		 */
  		unmergeable = 1;
  	}

  	return unmergeable;
  }
  
  /*
   * find_mergeable - look for an existing cache a new request can share
   * @size: requested object size
   * @align: requested alignment
   * @flags: requested SLAB flags
   * @name: requested cache name (only passed on to kmem_cache_flags())
   * @ctor: requested constructor; a non-NULL value rules out merging
   *
   * The request is normalised the same way a new cache would be (size
   * rounded to pointer size and to the computed alignment, flags run through
   * kmem_cache_flags()) and slab_caches is then scanned from the tail.
   *
   * Returns the first compatible cache, or NULL if there is none or merging
   * is not permitted for this request.
   */
  struct kmem_cache *find_mergeable(size_t size, size_t align,
  		unsigned long flags, const char *name, void (*ctor)(void *))
  {
  	struct kmem_cache *s;

  	if (slab_nomerge || (flags & SLAB_NEVER_MERGE))
  		return NULL;

  	if (ctor)
  		return NULL;

  	size = ALIGN(size, sizeof(void *));
  	align = calculate_alignment(flags, align, size);
  	size = ALIGN(size, align);
  	flags = kmem_cache_flags(size, flags, name, NULL);

  	list_for_each_entry_reverse(s, &slab_caches, list) {
  		if (slab_unmergeable(s))
  			continue;

  		/* The existing objects must be large enough. */
  		if (size > s->size)
  			continue;

  		if ((flags & SLAB_MERGE_SAME) != (s->flags & SLAB_MERGE_SAME))
  			continue;
  		/*
  		 * Check if alignment is compatible.
  		 * Courtesy of Adrian Drzewiecki
  		 */
  		if ((s->size & ~(align - 1)) != s->size)
  			continue;

  		/* Do not waste a pointer's worth of space or more per object. */
  		if (s->size - size >= sizeof(void *))
  			continue;

  		if (IS_ENABLED(CONFIG_SLAB) && align &&
  			(align > s->align || s->align % align))
  			continue;

  		return s;
  	}
  	return NULL;
  }
  
  /*
459068554   Christoph Lameter   mm/sl[aou]b: Comm...
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
   * Figure out what the alignment of the objects will be given a set of
   * flags, a user specified alignment and the size of the objects.
   */
  unsigned long calculate_alignment(unsigned long flags,
  		unsigned long align, unsigned long size)
  {
  	/*
  	 * If the user wants hardware cache aligned objects then follow that
  	 * suggestion if the object is sufficiently large.
  	 *
  	 * The hardware cache alignment cannot override the specified
  	 * alignment though. If that is greater then use it.
  	 */
  	if (flags & SLAB_HWCACHE_ALIGN) {
  		unsigned long ralign = cache_line_size();

  		/*
  		 * Halve the cache line alignment for as long as the object
  		 * fits into half of it.  The ralign > 1 bound changes nothing
  		 * for size >= 1; for size == 0 it stops a loop that would
  		 * otherwise never terminate (0 <= 0 stays true forever).
  		 */
  		while (ralign > 1 && size <= ralign / 2)
  			ralign /= 2;
  		align = max(align, ralign);
  	}

  	/* Never go below the architecture's minimum slab alignment. */
  	if (align < ARCH_SLAB_MINALIGN)
  		align = ARCH_SLAB_MINALIGN;

  	/* The result is always a multiple of the pointer size. */
  	return ALIGN(align, sizeof(void *));
  }
c9a77a792   Vladimir Davydov   mm/slab_common.c:...
311
312
313
314
  /*
   * create_cache - allocate, set up and register a kmem_cache
   * @name: name of the cache; the pointer is stored, the string is not copied
   * @object_size: size of the objects as seen by users of the cache
   * @size: value stored in the cache's size field
   * @align: object alignment
   * @flags: SLAB flags handed to __kmem_cache_create()
   * @ctor: object constructor, may be NULL
   * @memcg: owning memory cgroup, NULL for a root cache
   * @root_cache: parent cache when @memcg is set
   *
   * On success the cache has a refcount of 1 and is linked into slab_caches.
   * On failure the partially built cache is freed again; @name is not freed
   * here and stays the caller's responsibility.
   *
   * Returns the new cache or an ERR_PTR() encoded errno.
   */
  static struct kmem_cache *create_cache(const char *name,
  		size_t object_size, size_t size, size_t align,
  		unsigned long flags, void (*ctor)(void *),
  		struct mem_cgroup *memcg, struct kmem_cache *root_cache)
  {
  	struct kmem_cache *s;
  	int err;

  	err = -ENOMEM;
  	s = kmem_cache_zalloc(kmem_cache, GFP_KERNEL);
  	if (!s)
  		goto out;

  	s->name = name;
  	s->object_size = object_size;
  	s->size = size;
  	s->align = align;
  	s->ctor = ctor;

  	err = init_memcg_params(s, memcg, root_cache);
  	if (err)
  		goto out_free_cache;

  	err = __kmem_cache_create(s, flags);
  	if (err)
  		goto out_free_cache;

  	s->refcount = 1;
  	list_add(&s->list, &slab_caches);
  out:
  	if (err)
  		return ERR_PTR(err);
  	return s;

  out_free_cache:
  	destroy_memcg_params(s);
  	kmem_cache_free(kmem_cache, s);
  	goto out;
  }
459068554   Christoph Lameter   mm/sl[aou]b: Comm...
349
350
  
  /*
77be4b136   Shuah Khan   mm/slab: restruct...
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
   * kmem_cache_create - Create a cache.
   * @name: A string which is used in /proc/slabinfo to identify this cache.
   * @size: The size of objects to be created in this cache.
   * @align: The required alignment for the objects.
   * @flags: SLAB flags
   * @ctor: A constructor for the objects.
   *
   * Returns a ptr to the cache on success, NULL on failure.
   * Cannot be called within an interrupt, but can be interrupted.
   * The @ctor is run when new pages are allocated by the cache.
   *
   * The flags are
   *
   * %SLAB_POISON - Poison the slab with a known test pattern (a5a5a5a5)
   * to catch references to uninitialised memory.
   *
   * %SLAB_RED_ZONE - Insert `Red' zones around the allocated memory to check
   * for buffer overruns.
   *
   * %SLAB_HWCACHE_ALIGN - Align the objects in this cache to a hardware
   * cacheline.  This can be beneficial if you're counting cycles as closely
   * as davem.
   */
2633d7a02   Glauber Costa   slab/slub: consid...
374
  struct kmem_cache *
794b1248b   Vladimir Davydov   memcg, slab: sepa...
375
376
  kmem_cache_create(const char *name, size_t size, size_t align,
  		  unsigned long flags, void (*ctor)(void *))
77be4b136   Shuah Khan   mm/slab: restruct...
377
  {
40911a798   Alexandru Moise   mm/slab_common.c:...
378
  	struct kmem_cache *s = NULL;
3dec16ea3   Andrzej Hajda   mm/slab: convert ...
379
  	const char *cache_name;
3965fc365   Vladimir Davydov   slab: clean up km...
380
  	int err;
039363f38   Christoph Lameter   mm, sl[aou]b: Ext...
381

77be4b136   Shuah Khan   mm/slab: restruct...
382
  	get_online_cpus();
03afc0e25   Vladimir Davydov   slab: get_online_...
383
  	get_online_mems();
05257a1a3   Vladimir Davydov   memcg: add rwsem ...
384
  	memcg_get_cache_ids();
03afc0e25   Vladimir Davydov   slab: get_online_...
385

77be4b136   Shuah Khan   mm/slab: restruct...
386
  	mutex_lock(&slab_mutex);
686d550d2   Christoph Lameter   mm/slab_common: I...
387

794b1248b   Vladimir Davydov   memcg, slab: sepa...
388
  	err = kmem_cache_sanity_check(name, size);
3aa24f519   Andrew Morton   mm/slab_common.c:...
389
  	if (err) {
3965fc365   Vladimir Davydov   slab: clean up km...
390
  		goto out_unlock;
3aa24f519   Andrew Morton   mm/slab_common.c:...
391
  	}
686d550d2   Christoph Lameter   mm/slab_common: I...
392

d8843922f   Glauber Costa   slab: Ignore inte...
393
394
395
396
397
398
399
  	/*
  	 * Some allocators will constraint the set of valid flags to a subset
  	 * of all flags. We expect them to define CACHE_CREATE_MASK in this
  	 * case, and we'll just provide them with a sanitized version of the
  	 * passed flags.
  	 */
  	flags &= CACHE_CREATE_MASK;
686d550d2   Christoph Lameter   mm/slab_common: I...
400

794b1248b   Vladimir Davydov   memcg, slab: sepa...
401
402
  	s = __kmem_cache_alias(name, size, align, flags, ctor);
  	if (s)
3965fc365   Vladimir Davydov   slab: clean up km...
403
  		goto out_unlock;
2633d7a02   Glauber Costa   slab/slub: consid...
404

3dec16ea3   Andrzej Hajda   mm/slab: convert ...
405
  	cache_name = kstrdup_const(name, GFP_KERNEL);
794b1248b   Vladimir Davydov   memcg, slab: sepa...
406
407
408
409
  	if (!cache_name) {
  		err = -ENOMEM;
  		goto out_unlock;
  	}
7c9adf5a5   Christoph Lameter   mm/sl[aou]b: Move...
410

c9a77a792   Vladimir Davydov   mm/slab_common.c:...
411
412
413
  	s = create_cache(cache_name, size, size,
  			 calculate_alignment(flags, align, size),
  			 flags, ctor, NULL, NULL);
794b1248b   Vladimir Davydov   memcg, slab: sepa...
414
415
  	if (IS_ERR(s)) {
  		err = PTR_ERR(s);
3dec16ea3   Andrzej Hajda   mm/slab: convert ...
416
  		kfree_const(cache_name);
794b1248b   Vladimir Davydov   memcg, slab: sepa...
417
  	}
3965fc365   Vladimir Davydov   slab: clean up km...
418
419
  
  out_unlock:
20cea9683   Christoph Lameter   mm, sl[aou]b: Mov...
420
  	mutex_unlock(&slab_mutex);
03afc0e25   Vladimir Davydov   slab: get_online_...
421

05257a1a3   Vladimir Davydov   memcg: add rwsem ...
422
  	memcg_put_cache_ids();
03afc0e25   Vladimir Davydov   slab: get_online_...
423
  	put_online_mems();
20cea9683   Christoph Lameter   mm, sl[aou]b: Mov...
424
  	put_online_cpus();
ba3253c78   Dave Jones   slab: fix wrong r...
425
  	if (err) {
686d550d2   Christoph Lameter   mm/slab_common: I...
426
427
428
429
430
  		if (flags & SLAB_PANIC)
  			panic("kmem_cache_create: Failed to create slab '%s'. Error %d
  ",
  				name, err);
  		else {
1170532bb   Joe Perches   mm: convert print...
431
432
  			pr_warn("kmem_cache_create(%s) failed with error %d
  ",
686d550d2   Christoph Lameter   mm/slab_common: I...
433
434
435
  				name, err);
  			dump_stack();
  		}
686d550d2   Christoph Lameter   mm/slab_common: I...
436
437
  		return NULL;
  	}
039363f38   Christoph Lameter   mm, sl[aou]b: Ext...
438
439
  	return s;
  }
794b1248b   Vladimir Davydov   memcg, slab: sepa...
440
  EXPORT_SYMBOL(kmem_cache_create);
2633d7a02   Glauber Costa   slab/slub: consid...
441

c9a77a792   Vladimir Davydov   mm/slab_common.c:...
442
  /*
   * shutdown_cache - shut a cache down and queue it for release
   * @s: cache to shut down
   * @release: list the cache is moved to on success
   * @need_rcu_barrier: set to true when @s has SLAB_DESTROY_BY_RCU; never
   *                    cleared here
   *
   * Returns 0 on success, -EBUSY if __kmem_cache_shutdown() fails, in which
   * case @s stays on its current list.
   */
  static int shutdown_cache(struct kmem_cache *s,
  		struct list_head *release, bool *need_rcu_barrier)
  {
  	if (__kmem_cache_shutdown(s) != 0)
  		return -EBUSY;

  	if (s->flags & SLAB_DESTROY_BY_RCU)
  		*need_rcu_barrier = true;

  	list_move(&s->list, release);
  	return 0;
  }
c9a77a792   Vladimir Davydov   mm/slab_common.c:...
453
  /*
   * release_caches - release every cache collected on a release list
   * @release: list of caches that were shut down
   * @need_rcu_barrier: when true, rcu_barrier() is called before any cache
   *                    is released
   *
   * With SLAB_SUPPORTS_SYSFS defined each cache goes through
   * sysfs_slab_remove(); otherwise slab_kmem_cache_release() is called on it
   * directly.
   */
  static void release_caches(struct list_head *release, bool need_rcu_barrier)
  {
  	struct kmem_cache *s, *s2;

  	if (need_rcu_barrier)
  		rcu_barrier();

  	list_for_each_entry_safe(s, s2, release, list) {
  #ifdef SLAB_SUPPORTS_SYSFS
  		sysfs_slab_remove(s);
  #else
  		slab_kmem_cache_release(s);
  #endif
  	}
  }
127424c86   Johannes Weiner   mm: memcontrol: m...
468
  #if defined(CONFIG_MEMCG) && !defined(CONFIG_SLOB)
794b1248b   Vladimir Davydov   memcg, slab: sepa...
469
  /*
776ed0f03   Vladimir Davydov   memcg: cleanup km...
470
   * memcg_create_kmem_cache - Create a cache for a memory cgroup.
794b1248b   Vladimir Davydov   memcg, slab: sepa...
471
472
473
474
475
476
477
   * @memcg: The memory cgroup the new cache is for.
   * @root_cache: The parent of the new cache.
   *
   * This function attempts to create a kmem cache that will serve allocation
   * requests going from @memcg to @root_cache. The new cache inherits properties
   * from its parent.
   */
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
478
479
  void memcg_create_kmem_cache(struct mem_cgroup *memcg,
  			     struct kmem_cache *root_cache)
2633d7a02   Glauber Costa   slab/slub: consid...
480
  {
3e0350a36   Vladimir Davydov   memcg: zap memcg_...
481
  	static char memcg_name_buf[NAME_MAX + 1]; /* protected by slab_mutex */
33398cf2f   Michal Hocko   memcg: export str...
482
  	struct cgroup_subsys_state *css = &memcg->css;
f7ce3190c   Vladimir Davydov   slab: embed memcg...
483
  	struct memcg_cache_array *arr;
bd6731458   Vladimir Davydov   memcg, slab: simp...
484
  	struct kmem_cache *s = NULL;
794b1248b   Vladimir Davydov   memcg, slab: sepa...
485
  	char *cache_name;
f7ce3190c   Vladimir Davydov   slab: embed memcg...
486
  	int idx;
794b1248b   Vladimir Davydov   memcg, slab: sepa...
487
488
  
  	get_online_cpus();
03afc0e25   Vladimir Davydov   slab: get_online_...
489
  	get_online_mems();
794b1248b   Vladimir Davydov   memcg, slab: sepa...
490
  	mutex_lock(&slab_mutex);
2a4db7eb9   Vladimir Davydov   memcg: free memcg...
491
  	/*
567e9ab2e   Johannes Weiner   mm: memcontrol: g...
492
  	 * The memory cgroup could have been offlined while the cache
2a4db7eb9   Vladimir Davydov   memcg: free memcg...
493
494
  	 * creation work was pending.
  	 */
b6ecd2dea   Vladimir Davydov   mm: memcontrol: z...
495
  	if (memcg->kmem_state != KMEM_ONLINE)
2a4db7eb9   Vladimir Davydov   memcg: free memcg...
496
  		goto out_unlock;
f7ce3190c   Vladimir Davydov   slab: embed memcg...
497
498
499
  	idx = memcg_cache_id(memcg);
  	arr = rcu_dereference_protected(root_cache->memcg_params.memcg_caches,
  					lockdep_is_held(&slab_mutex));
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
500
501
502
503
504
  	/*
  	 * Since per-memcg caches are created asynchronously on first
  	 * allocation (see memcg_kmem_get_cache()), several threads can try to
  	 * create the same cache, but only one of them may succeed.
  	 */
f7ce3190c   Vladimir Davydov   slab: embed memcg...
505
  	if (arr->entries[idx])
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
506
  		goto out_unlock;
f1008365b   Vladimir Davydov   slab: use css id ...
507
  	cgroup_name(css->cgroup, memcg_name_buf, sizeof(memcg_name_buf));
73f576c04   Johannes Weiner   mm: memcontrol: f...
508
509
  	cache_name = kasprintf(GFP_KERNEL, "%s(%llu:%s)", root_cache->name,
  			       css->serial_nr, memcg_name_buf);
794b1248b   Vladimir Davydov   memcg, slab: sepa...
510
511
  	if (!cache_name)
  		goto out_unlock;
c9a77a792   Vladimir Davydov   mm/slab_common.c:...
512
513
  	s = create_cache(cache_name, root_cache->object_size,
  			 root_cache->size, root_cache->align,
f773e36de   Greg Thelen   memcg: prevent me...
514
515
  			 root_cache->flags & CACHE_CREATE_MASK,
  			 root_cache->ctor, memcg, root_cache);
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
516
517
518
519
520
  	/*
  	 * If we could not create a memcg cache, do not complain, because
  	 * that's not critical at all as we can always proceed with the root
  	 * cache.
  	 */
bd6731458   Vladimir Davydov   memcg, slab: simp...
521
  	if (IS_ERR(s)) {
794b1248b   Vladimir Davydov   memcg, slab: sepa...
522
  		kfree(cache_name);
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
523
  		goto out_unlock;
bd6731458   Vladimir Davydov   memcg, slab: simp...
524
  	}
794b1248b   Vladimir Davydov   memcg, slab: sepa...
525

426589f57   Vladimir Davydov   slab: link memcg ...
526
  	list_add(&s->memcg_params.list, &root_cache->memcg_params.list);
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
527
528
529
530
531
532
  	/*
  	 * Since readers won't lock (see cache_from_memcg_idx()), we need a
  	 * barrier here to ensure nobody will see the kmem_cache partially
  	 * initialized.
  	 */
  	smp_wmb();
f7ce3190c   Vladimir Davydov   slab: embed memcg...
533
  	arr->entries[idx] = s;
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
534

794b1248b   Vladimir Davydov   memcg, slab: sepa...
535
536
  out_unlock:
  	mutex_unlock(&slab_mutex);
03afc0e25   Vladimir Davydov   slab: get_online_...
537
538
  
  	put_online_mems();
794b1248b   Vladimir Davydov   memcg, slab: sepa...
539
  	put_online_cpus();
2633d7a02   Glauber Costa   slab/slub: consid...
540
  }
b8529907b   Vladimir Davydov   memcg, slab: do n...
541

2a4db7eb9   Vladimir Davydov   memcg: free memcg...
542
543
544
545
  void memcg_deactivate_kmem_caches(struct mem_cgroup *memcg)
  {
  	int idx;
  	struct memcg_cache_array *arr;
d6e0b7fa1   Vladimir Davydov   slub: make dead c...
546
  	struct kmem_cache *s, *c;
2a4db7eb9   Vladimir Davydov   memcg: free memcg...
547
548
  
  	idx = memcg_cache_id(memcg);
d6e0b7fa1   Vladimir Davydov   slub: make dead c...
549
550
  	get_online_cpus();
  	get_online_mems();
2a4db7eb9   Vladimir Davydov   memcg: free memcg...
551
552
553
554
555
556
557
  	mutex_lock(&slab_mutex);
  	list_for_each_entry(s, &slab_caches, list) {
  		if (!is_root_cache(s))
  			continue;
  
  		arr = rcu_dereference_protected(s->memcg_params.memcg_caches,
  						lockdep_is_held(&slab_mutex));
d6e0b7fa1   Vladimir Davydov   slub: make dead c...
558
559
560
561
562
  		c = arr->entries[idx];
  		if (!c)
  			continue;
  
  		__kmem_cache_shrink(c, true);
2a4db7eb9   Vladimir Davydov   memcg: free memcg...
563
564
565
  		arr->entries[idx] = NULL;
  	}
  	mutex_unlock(&slab_mutex);
d6e0b7fa1   Vladimir Davydov   slub: make dead c...
566
567
568
  
  	put_online_mems();
  	put_online_cpus();
2a4db7eb9   Vladimir Davydov   memcg: free memcg...
569
  }
d60fdcc9e   Vladimir Davydov   mm/slab_common.c:...
570
571
572
573
574
575
576
577
578
579
580
  /*
   * Shut down one per-memcg cache (calling this on a root cache is a BUG).
   * On success the cache is also unlinked from the memcg_params.list it is
   * on and 0 is returned; if shutdown_cache() fails the link is kept and
   * -EBUSY is returned.
   */
  static int __shutdown_memcg_cache(struct kmem_cache *s,
  		struct list_head *release, bool *need_rcu_barrier)
  {
  	int busy;

  	BUG_ON(is_root_cache(s));

  	busy = shutdown_cache(s, release, need_rcu_barrier);
  	if (!busy) {
  		list_del(&s->memcg_params.list);
  		return 0;
  	}

  	return -EBUSY;
  }
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
581
  void memcg_destroy_kmem_caches(struct mem_cgroup *memcg)
b8529907b   Vladimir Davydov   memcg, slab: do n...
582
  {
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
583
584
585
  	LIST_HEAD(release);
  	bool need_rcu_barrier = false;
  	struct kmem_cache *s, *s2;
b8529907b   Vladimir Davydov   memcg, slab: do n...
586

d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
587
588
  	get_online_cpus();
  	get_online_mems();
b8529907b   Vladimir Davydov   memcg, slab: do n...
589

b8529907b   Vladimir Davydov   memcg, slab: do n...
590
  	mutex_lock(&slab_mutex);
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
591
  	list_for_each_entry_safe(s, s2, &slab_caches, list) {
f7ce3190c   Vladimir Davydov   slab: embed memcg...
592
  		if (is_root_cache(s) || s->memcg_params.memcg != memcg)
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
593
594
595
596
597
  			continue;
  		/*
  		 * The cgroup is about to be freed and therefore has no charges
  		 * left. Hence, all its caches must be empty by now.
  		 */
d60fdcc9e   Vladimir Davydov   mm/slab_common.c:...
598
  		BUG_ON(__shutdown_memcg_cache(s, &release, &need_rcu_barrier));
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
599
600
  	}
  	mutex_unlock(&slab_mutex);
b8529907b   Vladimir Davydov   memcg, slab: do n...
601

d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
602
603
  	put_online_mems();
  	put_online_cpus();
c9a77a792   Vladimir Davydov   mm/slab_common.c:...
604
  	release_caches(&release, need_rcu_barrier);
b8529907b   Vladimir Davydov   memcg, slab: do n...
605
  }
d60fdcc9e   Vladimir Davydov   mm/slab_common.c:...
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
  
  /*
   * Shut down all per-memcg children of root cache @s (a non-root @s is a
   * BUG).  Children that were shut down end up on @release;
   * @need_rcu_barrier is passed through to the per-cache shutdown.  Returns
   * 0 when no child is left linked to @s afterwards, -EBUSY otherwise.
   */
  static int shutdown_memcg_caches(struct kmem_cache *s,
  		struct list_head *release, bool *need_rcu_barrier)
  {
  	struct memcg_cache_array *caches;
  	struct kmem_cache *child, *next;
  	LIST_HEAD(still_busy);
  	int idx;

  	BUG_ON(!is_root_cache(s));

  	/*
  	 * Pass one: the active children, i.e. those still reachable through
  	 * the memcg_caches array because their memory cgroup is online.
  	 */
  	caches = rcu_dereference_protected(s->memcg_params.memcg_caches,
  					   lockdep_is_held(&slab_mutex));
  	for_each_memcg_cache_index(idx) {
  		child = caches->entries[idx];
  		if (!child)
  			continue;

  		if (__shutdown_memcg_cache(child, release, need_rcu_barrier)) {
  			/*
  			 * Objects are still allocated from this child.  Park
  			 * it on a private list so that pass two does not
  			 * attempt to shut it down again.
  			 */
  			list_move(&child->memcg_params.list, &still_busy);
  		} else {
  			/*
  			 * The child was empty and is on its way out.  Drop
  			 * the array slot so it cannot be reached any more,
  			 * even if the root cache itself survives.
  			 */
  			caches->entries[idx] = NULL;
  		}
  	}

  	/*
  	 * Pass two: whatever is still linked to the root belongs to memory
  	 * cgroups that have gone offline.
  	 */
  	list_for_each_entry_safe(child, next, &s->memcg_params.list,
  				 memcg_params.list) {
  		__shutdown_memcg_cache(child, release, need_rcu_barrier);
  	}

  	/* Put the parked children back on the root's list. */
  	list_splice(&still_busy, &s->memcg_params.list);

  	/*
  	 * Destroying a cache requires it to be empty, and that includes
  	 * every per-memcg cache hanging off it.
  	 */
  	return list_empty(&s->memcg_params.list) ? 0 : -EBUSY;
  }
  #else
  /*
   * Stub for builds without CONFIG_MEMCG (or with CONFIG_SLOB): there are
   * no per-memcg caches, so there is nothing to shut down.
   */
  static inline int shutdown_memcg_caches(struct kmem_cache *s,
  					struct list_head *release,
  					bool *need_rcu_barrier)
  {
  	return 0;
  }
127424c86   Johannes Weiner   mm: memcontrol: m...
668
  #endif /* CONFIG_MEMCG && !CONFIG_SLOB */
97d066091   Christoph Lameter   mm, sl[aou]b: Com...
669

41a212859   Christoph Lameter   slub: use sysfs'e...
670
671
  void slab_kmem_cache_release(struct kmem_cache *s)
  {
52b4b950b   Dmitry Safonov   mm: slab: free km...
672
  	__kmem_cache_release(s);
f7ce3190c   Vladimir Davydov   slab: embed memcg...
673
  	destroy_memcg_params(s);
3dec16ea3   Andrzej Hajda   mm/slab: convert ...
674
  	kfree_const(s->name);
41a212859   Christoph Lameter   slub: use sysfs'e...
675
676
  	kmem_cache_free(kmem_cache, s);
  }
945cf2b61   Christoph Lameter   mm/sl[aou]b: Extr...
677
678
  void kmem_cache_destroy(struct kmem_cache *s)
  {
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
679
680
  	LIST_HEAD(release);
  	bool need_rcu_barrier = false;
d60fdcc9e   Vladimir Davydov   mm/slab_common.c:...
681
  	int err;
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
682

3942d2991   Sergey Senozhatsky   mm/slab_common: a...
683
684
  	if (unlikely(!s))
  		return;
945cf2b61   Christoph Lameter   mm/sl[aou]b: Extr...
685
  	get_online_cpus();
03afc0e25   Vladimir Davydov   slab: get_online_...
686
  	get_online_mems();
55834c590   Alexander Potapenko   mm: kasan: initia...
687
  	kasan_cache_destroy(s);
945cf2b61   Christoph Lameter   mm/sl[aou]b: Extr...
688
  	mutex_lock(&slab_mutex);
b8529907b   Vladimir Davydov   memcg, slab: do n...
689

945cf2b61   Christoph Lameter   mm/sl[aou]b: Extr...
690
  	s->refcount--;
b8529907b   Vladimir Davydov   memcg, slab: do n...
691
692
  	if (s->refcount)
  		goto out_unlock;
d60fdcc9e   Vladimir Davydov   mm/slab_common.c:...
693
694
  	err = shutdown_memcg_caches(s, &release, &need_rcu_barrier);
  	if (!err)
cd918c557   Vladimir Davydov   mm/slab_common.c:...
695
  		err = shutdown_cache(s, &release, &need_rcu_barrier);
b8529907b   Vladimir Davydov   memcg, slab: do n...
696

cd918c557   Vladimir Davydov   mm/slab_common.c:...
697
  	if (err) {
756a025f0   Joe Perches   mm: coalesce spli...
698
699
700
  		pr_err("kmem_cache_destroy %s: Slab cache still has objects
  ",
  		       s->name);
cd918c557   Vladimir Davydov   mm/slab_common.c:...
701
702
  		dump_stack();
  	}
b8529907b   Vladimir Davydov   memcg, slab: do n...
703
704
  out_unlock:
  	mutex_unlock(&slab_mutex);
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
705

03afc0e25   Vladimir Davydov   slab: get_online_...
706
  	put_online_mems();
945cf2b61   Christoph Lameter   mm/sl[aou]b: Extr...
707
  	put_online_cpus();
d5b3cf713   Vladimir Davydov   memcg: zap memcg_...
708

c9a77a792   Vladimir Davydov   mm/slab_common.c:...
709
  	release_caches(&release, need_rcu_barrier);
945cf2b61   Christoph Lameter   mm/sl[aou]b: Extr...
710
711
  }
  EXPORT_SYMBOL(kmem_cache_destroy);
03afc0e25   Vladimir Davydov   slab: get_online_...
712
713
714
715
716
717
718
719
720
721
722
723
724
  /**
   * kmem_cache_shrink - Shrink a cache.
   * @cachep: The cache to shrink.
   *
   * Releases as many slabs as possible for a cache.
   * To help debugging, a zero exit status indicates all slabs were released.
   */
  int kmem_cache_shrink(struct kmem_cache *cachep)
  {
  	int ret;
  
  	get_online_cpus();
  	get_online_mems();
55834c590   Alexander Potapenko   mm: kasan: initia...
725
  	kasan_cache_shrink(cachep);
d6e0b7fa1   Vladimir Davydov   slub: make dead c...
726
  	ret = __kmem_cache_shrink(cachep, false);
03afc0e25   Vladimir Davydov   slab: get_online_...
727
728
729
730
731
  	put_online_mems();
  	put_online_cpus();
  	return ret;
  }
  EXPORT_SYMBOL(kmem_cache_shrink);
fda901241   Denis Kirjanov   slab: convert sla...
732
  bool slab_is_available(void)
97d066091   Christoph Lameter   mm, sl[aou]b: Com...
733
734
735
  {
  	return slab_state >= UP;
  }
b7454ad3c   Glauber Costa   mm/sl[au]b: Move ...
736

45530c447   Christoph Lameter   mm, sl[au]b: crea...
737
738
739
740
741
742
743
744
745
  #ifndef CONFIG_SLOB
  /*
   * Create a cache during boot when no slab services are available yet.
   *
   * @s:     caller-provided descriptor to initialise
   * @name:  cache name; stored by pointer, not copied
   * @size:  object size, used for both s->size and s->object_size
   * @flags: flags passed to calculate_alignment() and __kmem_cache_create()
   *
   * Panics if __kmem_cache_create() fails.
   */
  void __init create_boot_cache(struct kmem_cache *s, const char *name, size_t size,
  		unsigned long flags)
  {
  	int err;
  
  	s->name = name;
  	s->size = s->object_size = size;
  	s->align = calculate_alignment(flags, ARCH_KMALLOC_MINALIGN, size);
  
  	slab_init_memcg_params(s);
  
  	err = __kmem_cache_create(s, flags);
  
  	if (err)
  		panic("Creation of kmalloc slab %s size=%zu failed. Reason %d\n",
  					name, size, err);
  
  	s->refcount = -1;	/* Exempt from merging for now */
  }
  
  /*
   * Allocate a zeroed kmem_cache descriptor, set it up via
   * create_boot_cache(), add it to slab_caches and return it with a
   * refcount of 1. Panics if the descriptor cannot be allocated.
   */
  struct kmem_cache *__init create_kmalloc_cache(const char *name, size_t size,
  				unsigned long flags)
  {
  	struct kmem_cache *s = kmem_cache_zalloc(kmem_cache, GFP_NOWAIT);
  
  	if (!s)
  		panic("Out of memory when creating slab %s\n", name);
  
  	create_boot_cache(s, name, size, flags);
  	list_add(&s->list, &slab_caches);
  	/* create_boot_cache() left refcount at -1; this makes it a normal cache. */
  	s->refcount = 1;
  	return s;
  }
9425c58e5   Christoph Lameter   slab: Common defi...
773
774
775
776
777
778
779
  /* Regular kmalloc caches; kmalloc_slab() picks one by a size-derived index. */
  struct kmem_cache *kmalloc_caches[KMALLOC_SHIFT_HIGH + 1];
  EXPORT_SYMBOL(kmalloc_caches);
  
  #ifdef CONFIG_ZONE_DMA
  /* Counterparts that kmalloc_slab() returns when GFP_DMA is set in the flags. */
  struct kmem_cache *kmalloc_dma_caches[KMALLOC_SHIFT_HIGH + 1];
  EXPORT_SYMBOL(kmalloc_dma_caches);
  #endif
f97d5f634   Christoph Lameter   slab: Common func...
780
  /*
2c59dd654   Christoph Lameter   slab: Common Kmal...
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
   * Conversion table from small slab sizes / 8 to the index in the
   * kmalloc array. This is necessary for slabs < 192 since we have non power
   * of two cache sizes there. The size of larger slabs can be determined using
   * fls.
   */
  static s8 size_index[24] = {
  	/*
  	 * Slot n serves request sizes 8*n+1 .. 8*n+8 bytes (see
  	 * size_index_elem()); the trailing comment on each row is the
  	 * upper bound of that range. Values 1 and 2 are the kmalloc-96
  	 * and kmalloc-192 entries of kmalloc_info[]. The table is not
  	 * const because setup_kmalloc_cache_index_table() patches it.
  	 */
  	3,	/* 8 */
  	4,	/* 16 */
  	5,	/* 24 */
  	5,	/* 32 */
  	6,	/* 40 */
  	6,	/* 48 */
  	6,	/* 56 */
  	6,	/* 64 */
  	1,	/* 72 */
  	1,	/* 80 */
  	1,	/* 88 */
  	1,	/* 96 */
  	7,	/* 104 */
  	7,	/* 112 */
  	7,	/* 120 */
  	7,	/* 128 */
  	2,	/* 136 */
  	2,	/* 144 */
  	2,	/* 152 */
  	2,	/* 160 */
  	2,	/* 168 */
  	2,	/* 176 */
  	2,	/* 184 */
  	2	/* 192 */
  };
  
  /* Map an allocation size in bytes to its slot in size_index[]. */
  static inline int size_index_elem(size_t bytes)
  {
  	size_t slot = (bytes - 1) >> 3;	/* one slot per 8 bytes */
  
  	return slot;
  }
  
  /*
   * Find the kmem_cache structure that serves a given size of
   * allocation.
   *
   * Returns NULL (warning once unless __GFP_NOWARN is set) when @size
   * exceeds KMALLOC_MAX_SIZE, and ZERO_SIZE_PTR when @size is 0.
   */
  struct kmem_cache *kmalloc_slab(size_t size, gfp_t flags)
  {
  	int idx;
  
  	if (unlikely(size > KMALLOC_MAX_SIZE)) {
  		WARN_ON_ONCE(!(flags & __GFP_NOWARN));
  		return NULL;
  	}
  
  	if (!size)
  		return ZERO_SIZE_PTR;
  
  	/* Up to 192 bytes the lookup table decides; above that, fls() does. */
  	idx = (size <= 192) ? size_index[size_index_elem(size)]
  			    : fls(size - 1);
  
  #ifdef CONFIG_ZONE_DMA
  	if (unlikely((flags & GFP_DMA)))
  		return kmalloc_dma_caches[idx];
  
  #endif
  	return kmalloc_caches[idx];
  }
  
  /*
4066c33d0   Gavin Guo   mm/slab_common: s...
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
   * kmalloc_info[] is to make slub_debug=,kmalloc-xx option work at boot time.
   * kmalloc_index() supports up to 2^26=64MB, so the final entry of the table is
   * kmalloc-67108864.
   */
  static struct {
  	const char *name;	/* cache name handed to create_kmalloc_cache() */
  	unsigned long size;	/* object size in bytes */
  } const kmalloc_info[] __initconst = {
  	/*
  	 * Entry i describes kmalloc_caches[i]. Slot 0 is a placeholder and
  	 * slots 1 and 2 hold the two sizes that are not a power of two.
  	 */
  	{NULL,                      0},		{"kmalloc-96",             96},
  	{"kmalloc-192",           192},		{"kmalloc-8",               8},
  	{"kmalloc-16",             16},		{"kmalloc-32",             32},
  	{"kmalloc-64",             64},		{"kmalloc-128",           128},
  	{"kmalloc-256",           256},		{"kmalloc-512",           512},
  	{"kmalloc-1024",         1024},		{"kmalloc-2048",         2048},
  	{"kmalloc-4096",         4096},		{"kmalloc-8192",         8192},
  	{"kmalloc-16384",       16384},		{"kmalloc-32768",       32768},
  	{"kmalloc-65536",       65536},		{"kmalloc-131072",     131072},
  	{"kmalloc-262144",     262144},		{"kmalloc-524288",     524288},
  	{"kmalloc-1048576",   1048576},		{"kmalloc-2097152",   2097152},
  	{"kmalloc-4194304",   4194304},		{"kmalloc-8388608",   8388608},
  	{"kmalloc-16777216", 16777216},		{"kmalloc-33554432", 33554432},
  	{"kmalloc-67108864", 67108864}
  };
  
  /*
34cc6990d   Daniel Sanders   slab: correct siz...
872
873
874
875
876
877
878
879
880
   * Patch up the size_index table if we have strange large alignment
   * requirements for the kmalloc array. This is only the case for
   * MIPS it seems. The standard arches will not generate any code here.
   *
   * Largest permitted alignment is 256 bytes due to the way we
   * handle the index determination for the smaller caches.
   *
   * Make sure that nothing crazy happens if someone starts tinkering
   * around with ARCH_KMALLOC_MINALIGN
f97d5f634   Christoph Lameter   slab: Common func...
881
   */
34cc6990d   Daniel Sanders   slab: correct siz...
882
  void __init setup_kmalloc_cache_index_table(void)
f97d5f634   Christoph Lameter   slab: Common func...
883
884
  {
  	int i;
2c59dd654   Christoph Lameter   slab: Common Kmal...
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
  	BUILD_BUG_ON(KMALLOC_MIN_SIZE > 256 ||
  		(KMALLOC_MIN_SIZE & (KMALLOC_MIN_SIZE - 1)));
  
  	for (i = 8; i < KMALLOC_MIN_SIZE; i += 8) {
  		int elem = size_index_elem(i);
  
  		if (elem >= ARRAY_SIZE(size_index))
  			break;
  		size_index[elem] = KMALLOC_SHIFT_LOW;
  	}
  
  	if (KMALLOC_MIN_SIZE >= 64) {
  		/*
  		 * The 96 byte size cache is not used if the alignment
  		 * is 64 byte.
  		 */
  		for (i = 64 + 8; i <= 96; i += 8)
  			size_index[size_index_elem(i)] = 7;
  
  	}
  
  	if (KMALLOC_MIN_SIZE >= 128) {
  		/*
  		 * The 192 byte sized cache is not used if the alignment
  		 * is 128 byte. Redirect kmalloc to use the 256 byte cache
  		 * instead.
  		 */
  		for (i = 128 + 8; i <= 192; i += 8)
  			size_index[size_index_elem(i)] = 8;
  	}
34cc6990d   Daniel Sanders   slab: correct siz...
915
  }
ae6f2462e   Christoph Lameter   Add __init attrib...
916
  /* Instantiate kmalloc_caches[idx] from its kmalloc_info[] description. */
  static void __init new_kmalloc_cache(int idx, unsigned long flags)
  {
  	const char *name = kmalloc_info[idx].name;
  	unsigned long size = kmalloc_info[idx].size;
  
  	kmalloc_caches[idx] = create_kmalloc_cache(name, size, flags);
  }
34cc6990d   Daniel Sanders   slab: correct siz...
921
922
923
924
925
926
927
928
  /*
   * Create the kmalloc array. Some of the regular kmalloc arrays
   * may already have been created because they were needed to
   * enable allocations for slab creation.
   */
  void __init create_kmalloc_caches(unsigned long flags)
  {
  	int idx;
  
  	for (idx = KMALLOC_SHIFT_LOW; idx <= KMALLOC_SHIFT_HIGH; idx++) {
  		if (!kmalloc_caches[idx])
  			new_kmalloc_cache(idx, flags);
  
  		/*
  		 * Caches that are not of the two-to-the-power-of size.
  		 * These have to be created immediately after the
  		 * earlier power of two caches
  		 */
  		if (idx == 6 && KMALLOC_MIN_SIZE <= 32 && !kmalloc_caches[1])
  			new_kmalloc_cache(1, flags);
  		if (idx == 7 && KMALLOC_MIN_SIZE <= 64 && !kmalloc_caches[2])
  			new_kmalloc_cache(2, flags);
  	}
  
  	/* Kmalloc array is now usable */
  	slab_state = UP;
  
  #ifdef CONFIG_ZONE_DMA
  	/* Give every existing kmalloc cache a "dma-kmalloc-<size>" twin. */
  	for (idx = 0; idx <= KMALLOC_SHIFT_HIGH; idx++) {
  		int size;
  		char *dma_name;
  
  		if (!kmalloc_caches[idx])
  			continue;
  
  		size = kmalloc_size(idx);
  		dma_name = kasprintf(GFP_NOWAIT, "dma-kmalloc-%d", size);
  		BUG_ON(!dma_name);
  
  		kmalloc_dma_caches[idx] = create_kmalloc_cache(dma_name,
  				size, SLAB_CACHE_DMA | flags);
  	}
  #endif
  }
45530c447   Christoph Lameter   mm, sl[au]b: crea...
961
  #endif /* !CONFIG_SLOB */
cea371f4f   Vladimir Davydov   slab: document km...
962
963
964
965
966
  /*
   * To avoid unnecessary overhead, we pass through large allocation requests
   * directly to the page allocator. We use __GFP_COMP, because we will need to
   * know the allocation order to free the pages properly in kfree.
   */
52383431b   Vladimir Davydov   mm: get rid of __...
967
968
969
970
971
972
  void *kmalloc_order(size_t size, gfp_t flags, unsigned int order)
  {
  	void *ret;
  	struct page *page;
  
  	flags |= __GFP_COMP;
4949148ad   Vladimir Davydov   mm: charge/unchar...
973
  	page = alloc_pages(flags, order);
52383431b   Vladimir Davydov   mm: get rid of __...
974
975
  	ret = page ? page_address(page) : NULL;
  	kmemleak_alloc(ret, size, 1, flags);
505f5dcb1   Alexander Potapenko   mm, kasan: add GF...
976
  	kasan_kmalloc_large(ret, size, flags);
52383431b   Vladimir Davydov   mm: get rid of __...
977
978
979
  	return ret;
  }
  EXPORT_SYMBOL(kmalloc_order);
f1b6eb6e6   Christoph Lameter   mm/sl[aou]b: Move...
980
981
982
983
984
985
986
987
988
  #ifdef CONFIG_TRACING
  /* kmalloc_order() plus a kmalloc tracepoint attributed to our caller. */
  void *kmalloc_order_trace(size_t size, gfp_t flags, unsigned int order)
  {
  	void *addr;
  
  	addr = kmalloc_order(size, flags, order);
  	trace_kmalloc(_RET_IP_, addr, size, PAGE_SIZE << order, flags);
  
  	return addr;
  }
  EXPORT_SYMBOL(kmalloc_order_trace);
  #endif
45530c447   Christoph Lameter   mm, sl[au]b: crea...
989

7c00fce98   Thomas Garnier   mm: reorganize SL...
990
991
992
993
994
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
1015
1016
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
  #ifdef CONFIG_SLAB_FREELIST_RANDOM
  /*
   * Randomize a generic freelist: fill @list with 0..@count-1 and shuffle
   * it in place using random numbers drawn from @state.
   */
  static void freelist_randomize(struct rnd_state *state, unsigned int *list,
  			size_t count)
  {
  	size_t pos;
  	unsigned int pick;
  
  	/* Start from the identity permutation. */
  	for (pos = 0; pos < count; pos++)
  		list[pos] = pos;
  
  	/* Fisher-Yates shuffle, walking down from the last element. */
  	pos = count - 1;
  	while (pos > 0) {
  		pick = prandom_u32_state(state);
  		pick %= (pos + 1);
  		swap(list[pos], list[pick]);
  		pos--;
  	}
  }
  
  /*
   * Create a random sequence per cache.
   *
   * Does nothing and returns 0 when @count is below 2 or the cache already
   * has a sequence. Returns -ENOMEM if the sequence cannot be allocated.
   */
  int cache_random_seq_create(struct kmem_cache *cachep, unsigned int count,
  				    gfp_t gfp)
  {
  	struct rnd_state state;
  
  	if (cachep->random_seq || count < 2)
  		return 0;
  
  	cachep->random_seq = kcalloc(count, sizeof(unsigned int), gfp);
  	if (!cachep->random_seq)
  		return -ENOMEM;
  
  	/* Get best entropy at this stage of boot */
  	prandom_seed_state(&state, get_random_long());
  	freelist_randomize(&state, cachep->random_seq, count);
  
  	return 0;
  }
  
  /*
   * Destroy the per-cache random freelist sequence. The pointer is reset
   * to NULL afterwards.
   */
  void cache_random_seq_destroy(struct kmem_cache *cachep)
  {
  	kfree(cachep->random_seq);
  	cachep->random_seq = NULL;
  }
  #endif /* CONFIG_SLAB_FREELIST_RANDOM */
b7454ad3c   Glauber Costa   mm/sl[au]b: Move ...
1036
  #ifdef CONFIG_SLABINFO
e9b4db2b8   Wanpeng Li   mm/slab: Fix /pro...
1037
1038
1039
1040
1041
1042
  
  #ifdef CONFIG_SLAB
  #define SLABINFO_RIGHTS (S_IWUSR | S_IRUSR)
  #else
  #define SLABINFO_RIGHTS S_IRUSR
  #endif
b047501cd   Vladimir Davydov   memcg: use generi...
1043
  /*
   * Emit the slabinfo header: a version line followed by one line naming
   * the columns. The statistics columns are present only when
   * CONFIG_DEBUG_SLAB is set.
   */
  static void print_slabinfo_header(struct seq_file *m)
  {
  	/*
  	 * Output format version, so at least we can change it
  	 * without _too_ many complaints.
  	 */
  #ifdef CONFIG_DEBUG_SLAB
  	seq_puts(m, "slabinfo - version: 2.1 (statistics)\n");
  #else
  	seq_puts(m, "slabinfo - version: 2.1\n");
  #endif
  	seq_puts(m, "# name            <active_objs> <num_objs> <objsize> <objperslab> <pagesperslab>");
  	seq_puts(m, " : tunables <limit> <batchcount> <sharedfactor>");
  	seq_puts(m, " : slabdata <active_slabs> <num_slabs> <sharedavail>");
  #ifdef CONFIG_DEBUG_SLAB
  	seq_puts(m, " : globalstat <listallocs> <maxobjs> <grown> <reaped> <error> <maxfreeable> <nodeallocs> <remotefrees> <alienoverflow>");
  	seq_puts(m, " : cpustat <allochit> <allocmiss> <freehit> <freemiss>");
  #endif
  	seq_putc(m, '\n');
  }
1df3b26f2   Vladimir Davydov   slab: print slabi...
1066
  /*
   * seq_file ->start: take slab_mutex and position the iterator at *@pos
   * within slab_caches. The mutex is released again in slab_stop().
   */
  void *slab_start(struct seq_file *m, loff_t *pos)
  {
  	mutex_lock(&slab_mutex);
  
  	return seq_list_start(&slab_caches, *pos);
  }
276a2439c   Wanpeng Li   mm/slab: Give s_n...
1071
  /* seq_file ->next: step to the entry after @p in slab_caches. */
  void *slab_next(struct seq_file *m, void *p, loff_t *pos)
  {
  	return seq_list_next(p, &slab_caches, pos);
  }
276a2439c   Wanpeng Li   mm/slab: Give s_n...
1075
  void slab_stop(struct seq_file *m, void *p)
b7454ad3c   Glauber Costa   mm/sl[au]b: Move ...
1076
1077
1078
  {
  	mutex_unlock(&slab_mutex);
  }
749c54151   Glauber Costa   memcg: aggregate ...
1079
1080
1081
1082
1083
  static void
  memcg_accumulate_slabinfo(struct kmem_cache *s, struct slabinfo *info)
  {
  	struct kmem_cache *c;
  	struct slabinfo sinfo;
749c54151   Glauber Costa   memcg: aggregate ...
1084
1085
1086
  
  	if (!is_root_cache(s))
  		return;
426589f57   Vladimir Davydov   slab: link memcg ...
1087
  	for_each_memcg_cache(c, s) {
749c54151   Glauber Costa   memcg: aggregate ...
1088
1089
1090
1091
1092
1093
1094
1095
1096
1097
  		memset(&sinfo, 0, sizeof(sinfo));
  		get_slabinfo(c, &sinfo);
  
  		info->active_slabs += sinfo.active_slabs;
  		info->num_slabs += sinfo.num_slabs;
  		info->shared_avail += sinfo.shared_avail;
  		info->active_objs += sinfo.active_objs;
  		info->num_objs += sinfo.num_objs;
  	}
  }
b047501cd   Vladimir Davydov   memcg: use generi...
1098
  static void cache_show(struct kmem_cache *s, struct seq_file *m)
b7454ad3c   Glauber Costa   mm/sl[au]b: Move ...
1099
  {
0d7561c61   Glauber Costa   sl[au]b: Process ...
1100
1101
1102
1103
  	struct slabinfo sinfo;
  
  	memset(&sinfo, 0, sizeof(sinfo));
  	get_slabinfo(s, &sinfo);
749c54151   Glauber Costa   memcg: aggregate ...
1104
  	memcg_accumulate_slabinfo(s, &sinfo);
0d7561c61   Glauber Costa   sl[au]b: Process ...
1105
  	seq_printf(m, "%-17s %6lu %6lu %6u %4u %4d",
749c54151   Glauber Costa   memcg: aggregate ...
1106
  		   cache_name(s), sinfo.active_objs, sinfo.num_objs, s->size,
0d7561c61   Glauber Costa   sl[au]b: Process ...
1107
1108
1109
1110
1111
1112
1113
1114
1115
  		   sinfo.objects_per_slab, (1 << sinfo.cache_order));
  
  	seq_printf(m, " : tunables %4u %4u %4u",
  		   sinfo.limit, sinfo.batchcount, sinfo.shared);
  	seq_printf(m, " : slabdata %6lu %6lu %6lu",
  		   sinfo.active_slabs, sinfo.num_slabs, sinfo.shared_avail);
  	slabinfo_show_stats(m, s);
  	seq_putc(m, '
  ');
b7454ad3c   Glauber Costa   mm/sl[au]b: Move ...
1116
  }
1df3b26f2   Vladimir Davydov   slab: print slabi...
1117
  static int slab_show(struct seq_file *m, void *p)
749c54151   Glauber Costa   memcg: aggregate ...
1118
1119
  {
  	struct kmem_cache *s = list_entry(p, struct kmem_cache, list);
1df3b26f2   Vladimir Davydov   slab: print slabi...
1120
1121
  	if (p == slab_caches.next)
  		print_slabinfo_header(m);
b047501cd   Vladimir Davydov   memcg: use generi...
1122
1123
1124
1125
  	if (is_root_cache(s))
  		cache_show(s, m);
  	return 0;
  }
127424c86   Johannes Weiner   mm: memcontrol: m...
1126
  #if defined(CONFIG_MEMCG) && !defined(CONFIG_SLOB)
b047501cd   Vladimir Davydov   memcg: use generi...
1127
1128
1129
1130
1131
1132
1133
  int memcg_slab_show(struct seq_file *m, void *p)
  {
  	struct kmem_cache *s = list_entry(p, struct kmem_cache, list);
  	struct mem_cgroup *memcg = mem_cgroup_from_css(seq_css(m));
  
  	if (p == slab_caches.next)
  		print_slabinfo_header(m);
f7ce3190c   Vladimir Davydov   slab: embed memcg...
1134
  	if (!is_root_cache(s) && s->memcg_params.memcg == memcg)
b047501cd   Vladimir Davydov   memcg: use generi...
1135
1136
  		cache_show(s, m);
  	return 0;
749c54151   Glauber Costa   memcg: aggregate ...
1137
  }
b047501cd   Vladimir Davydov   memcg: use generi...
1138
  #endif
749c54151   Glauber Costa   memcg: aggregate ...
1139

b7454ad3c   Glauber Costa   mm/sl[au]b: Move ...
1140
1141
1142
1143
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
  /*
   * slabinfo_op - iterator that generates /proc/slabinfo
   *
   * Output layout:
   * cache-name
   * num-active-objs
   * total-objs
   * object size
   * num-active-slabs
   * total-slabs
   * num-pages-per-slab
   * + further values on SMP and with statistics enabled
   */
  static const struct seq_operations slabinfo_op = {
1df3b26f2   Vladimir Davydov   slab: print slabi...
1154
  	.start = slab_start,
276a2439c   Wanpeng Li   mm/slab: Give s_n...
1155
1156
  	.next = slab_next,
  	.stop = slab_stop,
1df3b26f2   Vladimir Davydov   slab: print slabi...
1157
  	.show = slab_show,
b7454ad3c   Glauber Costa   mm/sl[au]b: Move ...
1158
1159
1160
1161
1162
1163
1164
1165
1166
1167
1168
1169
1170
1171
1172
1173
1174
  };
  
  /* ->open for /proc/slabinfo: attach the slabinfo_op iterator to @file. */
  static int slabinfo_open(struct inode *inode, struct file *file)
  {
  	int rc = seq_open(file, &slabinfo_op);
  
  	return rc;
  }
  
  /*
   * File operations for the "slabinfo" proc entry. Reads go through the
   * seq_file helpers; writes are handed to slabinfo_write(). The entry is
   * created with S_IWUSR only when CONFIG_SLAB is set (see SLABINFO_RIGHTS).
   */
  static const struct file_operations proc_slabinfo_operations = {
  	.open		= slabinfo_open,
  	.read		= seq_read,
  	.write          = slabinfo_write,
  	.llseek		= seq_lseek,
  	.release	= seq_release,
  };
  
  /*
   * Register the "slabinfo" proc entry. The result of proc_create() is not
   * checked; the function always returns 0.
   */
  static int __init slab_proc_init(void)
  {
  	proc_create("slabinfo", SLABINFO_RIGHTS, NULL,
  		    &proc_slabinfo_operations);
  
  	return 0;
  }
  module_init(slab_proc_init);
  #endif /* CONFIG_SLABINFO */
928cec9cd   Andrey Ryabinin   mm: move slab rel...
1181
1182
1183
1184
1185
1186
1187
1188
1189
  
  /*
   * Common worker for __krealloc() and krealloc().
   *
   * If the buffer behind @p is already at least @new_size bytes (per
   * ksize()), it is returned unchanged after notifying KASAN. Otherwise a
   * new buffer is allocated and the old contents are copied into it. The
   * old buffer is never freed here. Returns NULL if the allocation fails.
   */
  static __always_inline void *__do_krealloc(const void *p, size_t new_size,
  					   gfp_t flags)
  {
  	size_t old_size = 0;
  	void *new_buf;
  
  	if (p)
  		old_size = ksize(p);
  
  	/* The existing buffer is big enough: reuse it. */
  	if (old_size >= new_size) {
  		kasan_krealloc((void *)p, new_size, flags);
  		return (void *)p;
  	}
  
  	new_buf = kmalloc_track_caller(new_size, flags);
  	if (new_buf && p)
  		memcpy(new_buf, p, old_size);
  
  	return new_buf;
  }
  
  /**
   * __krealloc - like krealloc() but don't free @p.
   * @p: object to reallocate memory for.
   * @new_size: how many bytes of memory are required.
   * @flags: the type of memory to allocate.
   *
   * This function is like krealloc() except it never frees the originally
   * allocated buffer. Use this if you don't want to free the buffer immediately
   * like, for example, with RCU.
   *
   * A @new_size of 0 yields ZERO_SIZE_PTR without touching @p.
   */
  void *__krealloc(const void *p, size_t new_size, gfp_t flags)
  {
  	if (likely(new_size))
  		return __do_krealloc(p, new_size, flags);
  
  	return ZERO_SIZE_PTR;
  }
  EXPORT_SYMBOL(__krealloc);
  
  /**
   * krealloc - reallocate memory. The contents will remain unchanged.
   * @p: object to reallocate memory for.
   * @new_size: how many bytes of memory are required.
   * @flags: the type of memory to allocate.
   *
   * The contents of the object pointed to are preserved up to the
   * lesser of the new and old sizes.  If @p is %NULL, krealloc()
   * behaves exactly like kmalloc().  If @new_size is 0 and @p is not a
   * %NULL pointer, the object pointed to is freed.
   *
   * If the allocation of a larger buffer fails, %NULL is returned and @p
   * is left untouched.
   */
  void *krealloc(const void *p, size_t new_size, gfp_t flags)
  {
  	void *new_buf;
  
  	if (unlikely(!new_size)) {
  		kfree(p);
  		return ZERO_SIZE_PTR;
  	}
  
  	new_buf = __do_krealloc(p, new_size, flags);
  
  	/* Free the old buffer only when the data really moved. */
  	if (new_buf && new_buf != p)
  		kfree(p);
  
  	return new_buf;
  }
  EXPORT_SYMBOL(krealloc);
  
  /**
   * kzfree - like kfree but zero memory
   * @p: object to free memory of
   *
   * The memory of the object @p points to is zeroed before freed.
   * If @p is %NULL, kzfree() does nothing.
   *
   * Note: this function zeroes the whole allocated buffer which can be a good
   * deal bigger than the requested buffer size passed to kmalloc(). So be
   * careful when using this function in performance sensitive code.
   */
  void kzfree(const void *p)
  {
  	size_t ks;
  	void *mem = (void *)p;
  
  	if (unlikely(ZERO_OR_NULL_PTR(mem)))
  		return;
  	ks = ksize(mem);
  	/*
  	 * A plain memset() right before kfree() is a dead store that the
  	 * compiler is allowed to drop; memzero_explicit() is not.
  	 */
  	memzero_explicit(mem, ks);
  	kfree(mem);
  }
  EXPORT_SYMBOL(kzfree);
  
  /* Tracepoints definitions. */
  EXPORT_TRACEPOINT_SYMBOL(kmalloc);
  EXPORT_TRACEPOINT_SYMBOL(kmem_cache_alloc);
  EXPORT_TRACEPOINT_SYMBOL(kmalloc_node);
  EXPORT_TRACEPOINT_SYMBOL(kmem_cache_alloc_node);
  EXPORT_TRACEPOINT_SYMBOL(kfree);
  EXPORT_TRACEPOINT_SYMBOL(kmem_cache_free);