/* SPDX-License-Identifier: GPL-2.0 */
#ifndef MM_SLAB_H
#define MM_SLAB_H
/*
 * Internal slab definitions
 */

#ifdef CONFIG_SLOB
/*
 * Common fields provided in kmem_cache by all slab allocators.
 * This struct is either used directly by the allocator (SLOB)
 * or the allocator must include definitions for all fields
 * provided in kmem_cache_common in its definition of kmem_cache.
 *
 * Once we can use anonymous structs (C11 standard) we could put an
 * anonymous struct definition in these allocators so that the
 * separate allocations in the kmem_cache structures of SLAB and
 * SLUB are no longer needed.
 */
struct kmem_cache {
	unsigned int object_size;/* The original size of the object */
	unsigned int size;	/* The aligned/padded/added on size */
	unsigned int align;	/* Alignment as calculated */
	slab_flags_t flags;	/* Active flags on the slab */
	unsigned int useroffset;/* Usercopy region offset */
	unsigned int usersize;	/* Usercopy region size */
	const char *name;	/* Slab name for sysfs */
	int refcount;		/* Use counter */
	void (*ctor)(void *);	/* Called on object slot creation */
	struct list_head list;	/* List of all slab caches on the system */
};

#endif /* CONFIG_SLOB */

#ifdef CONFIG_SLAB
#include <linux/slab_def.h>
#endif

#ifdef CONFIG_SLUB
#include <linux/slub_def.h>
#endif

#include <linux/memcontrol.h>
#include <linux/fault-inject.h>
#include <linux/kasan.h>
#include <linux/kmemleak.h>
#include <linux/random.h>
#include <linux/sched/mm.h>
#include <linux/android_vendor.h>

/*
 * State of the slab allocator.
 *
 * This is used to describe the states of the allocator during bootup.
 * Allocators use this to gradually bootstrap themselves. Most allocators
 * have the problem that the structures used for managing slab caches are
 * allocated from slab caches themselves.
 */
enum slab_state {
	DOWN,			/* No slab functionality yet */
	PARTIAL,		/* SLUB: kmem_cache_node available */
	PARTIAL_NODE,		/* SLAB: kmalloc size for node struct available */
	UP,			/* Slab caches usable but not all extras yet */
	FULL			/* Everything is working */
};
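
/*
 * Illustrative gating on the bootstrap state (a sketch, not code from this
 * header; the in-tree helper slab_is_available() in <linux/slab.h> wraps the
 * same check):
 *
 *	if (slab_state >= UP)
 *		...safe to call kmem_cache_create()/kmalloc()...
 */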

extern enum slab_state slab_state;

/* The slab cache mutex protects the management structures during changes */
extern struct mutex slab_mutex;

/* The list of all slab caches on the system */
extern struct list_head slab_caches;

/* The slab cache that manages slab cache information */
extern struct kmem_cache *kmem_cache;

/* A table of kmalloc cache names and sizes */
extern const struct kmalloc_info_struct {
	const char *name[NR_KMALLOC_TYPES];
	unsigned int size;
} kmalloc_info[];

#ifndef CONFIG_SLOB
/* Kmalloc array related functions */
void setup_kmalloc_cache_index_table(void);
void create_kmalloc_caches(slab_flags_t);

/* Find the kmalloc slab corresponding to a given size */
struct kmem_cache *kmalloc_slab(size_t, gfp_t);
#endif
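
/*
 * Sketch of how a fixed-size allocation resolves to one of the kmalloc
 * caches (illustrative only; the real __kmalloc() path also handles sizes
 * above KMALLOC_MAX_CACHE_SIZE separately):
 *
 *	struct kmem_cache *s = kmalloc_slab(size, flags);
 *
 *	if (!ZERO_OR_NULL_PTR(s))
 *		obj = kmem_cache_alloc(s, flags);
 */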

gfp_t kmalloc_fix_flags(gfp_t flags);

#ifdef CONFIG_SLUB
/*
 * Tracking user of a slab.
 */
#define TRACK_ADDRS_COUNT 16
struct track {
	unsigned long addr;	/* Called from address */
#ifdef CONFIG_STACKTRACE
	unsigned long addrs[TRACK_ADDRS_COUNT];	/* Called from address */
#endif
	int cpu;		/* Was running on cpu */
	int pid;		/* Pid context */
	unsigned long when;	/* When did the operation occur */
#ifdef CONFIG_STACKTRACE
	ANDROID_OEM_DATA(1);
#endif
};

enum track_item { TRACK_ALLOC, TRACK_FREE };
#endif

/* Functions provided by the slab allocators */
int __kmem_cache_create(struct kmem_cache *, slab_flags_t flags);

struct kmem_cache *create_kmalloc_cache(const char *name, unsigned int size,
			slab_flags_t flags, unsigned int useroffset,
			unsigned int usersize);
extern void create_boot_cache(struct kmem_cache *, const char *name,
			unsigned int size, slab_flags_t flags,
			unsigned int useroffset, unsigned int usersize);

int slab_unmergeable(struct kmem_cache *s);
struct kmem_cache *find_mergeable(unsigned size, unsigned align,
		slab_flags_t flags, const char *name, void (*ctor)(void *));
#ifndef CONFIG_SLOB
struct kmem_cache *
__kmem_cache_alias(const char *name, unsigned int size, unsigned int align,
		   slab_flags_t flags, void (*ctor)(void *));

slab_flags_t kmem_cache_flags(unsigned int object_size,
	slab_flags_t flags, const char *name);
#else
static inline struct kmem_cache *
__kmem_cache_alias(const char *name, unsigned int size, unsigned int align,
		   slab_flags_t flags, void (*ctor)(void *))
{ return NULL; }

static inline slab_flags_t kmem_cache_flags(unsigned int object_size,
	slab_flags_t flags, const char *name)
{
	return flags;
}
#endif

/* Legal flag mask for kmem_cache_create(), for various configurations */
#define SLAB_CORE_FLAGS (SLAB_HWCACHE_ALIGN | SLAB_CACHE_DMA | \
			 SLAB_CACHE_DMA32 | SLAB_PANIC | \
			 SLAB_TYPESAFE_BY_RCU | SLAB_DEBUG_OBJECTS)

#if defined(CONFIG_DEBUG_SLAB)
#define SLAB_DEBUG_FLAGS	(SLAB_RED_ZONE | SLAB_POISON | SLAB_STORE_USER)
#elif defined(CONFIG_SLUB_DEBUG)
#define SLAB_DEBUG_FLAGS	(SLAB_RED_ZONE | SLAB_POISON | SLAB_STORE_USER | \
				 SLAB_TRACE | SLAB_CONSISTENCY_CHECKS)
#else
#define SLAB_DEBUG_FLAGS	(0)
#endif

#if defined(CONFIG_SLAB)
#define SLAB_CACHE_FLAGS (SLAB_MEM_SPREAD | SLAB_NOLEAKTRACE | \
			  SLAB_RECLAIM_ACCOUNT | SLAB_TEMPORARY | \
			  SLAB_ACCOUNT)
#elif defined(CONFIG_SLUB)
#define SLAB_CACHE_FLAGS (SLAB_NOLEAKTRACE | SLAB_RECLAIM_ACCOUNT | \
			  SLAB_TEMPORARY | SLAB_ACCOUNT)
#else
#define SLAB_CACHE_FLAGS (SLAB_NOLEAKTRACE)
#endif

/* Common flags available with current configuration */
#define CACHE_CREATE_MASK (SLAB_CORE_FLAGS | SLAB_DEBUG_FLAGS | SLAB_CACHE_FLAGS)

/* Common flags permitted for kmem_cache_create */
#define SLAB_FLAGS_PERMITTED (SLAB_CORE_FLAGS | \
			      SLAB_RED_ZONE | \
			      SLAB_POISON | \
			      SLAB_STORE_USER | \
			      SLAB_TRACE | \
			      SLAB_CONSISTENCY_CHECKS | \
			      SLAB_MEM_SPREAD | \
			      SLAB_NOLEAKTRACE | \
			      SLAB_RECLAIM_ACCOUNT | \
			      SLAB_TEMPORARY | \
			      SLAB_ACCOUNT)

bool __kmem_cache_empty(struct kmem_cache *);
int __kmem_cache_shutdown(struct kmem_cache *);
void __kmem_cache_release(struct kmem_cache *);
int __kmem_cache_shrink(struct kmem_cache *);
void slab_kmem_cache_release(struct kmem_cache *);

struct seq_file;
struct file;

struct slabinfo {
	unsigned long active_objs;
	unsigned long num_objs;
	unsigned long active_slabs;
	unsigned long num_slabs;
	unsigned long shared_avail;
	unsigned int limit;
	unsigned int batchcount;
	unsigned int shared;
	unsigned int objects_per_slab;
	unsigned int cache_order;
};

void get_slabinfo(struct kmem_cache *s, struct slabinfo *sinfo);
void slabinfo_show_stats(struct seq_file *m, struct kmem_cache *s);
ssize_t slabinfo_write(struct file *file, const char __user *buffer,
		       size_t count, loff_t *ppos);

/*
 * Generic implementation of bulk operations.
 * These are useful for situations in which the allocator cannot
 * perform optimizations. In that case segments of the objects listed
 * may be allocated or freed using these operations.
 */
void __kmem_cache_free_bulk(struct kmem_cache *, size_t, void **);
int __kmem_cache_alloc_bulk(struct kmem_cache *, gfp_t, size_t, void **);
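
/*
 * Illustrative caller pattern (a sketch only; the public
 * kmem_cache_alloc_bulk()/kmem_cache_free_bulk() interfaces typically sit
 * on top of these helpers and are all-or-nothing):
 *
 *	void *objs[16];
 *
 *	if (kmem_cache_alloc_bulk(s, GFP_KERNEL, ARRAY_SIZE(objs), objs))
 *		...use objs[0..15]...
 *	...
 *	kmem_cache_free_bulk(s, ARRAY_SIZE(objs), objs);
 */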

static inline int cache_vmstat_idx(struct kmem_cache *s)
{
	return (s->flags & SLAB_RECLAIM_ACCOUNT) ?
		NR_SLAB_RECLAIMABLE_B : NR_SLAB_UNRECLAIMABLE_B;
}

#ifdef CONFIG_SLUB_DEBUG
#ifdef CONFIG_SLUB_DEBUG_ON
DECLARE_STATIC_KEY_TRUE(slub_debug_enabled);
#else
DECLARE_STATIC_KEY_FALSE(slub_debug_enabled);
#endif
extern void print_tracking(struct kmem_cache *s, void *object);
extern unsigned long get_each_object_track(struct kmem_cache *s,
		struct page *page, enum track_item alloc,
		int (*fn)(const struct kmem_cache *, const void *,
		const struct track *, void *), void *private);
extern slab_flags_t slub_debug;
static inline bool __slub_debug_enabled(void)
{
	return static_branch_unlikely(&slub_debug_enabled);
}
#else
static inline void print_tracking(struct kmem_cache *s, void *object)
{
}
static inline bool __slub_debug_enabled(void)
{
	return false;
}
#ifdef CONFIG_SLUB
static inline unsigned long get_each_object_track(struct kmem_cache *s,
		struct page *page, enum track_item alloc,
		int (*fn)(const struct kmem_cache *, const void *,
		const struct track *, void *), void *private)
{
	return 0;
}
#endif
#endif

/*
 * Returns true if any of the specified slub_debug flags is enabled for the
 * cache. Use only for flags parsed by setup_slub_debug() as it also enables
 * the static key.
 */
static inline bool kmem_cache_debug_flags(struct kmem_cache *s, slab_flags_t flags)
{
	if (IS_ENABLED(CONFIG_SLUB_DEBUG))
		VM_WARN_ON_ONCE(!(flags & SLAB_DEBUG_FLAGS));
	if (__slub_debug_enabled())
		return s->flags & flags;
	return false;
}
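
/*
 * Typical use (a sketch; cache_from_obj() further below is an in-tree
 * example of the same pattern):
 *
 *	if (kmem_cache_debug_flags(s, SLAB_STORE_USER))
 *		...consult the recorded alloc/free tracking for the object...
 */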

#ifdef CONFIG_MEMCG_KMEM
static inline struct obj_cgroup **page_obj_cgroups(struct page *page)
{
	/*
	 * page->mem_cgroup and page->obj_cgroups are sharing the same
	 * space. To distinguish between them in case we don't know for sure
	 * that the page is a slab page (e.g. page_cgroup_ino()), let's
	 * always set the lowest bit of obj_cgroups.
	 */
	return (struct obj_cgroup **)
		((unsigned long)page->obj_cgroups & ~0x1UL);
}

static inline bool page_has_obj_cgroups(struct page *page)
{
	return ((unsigned long)page->obj_cgroups & 0x1UL);
}
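
/*
 * The tag bit is set when the vector is installed; a sketch of the matching
 * store (the actual code lives in memcg_alloc_page_obj_cgroups()):
 *
 *	vec = kcalloc_node(objects, sizeof(struct obj_cgroup *), gfp, node);
 *	page->obj_cgroups = (struct obj_cgroup **)((unsigned long)vec | 0x1UL);
 */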

int memcg_alloc_page_obj_cgroups(struct page *page, struct kmem_cache *s,
				 gfp_t gfp);

static inline void memcg_free_page_obj_cgroups(struct page *page)
{
	kfree(page_obj_cgroups(page));
	page->obj_cgroups = NULL;
}

static inline size_t obj_full_size(struct kmem_cache *s)
{
	/*
	 * For each accounted object there is an extra space which is used
	 * to store obj_cgroup membership. Charge it too.
	 */
	return s->size + sizeof(struct obj_cgroup *);
}

/*
 * Returns false if the allocation should fail.
 */
static inline bool memcg_slab_pre_alloc_hook(struct kmem_cache *s,
					     struct obj_cgroup **objcgp,
					     size_t objects, gfp_t flags)
{
	struct obj_cgroup *objcg;

	if (!memcg_kmem_enabled())
		return true;

	if (!(flags & __GFP_ACCOUNT) && !(s->flags & SLAB_ACCOUNT))
		return true;

	objcg = get_obj_cgroup_from_current();
	if (!objcg)
		return true;

	if (obj_cgroup_charge(objcg, flags, objects * obj_full_size(s))) {
		obj_cgroup_put(objcg);
		return false;
	}

	*objcgp = objcg;
	return true;
}

static inline void mod_objcg_state(struct obj_cgroup *objcg,
				   struct pglist_data *pgdat,
				   int idx, int nr)
{
	struct mem_cgroup *memcg;
	struct lruvec *lruvec;

	rcu_read_lock();
	memcg = obj_cgroup_memcg(objcg);
	lruvec = mem_cgroup_lruvec(memcg, pgdat);
	mod_memcg_lruvec_state(lruvec, idx, nr);
	rcu_read_unlock();
}

static inline void memcg_slab_post_alloc_hook(struct kmem_cache *s,
					      struct obj_cgroup *objcg,
					      gfp_t flags, size_t size,
					      void **p)
{
	struct page *page;
	unsigned long off;
	size_t i;

	if (!memcg_kmem_enabled() || !objcg)
		return;

	for (i = 0; i < size; i++) {
		if (likely(p[i])) {
			page = virt_to_head_page(p[i]);

			if (!page_has_obj_cgroups(page) &&
			    memcg_alloc_page_obj_cgroups(page, s, flags)) {
				obj_cgroup_uncharge(objcg, obj_full_size(s));
				continue;
			}

			off = obj_to_index(s, page, p[i]);
			obj_cgroup_get(objcg);
			page_obj_cgroups(page)[off] = objcg;
			mod_objcg_state(objcg, page_pgdat(page),
					cache_vmstat_idx(s), obj_full_size(s));
		} else {
			obj_cgroup_uncharge(objcg, obj_full_size(s));
		}
	}
	obj_cgroup_put(objcg);
}

static inline void memcg_slab_free_hook(struct kmem_cache *s_orig,
					void **p, int objects)
{
	struct kmem_cache *s;
	struct obj_cgroup *objcg;
	struct page *page;
	unsigned int off;
	int i;

	if (!memcg_kmem_enabled())
		return;

	for (i = 0; i < objects; i++) {
		if (unlikely(!p[i]))
			continue;

		page = virt_to_head_page(p[i]);
		if (!page_has_obj_cgroups(page))
			continue;

		if (!s_orig)
			s = page->slab_cache;
		else
			s = s_orig;

		off = obj_to_index(s, page, p[i]);
		objcg = page_obj_cgroups(page)[off];
		if (!objcg)
			continue;

		page_obj_cgroups(page)[off] = NULL;
		obj_cgroup_uncharge(objcg, obj_full_size(s));
		mod_objcg_state(objcg, page_pgdat(page), cache_vmstat_idx(s),
				-obj_full_size(s));
		obj_cgroup_put(objcg);
	}
}

#else /* CONFIG_MEMCG_KMEM */
static inline bool page_has_obj_cgroups(struct page *page)
{
	return false;
}

static inline struct mem_cgroup *memcg_from_slab_obj(void *ptr)
{
	return NULL;
}

static inline int memcg_alloc_page_obj_cgroups(struct page *page,
					       struct kmem_cache *s, gfp_t gfp)
{
	return 0;
}

static inline void memcg_free_page_obj_cgroups(struct page *page)
{
}

static inline bool memcg_slab_pre_alloc_hook(struct kmem_cache *s,
					     struct obj_cgroup **objcgp,
					     size_t objects, gfp_t flags)
{
	return true;
}

static inline void memcg_slab_post_alloc_hook(struct kmem_cache *s,
					      struct obj_cgroup *objcg,
					      gfp_t flags, size_t size,
					      void **p)
{
}

static inline void memcg_slab_free_hook(struct kmem_cache *s,
					void **p, int objects)
{
}
#endif /* CONFIG_MEMCG_KMEM */

static inline struct kmem_cache *virt_to_cache(const void *obj)
{
	struct page *page;

	page = virt_to_head_page(obj);
	if (WARN_ONCE(!PageSlab(page), "%s: Object is not a Slab page!\n",
					__func__))
		return NULL;
	return page->slab_cache;
}

static __always_inline void account_slab_page(struct page *page, int order,
					      struct kmem_cache *s)
{
	mod_node_page_state(page_pgdat(page), cache_vmstat_idx(s),
			    PAGE_SIZE << order);
}

static __always_inline void unaccount_slab_page(struct page *page, int order,
						struct kmem_cache *s)
{
	if (memcg_kmem_enabled())
		memcg_free_page_obj_cgroups(page);

	mod_node_page_state(page_pgdat(page), cache_vmstat_idx(s),
			    -(PAGE_SIZE << order));
}

static inline struct kmem_cache *cache_from_obj(struct kmem_cache *s, void *x)
{
	struct kmem_cache *cachep;

	if (!IS_ENABLED(CONFIG_SLAB_FREELIST_HARDENED) &&
	    !kmem_cache_debug_flags(s, SLAB_CONSISTENCY_CHECKS))
		return s;

	cachep = virt_to_cache(x);
	if (WARN(cachep && cachep != s,
		 "%s: Wrong slab cache. %s but object is from %s\n",
		 __func__, s->name, cachep->name))
		print_tracking(cachep, x);
	return cachep;
}

static inline size_t slab_ksize(const struct kmem_cache *s)
{
#ifndef CONFIG_SLUB
	return s->object_size;

#else /* CONFIG_SLUB */
# ifdef CONFIG_SLUB_DEBUG
	/*
	 * Debugging requires use of the padding between object
	 * and whatever may come after it.
	 */
	if (s->flags & (SLAB_RED_ZONE | SLAB_POISON))
		return s->object_size;
# endif
	if (s->flags & SLAB_KASAN)
		return s->object_size;
	/*
	 * If we need to store the freelist pointer back there or track
	 * user information, then we can only use the space before that
	 * information.
	 */
	if (s->flags & (SLAB_TYPESAFE_BY_RCU | SLAB_STORE_USER))
		return s->inuse;
	/*
	 * Else we can use all the padding etc for the allocation.
	 */
	return s->size;
#endif
}
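
/*
 * ksize()-style queries build on this helper; a hedged sketch of how a
 * pointer's usable size could be derived (the real __ksize() lives in the
 * allocator implementations and also handles large/compound pages):
 *
 *	struct kmem_cache *c = virt_to_cache(ptr);
 *
 *	usable = c ? slab_ksize(c) : 0;
 */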

static inline struct kmem_cache *slab_pre_alloc_hook(struct kmem_cache *s,
						     struct obj_cgroup **objcgp,
						     size_t size, gfp_t flags)
{
	flags &= gfp_allowed_mask;

	fs_reclaim_acquire(flags);
	fs_reclaim_release(flags);

	might_sleep_if(gfpflags_allow_blocking(flags));

	if (should_failslab(s, flags))
		return NULL;

	if (!memcg_slab_pre_alloc_hook(s, objcgp, size, flags))
		return NULL;

	return s;
}

static inline void slab_post_alloc_hook(struct kmem_cache *s,
					struct obj_cgroup *objcg, gfp_t flags,
					size_t size, void **p, bool init)
{
	size_t i;

	flags &= gfp_allowed_mask;

	/*
	 * As memory initialization might be integrated into KASAN,
	 * kasan_slab_alloc and initialization memset must be
	 * kept together to avoid discrepancies in behavior.
	 *
	 * As p[i] might get tagged, memset and kmemleak hook come after KASAN.
	 */
	for (i = 0; i < size; i++) {
		p[i] = kasan_slab_alloc(s, p[i], flags, init);
		if (p[i] && init && !kasan_has_integrated_init())
			memset(p[i], 0, s->object_size);
		kmemleak_alloc_recursive(p[i], s->object_size, 1,
					 s->flags, flags);
	}

	memcg_slab_post_alloc_hook(s, objcg, flags, size, p);
}
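
/*
 * How an allocator's fast path is expected to bracket an allocation with
 * these hooks (a sketch only; see the slab_alloc_node() paths in the
 * SLAB/SLUB code for the real sequence):
 *
 *	struct obj_cgroup *objcg = NULL;
 *
 *	s = slab_pre_alloc_hook(s, &objcg, 1, gfpflags);
 *	if (!s)
 *		return NULL;
 *	...grab an object into obj...
 *	slab_post_alloc_hook(s, objcg, gfpflags, 1, &obj,
 *			     slab_want_init_on_alloc(gfpflags, s));
 *	return obj;
 */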

#ifndef CONFIG_SLOB
/*
 * The slab lists for all objects.
 */
struct kmem_cache_node {
	spinlock_t list_lock;

#ifdef CONFIG_SLAB
	struct list_head slabs_partial;	/* partial list first, better asm code */
	struct list_head slabs_full;
	struct list_head slabs_free;
	unsigned long total_slabs;	/* length of all slab lists */
	unsigned long free_slabs;	/* length of free slab list only */
	unsigned long free_objects;
	unsigned int free_limit;
	unsigned int colour_next;	/* Per-node cache coloring */
	struct array_cache *shared;	/* shared per node */
	struct alien_cache **alien;	/* on other nodes */
	unsigned long next_reap;	/* updated without locking */
	int free_touched;		/* updated without locking */
#endif

#ifdef CONFIG_SLUB
	unsigned long nr_partial;
	struct list_head partial;
#ifdef CONFIG_SLUB_DEBUG
	atomic_long_t nr_slabs;
	atomic_long_t total_objects;
	struct list_head full;
#endif
#endif

};

static inline struct kmem_cache_node *get_node(struct kmem_cache *s, int node)
{
	return s->node[node];
}

/*
 * Iterator over all nodes. The body will be executed for each node that has
 * a kmem_cache_node structure allocated (which is true for all online nodes).
 */
#define for_each_kmem_cache_node(__s, __node, __n) \
	for (__node = 0; __node < nr_node_ids; __node++) \
		 if ((__n = get_node(__s, __node)))
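
/*
 * Example use of the iterator (a sketch, mirroring how the SLUB code walks
 * per-node state):
 *
 *	struct kmem_cache_node *n;
 *	unsigned long nr_partial = 0;
 *	int node;
 *
 *	for_each_kmem_cache_node(s, node, n)
 *		nr_partial += n->nr_partial;
 */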

#endif

void *slab_start(struct seq_file *m, loff_t *pos);
void *slab_next(struct seq_file *m, void *p, loff_t *pos);
void slab_stop(struct seq_file *m, void *p);
int memcg_slab_show(struct seq_file *m, void *p);

#if defined(CONFIG_SLAB) || defined(CONFIG_SLUB_DEBUG)
void dump_unreclaimable_slab(void);
#else
static inline void dump_unreclaimable_slab(void)
{
}
#endif

void ___cache_free(struct kmem_cache *cache, void *x, unsigned long addr);

#ifdef CONFIG_SLAB_FREELIST_RANDOM
int cache_random_seq_create(struct kmem_cache *cachep, unsigned int count,
			gfp_t gfp);
void cache_random_seq_destroy(struct kmem_cache *cachep);
#else
static inline int cache_random_seq_create(struct kmem_cache *cachep,
					unsigned int count, gfp_t gfp)
{
	return 0;
}
static inline void cache_random_seq_destroy(struct kmem_cache *cachep) { }
#endif /* CONFIG_SLAB_FREELIST_RANDOM */

static inline bool slab_want_init_on_alloc(gfp_t flags, struct kmem_cache *c)
{
	if (static_branch_unlikely(&init_on_alloc)) {
		if (c->ctor)
			return false;
		if (c->flags & (SLAB_TYPESAFE_BY_RCU | SLAB_POISON))
			return flags & __GFP_ZERO;
		return true;
	}
	return flags & __GFP_ZERO;
}

static inline bool slab_want_init_on_free(struct kmem_cache *c)
{
	if (static_branch_unlikely(&init_on_free))
		return !(c->ctor ||
			 (c->flags & (SLAB_TYPESAFE_BY_RCU | SLAB_POISON)));
	return false;
}
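
/*
 * Net effect (illustrative): with init_on_alloc enabled, kmalloc(64, GFP_KERNEL)
 * returns zeroed memory even without __GFP_ZERO, unless the backing cache has a
 * constructor or is SLAB_TYPESAFE_BY_RCU/SLAB_POISON, in which case zeroing
 * only happens when the caller passes __GFP_ZERO.
 */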

#if defined(CONFIG_DEBUG_FS) && defined(CONFIG_SLUB_DEBUG)
void debugfs_slab_release(struct kmem_cache *);
#else
static inline void debugfs_slab_release(struct kmem_cache *s) { }
#endif

#endif /* MM_SLAB_H */