xref: /linux/mm/percpu-internal.h (revision cdd5b5a9761fd66d17586e4f4ba6588c70e640ea)
1b2441318SGreg Kroah-Hartman /* SPDX-License-Identifier: GPL-2.0 */
28fa3ed80SDennis Zhou #ifndef _MM_PERCPU_INTERNAL_H
38fa3ed80SDennis Zhou #define _MM_PERCPU_INTERNAL_H
48fa3ed80SDennis Zhou 
58fa3ed80SDennis Zhou #include <linux/types.h>
68fa3ed80SDennis Zhou #include <linux/percpu.h>
72ef8ed7dSYafang Shao #include <linux/memcontrol.h>
88fa3ed80SDennis Zhou 
9ca460b3cSDennis Zhou (Facebook) /*
10ca460b3cSDennis Zhou (Facebook)  * pcpu_block_md is the metadata block struct.
11ca460b3cSDennis Zhou (Facebook)  * Each chunk's bitmap is split into a number of full blocks.
12ca460b3cSDennis Zhou (Facebook)  * All units are in terms of bits.
13382b88e9SDennis Zhou  *
14382b88e9SDennis Zhou  * The scan hint is the largest known contiguous area before the contig hint.
15382b88e9SDennis Zhou  * It is not necessarily the actual largest contig hint though.  There is an
16382b88e9SDennis Zhou  * invariant that the scan_hint_start > contig_hint_start iff
17382b88e9SDennis Zhou  * scan_hint == contig_hint.  This is necessary because when scanning forward,
18382b88e9SDennis Zhou  * we don't know if a new contig hint would be better than the current one.
19ca460b3cSDennis Zhou (Facebook)  */
20ca460b3cSDennis Zhou (Facebook) struct pcpu_block_md {
21382b88e9SDennis Zhou 	int			scan_hint;	/* scan hint for block */
22382b88e9SDennis Zhou 	int			scan_hint_start; /* block relative starting
23382b88e9SDennis Zhou 						    position of the scan hint */
24ca460b3cSDennis Zhou (Facebook) 	int                     contig_hint;    /* contig hint for block */
25ca460b3cSDennis Zhou (Facebook) 	int                     contig_hint_start; /* block relative starting
26ca460b3cSDennis Zhou (Facebook) 						      position of the contig hint */
27ca460b3cSDennis Zhou (Facebook) 	int                     left_free;      /* size of free space along
28ca460b3cSDennis Zhou (Facebook) 						   the left side of the block */
29ca460b3cSDennis Zhou (Facebook) 	int                     right_free;     /* size of free space along
30ca460b3cSDennis Zhou (Facebook) 						   the right side of the block */
31ca460b3cSDennis Zhou (Facebook) 	int                     first_free;     /* block position of first free */
32047924c9SDennis Zhou 	int			nr_bits;	/* total bits responsible for */
33ca460b3cSDennis Zhou (Facebook) };
34ca460b3cSDennis Zhou (Facebook) 
358fa3ed80SDennis Zhou struct pcpu_chunk {
3630a5b536SDennis Zhou #ifdef CONFIG_PERCPU_STATS
3730a5b536SDennis Zhou 	int			nr_alloc;	/* # of allocations */
3830a5b536SDennis Zhou 	size_t			max_alloc_size; /* largest allocation size */
3930a5b536SDennis Zhou #endif
4030a5b536SDennis Zhou 
418fa3ed80SDennis Zhou 	struct list_head	list;		/* linked to pcpu_slot lists */
4240064aecSDennis Zhou (Facebook) 	int			free_bytes;	/* free bytes in the chunk */
4392c14cabSDennis Zhou 	struct pcpu_block_md	chunk_md;
44*3a6358c0SYu Ma 	unsigned long		*bound_map;	/* boundary map */
45*3a6358c0SYu Ma 
46*3a6358c0SYu Ma 	/*
47*3a6358c0SYu Ma 	 * base_addr is the base address of this chunk.
48*3a6358c0SYu Ma 	 * To reduce false sharing, current layout is optimized to make sure
49*3a6358c0SYu Ma 	 * base_addr locate in the different cacheline with free_bytes and
50*3a6358c0SYu Ma 	 * chunk_md.
51*3a6358c0SYu Ma 	 */
52*3a6358c0SYu Ma 	void			*base_addr ____cacheline_aligned_in_smp;
538fa3ed80SDennis Zhou 
5440064aecSDennis Zhou (Facebook) 	unsigned long		*alloc_map;	/* allocation map */
55ca460b3cSDennis Zhou (Facebook) 	struct pcpu_block_md	*md_blocks;	/* metadata blocks */
568fa3ed80SDennis Zhou 
578fa3ed80SDennis Zhou 	void			*data;		/* chunk data */
588fa3ed80SDennis Zhou 	bool			immutable;	/* no [de]population allowed */
59f1833241SRoman Gushchin 	bool			isolated;	/* isolated from active chunk
60f1833241SRoman Gushchin 						   slots */
61e2266705SDennis Zhou (Facebook) 	int			start_offset;	/* the overlap with the previous
62e2266705SDennis Zhou (Facebook) 						   region to have a page aligned
63e2266705SDennis Zhou (Facebook) 						   base_addr */
646b9d7c8eSDennis Zhou (Facebook) 	int			end_offset;	/* additional area required to
656b9d7c8eSDennis Zhou (Facebook) 						   have the region end page
666b9d7c8eSDennis Zhou (Facebook) 						   aligned */
673c7be18aSRoman Gushchin #ifdef CONFIG_MEMCG_KMEM
683c7be18aSRoman Gushchin 	struct obj_cgroup	**obj_cgroups;	/* vector of object cgroups */
693c7be18aSRoman Gushchin #endif
70c0ebfdc3SDennis Zhou (Facebook) 
71c0ebfdc3SDennis Zhou (Facebook) 	int			nr_pages;	/* # of pages served by this chunk */
728fa3ed80SDennis Zhou 	int			nr_populated;	/* # of populated pages */
730cecf50cSDennis Zhou (Facebook) 	int                     nr_empty_pop_pages; /* # of empty populated pages */
748fa3ed80SDennis Zhou 	unsigned long		populated[];	/* populated bitmap */
758fa3ed80SDennis Zhou };
768fa3ed80SDennis Zhou 
778fa3ed80SDennis Zhou extern spinlock_t pcpu_lock;
788fa3ed80SDennis Zhou 
793c7be18aSRoman Gushchin extern struct list_head *pcpu_chunk_lists;
808fa3ed80SDennis Zhou extern int pcpu_nr_slots;
81f1833241SRoman Gushchin extern int pcpu_sidelined_slot;
82f1833241SRoman Gushchin extern int pcpu_to_depopulate_slot;
83faf65ddeSRoman Gushchin extern int pcpu_nr_empty_pop_pages;
848fa3ed80SDennis Zhou 
858fa3ed80SDennis Zhou extern struct pcpu_chunk *pcpu_first_chunk;
868fa3ed80SDennis Zhou extern struct pcpu_chunk *pcpu_reserved_chunk;
878fa3ed80SDennis Zhou 
8840064aecSDennis Zhou (Facebook) /**
89ca460b3cSDennis Zhou (Facebook)  * pcpu_chunk_nr_blocks - converts nr_pages to # of md_blocks
90ca460b3cSDennis Zhou (Facebook)  * @chunk: chunk of interest
91ca460b3cSDennis Zhou (Facebook)  *
92ca460b3cSDennis Zhou (Facebook)  * This conversion is from the number of physical pages that the chunk
93ca460b3cSDennis Zhou (Facebook)  * serves to the number of bitmap blocks used.
94ca460b3cSDennis Zhou (Facebook)  */
pcpu_chunk_nr_blocks(struct pcpu_chunk * chunk)95ca460b3cSDennis Zhou (Facebook) static inline int pcpu_chunk_nr_blocks(struct pcpu_chunk *chunk)
96ca460b3cSDennis Zhou (Facebook) {
97ca460b3cSDennis Zhou (Facebook) 	return chunk->nr_pages * PAGE_SIZE / PCPU_BITMAP_BLOCK_SIZE;
98ca460b3cSDennis Zhou (Facebook) }
99ca460b3cSDennis Zhou (Facebook) 
100ca460b3cSDennis Zhou (Facebook) /**
10140064aecSDennis Zhou (Facebook)  * pcpu_nr_pages_to_map_bits - converts the pages to size of bitmap
10240064aecSDennis Zhou (Facebook)  * @pages: number of physical pages
10340064aecSDennis Zhou (Facebook)  *
10440064aecSDennis Zhou (Facebook)  * This conversion is from physical pages to the number of bits
10540064aecSDennis Zhou (Facebook)  * required in the bitmap.
10640064aecSDennis Zhou (Facebook)  */
pcpu_nr_pages_to_map_bits(int pages)10740064aecSDennis Zhou (Facebook) static inline int pcpu_nr_pages_to_map_bits(int pages)
10840064aecSDennis Zhou (Facebook) {
10940064aecSDennis Zhou (Facebook) 	return pages * PAGE_SIZE / PCPU_MIN_ALLOC_SIZE;
11040064aecSDennis Zhou (Facebook) }
11140064aecSDennis Zhou (Facebook) 
11240064aecSDennis Zhou (Facebook) /**
11340064aecSDennis Zhou (Facebook)  * pcpu_chunk_map_bits - helper to convert nr_pages to size of bitmap
11440064aecSDennis Zhou (Facebook)  * @chunk: chunk of interest
11540064aecSDennis Zhou (Facebook)  *
11640064aecSDennis Zhou (Facebook)  * This conversion is from the number of physical pages that the chunk
11740064aecSDennis Zhou (Facebook)  * serves to the number of bits in the bitmap.
11840064aecSDennis Zhou (Facebook)  */
pcpu_chunk_map_bits(struct pcpu_chunk * chunk)11940064aecSDennis Zhou (Facebook) static inline int pcpu_chunk_map_bits(struct pcpu_chunk *chunk)
12040064aecSDennis Zhou (Facebook) {
12140064aecSDennis Zhou (Facebook) 	return pcpu_nr_pages_to_map_bits(chunk->nr_pages);
12240064aecSDennis Zhou (Facebook) }
12340064aecSDennis Zhou (Facebook) 
1248c57c077SQi Zheng /**
1258c57c077SQi Zheng  * pcpu_obj_full_size - helper to calculate size of each accounted object
1268c57c077SQi Zheng  * @size: size of area to allocate in bytes
1278c57c077SQi Zheng  *
1288c57c077SQi Zheng  * For each accounted object there is an extra space which is used to store
1292ef8ed7dSYafang Shao  * obj_cgroup membership if kmemcg is not disabled. Charge it too.
1308c57c077SQi Zheng  */
pcpu_obj_full_size(size_t size)1318c57c077SQi Zheng static inline size_t pcpu_obj_full_size(size_t size)
1328c57c077SQi Zheng {
133f67bed13SVasily Averin 	size_t extra_size = 0;
1348c57c077SQi Zheng 
135f67bed13SVasily Averin #ifdef CONFIG_MEMCG_KMEM
1362ef8ed7dSYafang Shao 	if (!mem_cgroup_kmem_disabled())
137f67bed13SVasily Averin 		extra_size += size / PCPU_MIN_ALLOC_SIZE * sizeof(struct obj_cgroup *);
138f67bed13SVasily Averin #endif
1398c57c077SQi Zheng 
1408c57c077SQi Zheng 	return size * num_possible_cpus() + extra_size;
1418c57c077SQi Zheng }
1428c57c077SQi Zheng 
14330a5b536SDennis Zhou #ifdef CONFIG_PERCPU_STATS
14430a5b536SDennis Zhou 
14530a5b536SDennis Zhou #include <linux/spinlock.h>
14630a5b536SDennis Zhou 
14730a5b536SDennis Zhou struct percpu_stats {
14830a5b536SDennis Zhou 	u64 nr_alloc;		/* lifetime # of allocations */
14930a5b536SDennis Zhou 	u64 nr_dealloc;		/* lifetime # of deallocations */
15030a5b536SDennis Zhou 	u64 nr_cur_alloc;	/* current # of allocations */
15130a5b536SDennis Zhou 	u64 nr_max_alloc;	/* max # of live allocations */
15230a5b536SDennis Zhou 	u32 nr_chunks;		/* current # of live chunks */
15330a5b536SDennis Zhou 	u32 nr_max_chunks;	/* max # of live chunks */
154f0953a1bSIngo Molnar 	size_t min_alloc_size;	/* min allocation size */
15530a5b536SDennis Zhou 	size_t max_alloc_size;	/* max allocation size */
15630a5b536SDennis Zhou };
15730a5b536SDennis Zhou 
15830a5b536SDennis Zhou extern struct percpu_stats pcpu_stats;
15930a5b536SDennis Zhou extern struct pcpu_alloc_info pcpu_stats_ai;
16030a5b536SDennis Zhou 
16130a5b536SDennis Zhou /*
16230a5b536SDennis Zhou  * For debug purposes. We don't care about the flexible array.
16330a5b536SDennis Zhou  */
pcpu_stats_save_ai(const struct pcpu_alloc_info * ai)16430a5b536SDennis Zhou static inline void pcpu_stats_save_ai(const struct pcpu_alloc_info *ai)
16530a5b536SDennis Zhou {
16630a5b536SDennis Zhou 	memcpy(&pcpu_stats_ai, ai, sizeof(struct pcpu_alloc_info));
16730a5b536SDennis Zhou 
16830a5b536SDennis Zhou 	/* initialize min_alloc_size to unit_size */
16930a5b536SDennis Zhou 	pcpu_stats.min_alloc_size = pcpu_stats_ai.unit_size;
17030a5b536SDennis Zhou }
17130a5b536SDennis Zhou 
17230a5b536SDennis Zhou /*
17330a5b536SDennis Zhou  * pcpu_stats_area_alloc - increment area allocation stats
17430a5b536SDennis Zhou  * @chunk: the location of the area being allocated
17530a5b536SDennis Zhou  * @size: size of area to allocate in bytes
17630a5b536SDennis Zhou  *
17730a5b536SDennis Zhou  * CONTEXT:
17830a5b536SDennis Zhou  * pcpu_lock.
17930a5b536SDennis Zhou  */
pcpu_stats_area_alloc(struct pcpu_chunk * chunk,size_t size)18030a5b536SDennis Zhou static inline void pcpu_stats_area_alloc(struct pcpu_chunk *chunk, size_t size)
18130a5b536SDennis Zhou {
18230a5b536SDennis Zhou 	lockdep_assert_held(&pcpu_lock);
18330a5b536SDennis Zhou 
18430a5b536SDennis Zhou 	pcpu_stats.nr_alloc++;
18530a5b536SDennis Zhou 	pcpu_stats.nr_cur_alloc++;
18630a5b536SDennis Zhou 	pcpu_stats.nr_max_alloc =
18730a5b536SDennis Zhou 		max(pcpu_stats.nr_max_alloc, pcpu_stats.nr_cur_alloc);
18830a5b536SDennis Zhou 	pcpu_stats.min_alloc_size =
18930a5b536SDennis Zhou 		min(pcpu_stats.min_alloc_size, size);
19030a5b536SDennis Zhou 	pcpu_stats.max_alloc_size =
19130a5b536SDennis Zhou 		max(pcpu_stats.max_alloc_size, size);
19230a5b536SDennis Zhou 
19330a5b536SDennis Zhou 	chunk->nr_alloc++;
19430a5b536SDennis Zhou 	chunk->max_alloc_size = max(chunk->max_alloc_size, size);
19530a5b536SDennis Zhou }
19630a5b536SDennis Zhou 
19730a5b536SDennis Zhou /*
19830a5b536SDennis Zhou  * pcpu_stats_area_dealloc - decrement allocation stats
19930a5b536SDennis Zhou  * @chunk: the location of the area being deallocated
20030a5b536SDennis Zhou  *
20130a5b536SDennis Zhou  * CONTEXT:
20230a5b536SDennis Zhou  * pcpu_lock.
20330a5b536SDennis Zhou  */
pcpu_stats_area_dealloc(struct pcpu_chunk * chunk)20430a5b536SDennis Zhou static inline void pcpu_stats_area_dealloc(struct pcpu_chunk *chunk)
20530a5b536SDennis Zhou {
20630a5b536SDennis Zhou 	lockdep_assert_held(&pcpu_lock);
20730a5b536SDennis Zhou 
20830a5b536SDennis Zhou 	pcpu_stats.nr_dealloc++;
20930a5b536SDennis Zhou 	pcpu_stats.nr_cur_alloc--;
21030a5b536SDennis Zhou 
21130a5b536SDennis Zhou 	chunk->nr_alloc--;
21230a5b536SDennis Zhou }
21330a5b536SDennis Zhou 
21430a5b536SDennis Zhou /*
21530a5b536SDennis Zhou  * pcpu_stats_chunk_alloc - increment chunk stats
21630a5b536SDennis Zhou  */
pcpu_stats_chunk_alloc(void)21730a5b536SDennis Zhou static inline void pcpu_stats_chunk_alloc(void)
21830a5b536SDennis Zhou {
219303abfdfSDennis Zhou 	unsigned long flags;
220303abfdfSDennis Zhou 	spin_lock_irqsave(&pcpu_lock, flags);
22130a5b536SDennis Zhou 
22230a5b536SDennis Zhou 	pcpu_stats.nr_chunks++;
22330a5b536SDennis Zhou 	pcpu_stats.nr_max_chunks =
22430a5b536SDennis Zhou 		max(pcpu_stats.nr_max_chunks, pcpu_stats.nr_chunks);
22530a5b536SDennis Zhou 
226303abfdfSDennis Zhou 	spin_unlock_irqrestore(&pcpu_lock, flags);
22730a5b536SDennis Zhou }
22830a5b536SDennis Zhou 
22930a5b536SDennis Zhou /*
23030a5b536SDennis Zhou  * pcpu_stats_chunk_dealloc - decrement chunk stats
23130a5b536SDennis Zhou  */
pcpu_stats_chunk_dealloc(void)23230a5b536SDennis Zhou static inline void pcpu_stats_chunk_dealloc(void)
23330a5b536SDennis Zhou {
234303abfdfSDennis Zhou 	unsigned long flags;
235303abfdfSDennis Zhou 	spin_lock_irqsave(&pcpu_lock, flags);
23630a5b536SDennis Zhou 
23730a5b536SDennis Zhou 	pcpu_stats.nr_chunks--;
23830a5b536SDennis Zhou 
239303abfdfSDennis Zhou 	spin_unlock_irqrestore(&pcpu_lock, flags);
24030a5b536SDennis Zhou }
24130a5b536SDennis Zhou 
24230a5b536SDennis Zhou #else
24330a5b536SDennis Zhou 
pcpu_stats_save_ai(const struct pcpu_alloc_info * ai)24430a5b536SDennis Zhou static inline void pcpu_stats_save_ai(const struct pcpu_alloc_info *ai)
24530a5b536SDennis Zhou {
24630a5b536SDennis Zhou }
24730a5b536SDennis Zhou 
pcpu_stats_area_alloc(struct pcpu_chunk * chunk,size_t size)24830a5b536SDennis Zhou static inline void pcpu_stats_area_alloc(struct pcpu_chunk *chunk, size_t size)
24930a5b536SDennis Zhou {
25030a5b536SDennis Zhou }
25130a5b536SDennis Zhou 
pcpu_stats_area_dealloc(struct pcpu_chunk * chunk)25230a5b536SDennis Zhou static inline void pcpu_stats_area_dealloc(struct pcpu_chunk *chunk)
25330a5b536SDennis Zhou {
25430a5b536SDennis Zhou }
25530a5b536SDennis Zhou 
pcpu_stats_chunk_alloc(void)25630a5b536SDennis Zhou static inline void pcpu_stats_chunk_alloc(void)
25730a5b536SDennis Zhou {
25830a5b536SDennis Zhou }
25930a5b536SDennis Zhou 
pcpu_stats_chunk_dealloc(void)26030a5b536SDennis Zhou static inline void pcpu_stats_chunk_dealloc(void)
26130a5b536SDennis Zhou {
26230a5b536SDennis Zhou }
26330a5b536SDennis Zhou 
26430a5b536SDennis Zhou #endif /* !CONFIG_PERCPU_STATS */
26530a5b536SDennis Zhou 
2668fa3ed80SDennis Zhou #endif
267