xref: /linux/mm/percpu-km.c (revision 4ba24fef3eb3b142197135223b90ced2f319cd53)
/*
 * mm/percpu-km.c - kernel memory based chunk allocation
 *
 * Copyright (C) 2010		SUSE Linux Products GmbH
 * Copyright (C) 2010		Tejun Heo <tj@kernel.org>
 *
 * This file is released under the GPLv2.
 *
 * Chunks are allocated as contiguous kernel memory using gfp
 * allocation.  This is to be used on nommu architectures.
 *
 * To use percpu-km,
 *
 * - define CONFIG_NEED_PER_CPU_KM from the arch Kconfig.
 *
 * - CONFIG_NEED_PER_CPU_PAGE_FIRST_CHUNK must not be defined.  It's
 *   not compatible with PER_CPU_KM.  EMBED_FIRST_CHUNK should work
 *   fine.
 *
 * - NUMA is not supported.  When setting up the first chunk,
 *   @cpu_distance_fn should be NULL or report all CPUs to be nearer
 *   than or at LOCAL_DISTANCE.
 *
 * - It's best if the chunk size is a power-of-two multiple of
 *   PAGE_SIZE.  Because each chunk is allocated as a contiguous
 *   kernel memory block using alloc_pages(), memory will be wasted if
 *   chunk size is not aligned.  percpu-km code will whine about it.
 */
29b0c9778bSTejun Heo 
/*
 * Build-time sanity check: refuse to compile this allocator on SMP
 * configurations that also request a page-based first chunk.
 */
#if defined(CONFIG_SMP) && defined(CONFIG_NEED_PER_CPU_PAGE_FIRST_CHUNK)
#error "contiguous percpu allocation is incompatible with paged first chunk"
#endif
33b0c9778bSTejun Heo 
34b0c9778bSTejun Heo #include <linux/log2.h>
35b0c9778bSTejun Heo 
/**
 * pcpu_populate_chunk - populate a page range of a chunk (no-op)
 * @chunk: chunk of interest (unused)
 * @page_start: start of the page range (unused)
 * @page_end: end of the page range (unused)
 *
 * pcpu_create_chunk() in this file allocates all pages of a chunk up
 * front and marks the whole chunk populated, so there is nothing to do
 * here.
 *
 * RETURNS:
 * Always 0.
 */
static int pcpu_populate_chunk(struct pcpu_chunk *chunk,
			       int page_start, int page_end)
{
	return 0;
}
41b0c9778bSTejun Heo 
/**
 * pcpu_depopulate_chunk - depopulate a page range of a chunk (no-op)
 * @chunk: chunk of interest (unused)
 * @page_start: start of the page range (unused)
 * @page_end: end of the page range (unused)
 *
 * Nothing is released here; the pages backing a chunk are freed as a
 * whole by pcpu_destroy_chunk().
 */
static void pcpu_depopulate_chunk(struct pcpu_chunk *chunk,
				  int page_start, int page_end)
{
	/* nada */
}
47b0c9778bSTejun Heo 
48b0c9778bSTejun Heo static struct pcpu_chunk *pcpu_create_chunk(void)
49b0c9778bSTejun Heo {
50b0c9778bSTejun Heo 	const int nr_pages = pcpu_group_sizes[0] >> PAGE_SHIFT;
51b0c9778bSTejun Heo 	struct pcpu_chunk *chunk;
52b0c9778bSTejun Heo 	struct page *pages;
53b0c9778bSTejun Heo 	int i;
54b0c9778bSTejun Heo 
55b0c9778bSTejun Heo 	chunk = pcpu_alloc_chunk();
56b0c9778bSTejun Heo 	if (!chunk)
57b0c9778bSTejun Heo 		return NULL;
58b0c9778bSTejun Heo 
59b0c9778bSTejun Heo 	pages = alloc_pages(GFP_KERNEL, order_base_2(nr_pages));
60b0c9778bSTejun Heo 	if (!pages) {
61b0c9778bSTejun Heo 		pcpu_free_chunk(chunk);
62b0c9778bSTejun Heo 		return NULL;
63b0c9778bSTejun Heo 	}
64b0c9778bSTejun Heo 
65b0c9778bSTejun Heo 	for (i = 0; i < nr_pages; i++)
66b0c9778bSTejun Heo 		pcpu_set_page_chunk(nth_page(pages, i), chunk);
67b0c9778bSTejun Heo 
68b0c9778bSTejun Heo 	chunk->data = pages;
69b0c9778bSTejun Heo 	chunk->base_addr = page_address(pages) - pcpu_group_offsets[0];
70a63d4ac4STejun Heo 
71b38d08f3STejun Heo 	spin_lock_irq(&pcpu_lock);
72*b539b87fSTejun Heo 	pcpu_chunk_populated(chunk, 0, nr_pages);
73b38d08f3STejun Heo 	spin_unlock_irq(&pcpu_lock);
74a63d4ac4STejun Heo 
75b0c9778bSTejun Heo 	return chunk;
76b0c9778bSTejun Heo }
77b0c9778bSTejun Heo 
78b0c9778bSTejun Heo static void pcpu_destroy_chunk(struct pcpu_chunk *chunk)
79b0c9778bSTejun Heo {
80b0c9778bSTejun Heo 	const int nr_pages = pcpu_group_sizes[0] >> PAGE_SHIFT;
81b0c9778bSTejun Heo 
82b0c9778bSTejun Heo 	if (chunk && chunk->data)
83b0c9778bSTejun Heo 		__free_pages(chunk->data, order_base_2(nr_pages));
84b0c9778bSTejun Heo 	pcpu_free_chunk(chunk);
85b0c9778bSTejun Heo }
86b0c9778bSTejun Heo 
/**
 * pcpu_addr_to_page - translate an address to its struct page
 * @addr: address to translate
 *
 * RETURNS:
 * The result of virt_to_page() on @addr.
 */
static struct page *pcpu_addr_to_page(void *addr)
{
	return virt_to_page(addr);
}
91b0c9778bSTejun Heo 
92b0c9778bSTejun Heo static int __init pcpu_verify_alloc_info(const struct pcpu_alloc_info *ai)
93b0c9778bSTejun Heo {
94b0c9778bSTejun Heo 	size_t nr_pages, alloc_pages;
95b0c9778bSTejun Heo 
96b0c9778bSTejun Heo 	/* all units must be in a single group */
97b0c9778bSTejun Heo 	if (ai->nr_groups != 1) {
98b0c9778bSTejun Heo 		printk(KERN_CRIT "percpu: can't handle more than one groups\n");
99b0c9778bSTejun Heo 		return -EINVAL;
100b0c9778bSTejun Heo 	}
101b0c9778bSTejun Heo 
102b0c9778bSTejun Heo 	nr_pages = (ai->groups[0].nr_units * ai->unit_size) >> PAGE_SHIFT;
103b0c9778bSTejun Heo 	alloc_pages = roundup_pow_of_two(nr_pages);
104b0c9778bSTejun Heo 
105b0c9778bSTejun Heo 	if (alloc_pages > nr_pages)
106b0c9778bSTejun Heo 		printk(KERN_WARNING "percpu: wasting %zu pages per chunk\n",
107b0c9778bSTejun Heo 		       alloc_pages - nr_pages);
108b0c9778bSTejun Heo 
109b0c9778bSTejun Heo 	return 0;
110b0c9778bSTejun Heo }
111