// SPDX-License-Identifier: GPL-2.0
/* Test selecting other page sizes for mmap/shmget.

   Before running this test, huge pages must have been reserved for each
   huge page size.
   For large pages beyond MAX_ORDER (like 1GB on x86) boot options must be used.
   Also shmmax must be increased.
   And you need to run as root to work around some weird permissions in shm.
   And nothing else using huge pages should run in parallel.
   When the program aborts you may need to clean up the shm segments with
   ipcrm -m by hand, like this
   sudo ipcs | awk '$1 == "0x00000000" {print $2}' | xargs -n1 sudo ipcrm -m
   (warning: this will remove all such segments, even if someone else uses them) */
14*4882a593Smuzhiyun
15*4882a593Smuzhiyun #define _GNU_SOURCE 1
16*4882a593Smuzhiyun #include <sys/mman.h>
17*4882a593Smuzhiyun #include <stdlib.h>
18*4882a593Smuzhiyun #include <stdio.h>
19*4882a593Smuzhiyun #include <sys/ipc.h>
20*4882a593Smuzhiyun #include <sys/shm.h>
21*4882a593Smuzhiyun #include <sys/stat.h>
22*4882a593Smuzhiyun #include <glob.h>
23*4882a593Smuzhiyun #include <assert.h>
24*4882a593Smuzhiyun #include <unistd.h>
25*4882a593Smuzhiyun #include <stdarg.h>
26*4882a593Smuzhiyun #include <string.h>
27*4882a593Smuzhiyun
/* Print the failing call's errno message via perror() and exit with status 1. */
#define err(x) (perror(x), exit(1))

/*
 * mmap() huge page size selection: the log2 of the requested page size is
 * placed in the flag bits starting at MAP_HUGE_SHIFT.  Every definition is
 * guarded so that a libc which already provides it does not cause a
 * redefinition conflict.
 */
#ifndef MAP_HUGE_SHIFT
#define MAP_HUGE_SHIFT 26
#endif
#ifndef MAP_HUGE_MASK
#define MAP_HUGE_MASK 0x3f
#endif
#ifndef MAP_HUGE_2MB
#define MAP_HUGE_2MB (21 << MAP_HUGE_SHIFT)
#endif
#ifndef MAP_HUGE_1GB
#define MAP_HUGE_1GB (30 << MAP_HUGE_SHIFT)
#endif
#if !defined(MAP_HUGETLB)
#define MAP_HUGETLB 0x40000
#endif

/* Same encoding for shmget() flags. */
#ifndef SHM_HUGETLB
#define SHM_HUGETLB 04000 /* segment will use huge TLB pages */
#endif
#ifndef SHM_HUGE_SHIFT
#define SHM_HUGE_SHIFT 26
#endif
#ifndef SHM_HUGE_MASK
#define SHM_HUGE_MASK 0x3f
#endif
#ifndef SHM_HUGE_2MB
#define SHM_HUGE_2MB (21 << SHM_HUGE_SHIFT)
#endif
#ifndef SHM_HUGE_1GB
#define SHM_HUGE_1GB (30 << SHM_HUGE_SHIFT)
#endif

/* Capacity of page_sizes[]: the most distinct huge page sizes we can track. */
#define NUM_PAGESIZES 5

/* Number of pages of each size that every test maps and touches. */
#define NUM_PAGES 4

/* Debug tracing, compiled out; expand to printf(__VA_ARGS__) to enable. */
#define Dprintf(...) /* printf(__VA_ARGS__) */

/* Huge page sizes in bytes, filled in by find_pagesizes(). */
unsigned long page_sizes[NUM_PAGESIZES];
/* Number of valid entries in page_sizes[]. */
int num_page_sizes;
52*4882a593Smuzhiyun
/*
 * Return log2 of v rounded up, i.e. the smallest l with (1UL << l) >= v.
 * Values 0 and 1 both yield 0.
 *
 * The result is computed by counting the bits of v - 1 rather than by
 * growing (1UL << l), so no shift by the full width of unsigned long
 * (undefined behaviour) can occur for values above the top power of two.
 */
int ilog2(unsigned long v)
{
	int l = 0;

	if (v <= 1)
		return 0;

	/* ceil(log2(v)) equals the bit length of v - 1 */
	for (v--; v != 0; v >>= 1)
		l++;

	return l;
}
60*4882a593Smuzhiyun
find_pagesizes(void)61*4882a593Smuzhiyun void find_pagesizes(void)
62*4882a593Smuzhiyun {
63*4882a593Smuzhiyun glob_t g;
64*4882a593Smuzhiyun int i;
65*4882a593Smuzhiyun glob("/sys/kernel/mm/hugepages/hugepages-*kB", 0, NULL, &g);
66*4882a593Smuzhiyun assert(g.gl_pathc <= NUM_PAGESIZES);
67*4882a593Smuzhiyun for (i = 0; i < g.gl_pathc; i++) {
68*4882a593Smuzhiyun sscanf(g.gl_pathv[i], "/sys/kernel/mm/hugepages/hugepages-%lukB",
69*4882a593Smuzhiyun &page_sizes[i]);
70*4882a593Smuzhiyun page_sizes[i] <<= 10;
71*4882a593Smuzhiyun printf("Found %luMB\n", page_sizes[i] >> 20);
72*4882a593Smuzhiyun }
73*4882a593Smuzhiyun num_page_sizes = g.gl_pathc;
74*4882a593Smuzhiyun globfree(&g);
75*4882a593Smuzhiyun }
76*4882a593Smuzhiyun
/*
 * Return the default huge page size in bytes, taken from the
 * "Hugepagesize:" line of /proc/meminfo.  Returns 0 when the file cannot
 * be opened or contains no such line.
 */
unsigned long default_huge_page_size(void)
{
	unsigned long hps = 0;
	char *line = NULL;
	size_t linelen = 0;
	FILE *f = fopen("/proc/meminfo", "r");

	if (!f)
		return 0;

	while (getline(&line, &linelen, f) > 0) {
		if (sscanf(line, "Hugepagesize: %lu kB", &hps) == 1) {
			/* value is reported in kB; convert to bytes */
			hps <<= 10;
			break;
		}
	}

	free(line);
	/* the stream was previously left open; release it */
	fclose(f);
	return hps;
}
94*4882a593Smuzhiyun
/*
 * Print "<size>MB: " followed by the current free_hugepages count for the
 * huge page size ps (in bytes).  Does nothing when ps is the base page size.
 */
void show(unsigned long ps)
{
	char cmd[100];

	if (ps != getpagesize()) {
		printf("%luMB: ", ps >> 20);
		/* push the label out before the child process writes its output */
		fflush(stdout);

		snprintf(cmd, sizeof cmd,
			 "cat /sys/kernel/mm/hugepages/hugepages-%lukB/free_hugepages",
			 ps >> 10);
		system(cmd);
	}
}
107*4882a593Smuzhiyun
/*
 * Build a path from the printf-style fmt and arguments, open that file and
 * return the unsigned number parsed from its first line.
 *
 * Returns 0 when the file cannot be opened (printing "missing <path>" if
 * warn is non-zero) or when the first line holds no number.
 */
unsigned long read_sysfs(int warn, char *fmt, ...)
{
	char path[100];
	char *text = NULL;
	size_t cap = 0;
	unsigned long result = 0;
	va_list args;
	FILE *fp;

	va_start(args, fmt);
	vsnprintf(path, sizeof path, fmt, args);
	va_end(args);

	fp = fopen(path, "r");
	if (fp != NULL) {
		if (getline(&text, &cap, fp) > 0)
			sscanf(text, "%lu", &result);
		free(text);
		fclose(fp);
	} else if (warn) {
		printf("missing %s\n", path);
	}

	return result;
}
134*4882a593Smuzhiyun
/*
 * Return the free_hugepages count for the huge page size ps (in bytes).
 * A missing sysfs entry is only warned about when ps is not the base
 * page size.
 */
unsigned long read_free(unsigned long ps)
{
	int warn_if_missing = (ps != getpagesize());
	unsigned long size_kb = ps >> 10;

	return read_sysfs(warn_if_missing,
			  "/sys/kernel/mm/hugepages/hugepages-%lukB/free_hugepages",
			  size_kb);
}
141*4882a593Smuzhiyun
test_mmap(unsigned long size,unsigned flags)142*4882a593Smuzhiyun void test_mmap(unsigned long size, unsigned flags)
143*4882a593Smuzhiyun {
144*4882a593Smuzhiyun char *map;
145*4882a593Smuzhiyun unsigned long before, after;
146*4882a593Smuzhiyun int err;
147*4882a593Smuzhiyun
148*4882a593Smuzhiyun before = read_free(size);
149*4882a593Smuzhiyun map = mmap(NULL, size*NUM_PAGES, PROT_READ|PROT_WRITE,
150*4882a593Smuzhiyun MAP_PRIVATE|MAP_ANONYMOUS|MAP_HUGETLB|flags, -1, 0);
151*4882a593Smuzhiyun
152*4882a593Smuzhiyun if (map == (char *)-1) err("mmap");
153*4882a593Smuzhiyun memset(map, 0xff, size*NUM_PAGES);
154*4882a593Smuzhiyun after = read_free(size);
155*4882a593Smuzhiyun Dprintf("before %lu after %lu diff %ld size %lu\n",
156*4882a593Smuzhiyun before, after, before - after, size);
157*4882a593Smuzhiyun assert(size == getpagesize() || (before - after) == NUM_PAGES);
158*4882a593Smuzhiyun show(size);
159*4882a593Smuzhiyun err = munmap(map, size);
160*4882a593Smuzhiyun assert(!err);
161*4882a593Smuzhiyun }
162*4882a593Smuzhiyun
test_shmget(unsigned long size,unsigned flags)163*4882a593Smuzhiyun void test_shmget(unsigned long size, unsigned flags)
164*4882a593Smuzhiyun {
165*4882a593Smuzhiyun int id;
166*4882a593Smuzhiyun unsigned long before, after;
167*4882a593Smuzhiyun int err;
168*4882a593Smuzhiyun
169*4882a593Smuzhiyun before = read_free(size);
170*4882a593Smuzhiyun id = shmget(IPC_PRIVATE, size * NUM_PAGES, IPC_CREAT|0600|flags);
171*4882a593Smuzhiyun if (id < 0) err("shmget");
172*4882a593Smuzhiyun
173*4882a593Smuzhiyun struct shm_info i;
174*4882a593Smuzhiyun if (shmctl(id, SHM_INFO, (void *)&i) < 0) err("shmctl");
175*4882a593Smuzhiyun Dprintf("alloc %lu res %lu\n", i.shm_tot, i.shm_rss);
176*4882a593Smuzhiyun
177*4882a593Smuzhiyun
178*4882a593Smuzhiyun Dprintf("id %d\n", id);
179*4882a593Smuzhiyun char *map = shmat(id, NULL, 0600);
180*4882a593Smuzhiyun if (map == (char*)-1) err("shmat");
181*4882a593Smuzhiyun
182*4882a593Smuzhiyun shmctl(id, IPC_RMID, NULL);
183*4882a593Smuzhiyun
184*4882a593Smuzhiyun memset(map, 0xff, size*NUM_PAGES);
185*4882a593Smuzhiyun after = read_free(size);
186*4882a593Smuzhiyun
187*4882a593Smuzhiyun Dprintf("before %lu after %lu diff %ld size %lu\n",
188*4882a593Smuzhiyun before, after, before - after, size);
189*4882a593Smuzhiyun assert(size == getpagesize() || (before - after) == NUM_PAGES);
190*4882a593Smuzhiyun show(size);
191*4882a593Smuzhiyun err = shmdt(map);
192*4882a593Smuzhiyun assert(!err);
193*4882a593Smuzhiyun }
194*4882a593Smuzhiyun
sanity_checks(void)195*4882a593Smuzhiyun void sanity_checks(void)
196*4882a593Smuzhiyun {
197*4882a593Smuzhiyun int i;
198*4882a593Smuzhiyun unsigned long largest = getpagesize();
199*4882a593Smuzhiyun
200*4882a593Smuzhiyun for (i = 0; i < num_page_sizes; i++) {
201*4882a593Smuzhiyun if (page_sizes[i] > largest)
202*4882a593Smuzhiyun largest = page_sizes[i];
203*4882a593Smuzhiyun
204*4882a593Smuzhiyun if (read_free(page_sizes[i]) < NUM_PAGES) {
205*4882a593Smuzhiyun printf("Not enough huge pages for page size %lu MB, need %u\n",
206*4882a593Smuzhiyun page_sizes[i] >> 20,
207*4882a593Smuzhiyun NUM_PAGES);
208*4882a593Smuzhiyun exit(0);
209*4882a593Smuzhiyun }
210*4882a593Smuzhiyun }
211*4882a593Smuzhiyun
212*4882a593Smuzhiyun if (read_sysfs(0, "/proc/sys/kernel/shmmax") < NUM_PAGES * largest) {
213*4882a593Smuzhiyun printf("Please do echo %lu > /proc/sys/kernel/shmmax", largest * NUM_PAGES);
214*4882a593Smuzhiyun exit(0);
215*4882a593Smuzhiyun }
216*4882a593Smuzhiyun
217*4882a593Smuzhiyun #if defined(__x86_64__)
218*4882a593Smuzhiyun if (largest != 1U<<30) {
219*4882a593Smuzhiyun printf("No GB pages available on x86-64\n"
220*4882a593Smuzhiyun "Please boot with hugepagesz=1G hugepages=%d\n", NUM_PAGES);
221*4882a593Smuzhiyun exit(0);
222*4882a593Smuzhiyun }
223*4882a593Smuzhiyun #endif
224*4882a593Smuzhiyun }
225*4882a593Smuzhiyun
main(void)226*4882a593Smuzhiyun int main(void)
227*4882a593Smuzhiyun {
228*4882a593Smuzhiyun int i;
229*4882a593Smuzhiyun unsigned default_hps = default_huge_page_size();
230*4882a593Smuzhiyun
231*4882a593Smuzhiyun find_pagesizes();
232*4882a593Smuzhiyun
233*4882a593Smuzhiyun sanity_checks();
234*4882a593Smuzhiyun
235*4882a593Smuzhiyun for (i = 0; i < num_page_sizes; i++) {
236*4882a593Smuzhiyun unsigned long ps = page_sizes[i];
237*4882a593Smuzhiyun int arg = ilog2(ps) << MAP_HUGE_SHIFT;
238*4882a593Smuzhiyun printf("Testing %luMB mmap with shift %x\n", ps >> 20, arg);
239*4882a593Smuzhiyun test_mmap(ps, MAP_HUGETLB | arg);
240*4882a593Smuzhiyun }
241*4882a593Smuzhiyun printf("Testing default huge mmap\n");
242*4882a593Smuzhiyun test_mmap(default_hps, SHM_HUGETLB);
243*4882a593Smuzhiyun
244*4882a593Smuzhiyun puts("Testing non-huge shmget");
245*4882a593Smuzhiyun test_shmget(getpagesize(), 0);
246*4882a593Smuzhiyun
247*4882a593Smuzhiyun for (i = 0; i < num_page_sizes; i++) {
248*4882a593Smuzhiyun unsigned long ps = page_sizes[i];
249*4882a593Smuzhiyun int arg = ilog2(ps) << SHM_HUGE_SHIFT;
250*4882a593Smuzhiyun printf("Testing %luMB shmget with shift %x\n", ps >> 20, arg);
251*4882a593Smuzhiyun test_shmget(ps, SHM_HUGETLB | arg);
252*4882a593Smuzhiyun }
253*4882a593Smuzhiyun puts("default huge shmget");
254*4882a593Smuzhiyun test_shmget(default_hps, SHM_HUGETLB);
255*4882a593Smuzhiyun
256*4882a593Smuzhiyun return 0;
257*4882a593Smuzhiyun }
258