1 #define _GNU_SOURCE
2 #include <sys/mman.h>
3 #include <stdint.h>
4 #include <stdio.h>
5 #include <stdlib.h>
6 #include <unistd.h>
7 #include <string.h>
8 #include <sys/time.h>
9 #include <sys/resource.h>
10 #include <syscall.h>
11 #include <errno.h>
12 #include <stdbool.h>
13
14 #ifndef MLOCK_ONFAULT
15 #define MLOCK_ONFAULT 1
16 #endif
17
18 #ifndef MCL_ONFAULT
19 #define MCL_ONFAULT (MCL_FUTURE << 1)
20 #endif
21
mlock2_(void * start,size_t len,int flags)22 static int mlock2_(void *start, size_t len, int flags)
23 {
24 #ifdef __NR_mlock2
25 return syscall(__NR_mlock2, start, len, flags);
26 #else
27 errno = ENOSYS;
28 return -1;
29 #endif
30 }
31
32 struct vm_boundaries {
33 unsigned long start;
34 unsigned long end;
35 };
36
get_vm_area(unsigned long addr,struct vm_boundaries * area)37 static int get_vm_area(unsigned long addr, struct vm_boundaries *area)
38 {
39 FILE *file;
40 int ret = 1;
41 char line[1024] = {0};
42 char *end_addr;
43 char *stop;
44 unsigned long start;
45 unsigned long end;
46
47 if (!area)
48 return ret;
49
50 file = fopen("/proc/self/maps", "r");
51 if (!file) {
52 perror("fopen");
53 return ret;
54 }
55
56 memset(area, 0, sizeof(struct vm_boundaries));
57
58 while(fgets(line, 1024, file)) {
59 end_addr = strchr(line, '-');
60 if (!end_addr) {
61 printf("cannot parse /proc/self/maps\n");
62 goto out;
63 }
64 *end_addr = '\0';
65 end_addr++;
66 stop = strchr(end_addr, ' ');
67 if (!stop) {
68 printf("cannot parse /proc/self/maps\n");
69 goto out;
70 }
71 stop = '\0';
72
73 sscanf(line, "%lx", &start);
74 sscanf(end_addr, "%lx", &end);
75
76 if (start <= addr && end > addr) {
77 area->start = start;
78 area->end = end;
79 ret = 0;
80 goto out;
81 }
82 }
83 out:
84 fclose(file);
85 return ret;
86 }
87
get_pageflags(unsigned long addr)88 static uint64_t get_pageflags(unsigned long addr)
89 {
90 FILE *file;
91 uint64_t pfn;
92 unsigned long offset;
93
94 file = fopen("/proc/self/pagemap", "r");
95 if (!file) {
96 perror("fopen pagemap");
97 _exit(1);
98 }
99
100 offset = addr / getpagesize() * sizeof(pfn);
101
102 if (fseek(file, offset, SEEK_SET)) {
103 perror("fseek pagemap");
104 _exit(1);
105 }
106
107 if (fread(&pfn, sizeof(pfn), 1, file) != 1) {
108 perror("fread pagemap");
109 _exit(1);
110 }
111
112 fclose(file);
113 return pfn;
114 }
115
get_kpageflags(unsigned long pfn)116 static uint64_t get_kpageflags(unsigned long pfn)
117 {
118 uint64_t flags;
119 FILE *file;
120
121 file = fopen("/proc/kpageflags", "r");
122 if (!file) {
123 perror("fopen kpageflags");
124 _exit(1);
125 }
126
127 if (fseek(file, pfn * sizeof(flags), SEEK_SET)) {
128 perror("fseek kpageflags");
129 _exit(1);
130 }
131
132 if (fread(&flags, sizeof(flags), 1, file) != 1) {
133 perror("fread kpageflags");
134 _exit(1);
135 }
136
137 fclose(file);
138 return flags;
139 }
140
seek_to_smaps_entry(unsigned long addr)141 static FILE *seek_to_smaps_entry(unsigned long addr)
142 {
143 FILE *file;
144 char *line = NULL;
145 size_t size = 0;
146 unsigned long start, end;
147 char perms[5];
148 unsigned long offset;
149 char dev[32];
150 unsigned long inode;
151 char path[BUFSIZ];
152
153 file = fopen("/proc/self/smaps", "r");
154 if (!file) {
155 perror("fopen smaps");
156 _exit(1);
157 }
158
159 while (getline(&line, &size, file) > 0) {
160 if (sscanf(line, "%lx-%lx %s %lx %s %lu %s\n",
161 &start, &end, perms, &offset, dev, &inode, path) < 6)
162 goto next;
163
164 if (start <= addr && addr < end)
165 goto out;
166
167 next:
168 free(line);
169 line = NULL;
170 size = 0;
171 }
172
173 fclose(file);
174 file = NULL;
175
176 out:
177 free(line);
178 return file;
179 }
180
181 #define VMFLAGS "VmFlags:"
182
is_vmflag_set(unsigned long addr,const char * vmflag)183 static bool is_vmflag_set(unsigned long addr, const char *vmflag)
184 {
185 char *line = NULL;
186 char *flags;
187 size_t size = 0;
188 bool ret = false;
189 FILE *smaps;
190
191 smaps = seek_to_smaps_entry(addr);
192 if (!smaps) {
193 printf("Unable to parse /proc/self/smaps\n");
194 goto out;
195 }
196
197 while (getline(&line, &size, smaps) > 0) {
198 if (!strstr(line, VMFLAGS)) {
199 free(line);
200 line = NULL;
201 size = 0;
202 continue;
203 }
204
205 flags = line + strlen(VMFLAGS);
206 ret = (strstr(flags, vmflag) != NULL);
207 goto out;
208 }
209
210 out:
211 free(line);
212 fclose(smaps);
213 return ret;
214 }
215
216 #define SIZE "Size:"
217 #define RSS "Rss:"
218 #define LOCKED "lo"
219
is_vma_lock_on_fault(unsigned long addr)220 static bool is_vma_lock_on_fault(unsigned long addr)
221 {
222 bool ret = false;
223 bool locked;
224 FILE *smaps = NULL;
225 unsigned long vma_size, vma_rss;
226 char *line = NULL;
227 char *value;
228 size_t size = 0;
229
230 locked = is_vmflag_set(addr, LOCKED);
231 if (!locked)
232 goto out;
233
234 smaps = seek_to_smaps_entry(addr);
235 if (!smaps) {
236 printf("Unable to parse /proc/self/smaps\n");
237 goto out;
238 }
239
240 while (getline(&line, &size, smaps) > 0) {
241 if (!strstr(line, SIZE)) {
242 free(line);
243 line = NULL;
244 size = 0;
245 continue;
246 }
247
248 value = line + strlen(SIZE);
249 if (sscanf(value, "%lu kB", &vma_size) < 1) {
250 printf("Unable to parse smaps entry for Size\n");
251 goto out;
252 }
253 break;
254 }
255
256 while (getline(&line, &size, smaps) > 0) {
257 if (!strstr(line, RSS)) {
258 free(line);
259 line = NULL;
260 size = 0;
261 continue;
262 }
263
264 value = line + strlen(RSS);
265 if (sscanf(value, "%lu kB", &vma_rss) < 1) {
266 printf("Unable to parse smaps entry for Rss\n");
267 goto out;
268 }
269 break;
270 }
271
272 ret = locked && (vma_rss < vma_size);
273 out:
274 free(line);
275 if (smaps)
276 fclose(smaps);
277 return ret;
278 }
279
280 #define PRESENT_BIT 0x8000000000000000ULL
281 #define PFN_MASK 0x007FFFFFFFFFFFFFULL
282 #define UNEVICTABLE_BIT (1UL << 18)
283
lock_check(char * map)284 static int lock_check(char *map)
285 {
286 unsigned long page_size = getpagesize();
287 uint64_t page1_flags, page2_flags;
288
289 page1_flags = get_pageflags((unsigned long)map);
290 page2_flags = get_pageflags((unsigned long)map + page_size);
291
292 /* Both pages should be present */
293 if (((page1_flags & PRESENT_BIT) == 0) ||
294 ((page2_flags & PRESENT_BIT) == 0)) {
295 printf("Failed to make both pages present\n");
296 return 1;
297 }
298
299 page1_flags = get_kpageflags(page1_flags & PFN_MASK);
300 page2_flags = get_kpageflags(page2_flags & PFN_MASK);
301
302 /* Both pages should be unevictable */
303 if (((page1_flags & UNEVICTABLE_BIT) == 0) ||
304 ((page2_flags & UNEVICTABLE_BIT) == 0)) {
305 printf("Failed to make both pages unevictable\n");
306 return 1;
307 }
308
309 if (!is_vmflag_set((unsigned long)map, LOCKED)) {
310 printf("VMA flag %s is missing on page 1\n", LOCKED);
311 return 1;
312 }
313
314 if (!is_vmflag_set((unsigned long)map + page_size, LOCKED)) {
315 printf("VMA flag %s is missing on page 2\n", LOCKED);
316 return 1;
317 }
318
319 return 0;
320 }
321
unlock_lock_check(char * map)322 static int unlock_lock_check(char *map)
323 {
324 unsigned long page_size = getpagesize();
325 uint64_t page1_flags, page2_flags;
326
327 page1_flags = get_pageflags((unsigned long)map);
328 page2_flags = get_pageflags((unsigned long)map + page_size);
329 page1_flags = get_kpageflags(page1_flags & PFN_MASK);
330 page2_flags = get_kpageflags(page2_flags & PFN_MASK);
331
332 if ((page1_flags & UNEVICTABLE_BIT) || (page2_flags & UNEVICTABLE_BIT)) {
333 printf("A page is still marked unevictable after unlock\n");
334 return 1;
335 }
336
337 if (is_vmflag_set((unsigned long)map, LOCKED)) {
338 printf("VMA flag %s is present on page 1 after unlock\n", LOCKED);
339 return 1;
340 }
341
342 if (is_vmflag_set((unsigned long)map + page_size, LOCKED)) {
343 printf("VMA flag %s is present on page 2 after unlock\n", LOCKED);
344 return 1;
345 }
346
347 return 0;
348 }
349
test_mlock_lock()350 static int test_mlock_lock()
351 {
352 char *map;
353 int ret = 1;
354 unsigned long page_size = getpagesize();
355
356 map = mmap(NULL, 2 * page_size, PROT_READ | PROT_WRITE,
357 MAP_ANONYMOUS | MAP_PRIVATE, 0, 0);
358 if (map == MAP_FAILED) {
359 perror("test_mlock_locked mmap");
360 goto out;
361 }
362
363 if (mlock2_(map, 2 * page_size, 0)) {
364 if (errno == ENOSYS) {
365 printf("Cannot call new mlock family, skipping test\n");
366 _exit(0);
367 }
368 perror("mlock2(0)");
369 goto unmap;
370 }
371
372 if (lock_check(map))
373 goto unmap;
374
375 /* Now unlock and recheck attributes */
376 if (munlock(map, 2 * page_size)) {
377 perror("munlock()");
378 goto unmap;
379 }
380
381 ret = unlock_lock_check(map);
382
383 unmap:
384 munmap(map, 2 * page_size);
385 out:
386 return ret;
387 }
388
onfault_check(char * map)389 static int onfault_check(char *map)
390 {
391 unsigned long page_size = getpagesize();
392 uint64_t page1_flags, page2_flags;
393
394 page1_flags = get_pageflags((unsigned long)map);
395 page2_flags = get_pageflags((unsigned long)map + page_size);
396
397 /* Neither page should be present */
398 if ((page1_flags & PRESENT_BIT) || (page2_flags & PRESENT_BIT)) {
399 printf("Pages were made present by MLOCK_ONFAULT\n");
400 return 1;
401 }
402
403 *map = 'a';
404 page1_flags = get_pageflags((unsigned long)map);
405 page2_flags = get_pageflags((unsigned long)map + page_size);
406
407 /* Only page 1 should be present */
408 if ((page1_flags & PRESENT_BIT) == 0) {
409 printf("Page 1 is not present after fault\n");
410 return 1;
411 } else if (page2_flags & PRESENT_BIT) {
412 printf("Page 2 was made present\n");
413 return 1;
414 }
415
416 page1_flags = get_kpageflags(page1_flags & PFN_MASK);
417
418 /* Page 1 should be unevictable */
419 if ((page1_flags & UNEVICTABLE_BIT) == 0) {
420 printf("Failed to make faulted page unevictable\n");
421 return 1;
422 }
423
424 if (!is_vma_lock_on_fault((unsigned long)map)) {
425 printf("VMA is not marked for lock on fault\n");
426 return 1;
427 }
428
429 if (!is_vma_lock_on_fault((unsigned long)map + page_size)) {
430 printf("VMA is not marked for lock on fault\n");
431 return 1;
432 }
433
434 return 0;
435 }
436
unlock_onfault_check(char * map)437 static int unlock_onfault_check(char *map)
438 {
439 unsigned long page_size = getpagesize();
440 uint64_t page1_flags;
441
442 page1_flags = get_pageflags((unsigned long)map);
443 page1_flags = get_kpageflags(page1_flags & PFN_MASK);
444
445 if (page1_flags & UNEVICTABLE_BIT) {
446 printf("Page 1 is still marked unevictable after unlock\n");
447 return 1;
448 }
449
450 if (is_vma_lock_on_fault((unsigned long)map) ||
451 is_vma_lock_on_fault((unsigned long)map + page_size)) {
452 printf("VMA is still lock on fault after unlock\n");
453 return 1;
454 }
455
456 return 0;
457 }
458
test_mlock_onfault()459 static int test_mlock_onfault()
460 {
461 char *map;
462 int ret = 1;
463 unsigned long page_size = getpagesize();
464
465 map = mmap(NULL, 2 * page_size, PROT_READ | PROT_WRITE,
466 MAP_ANONYMOUS | MAP_PRIVATE, 0, 0);
467 if (map == MAP_FAILED) {
468 perror("test_mlock_locked mmap");
469 goto out;
470 }
471
472 if (mlock2_(map, 2 * page_size, MLOCK_ONFAULT)) {
473 if (errno == ENOSYS) {
474 printf("Cannot call new mlock family, skipping test\n");
475 _exit(0);
476 }
477 perror("mlock2(MLOCK_ONFAULT)");
478 goto unmap;
479 }
480
481 if (onfault_check(map))
482 goto unmap;
483
484 /* Now unlock and recheck attributes */
485 if (munlock(map, 2 * page_size)) {
486 if (errno == ENOSYS) {
487 printf("Cannot call new mlock family, skipping test\n");
488 _exit(0);
489 }
490 perror("munlock()");
491 goto unmap;
492 }
493
494 ret = unlock_onfault_check(map);
495 unmap:
496 munmap(map, 2 * page_size);
497 out:
498 return ret;
499 }
500
test_lock_onfault_of_present()501 static int test_lock_onfault_of_present()
502 {
503 char *map;
504 int ret = 1;
505 unsigned long page_size = getpagesize();
506 uint64_t page1_flags, page2_flags;
507
508 map = mmap(NULL, 2 * page_size, PROT_READ | PROT_WRITE,
509 MAP_ANONYMOUS | MAP_PRIVATE, 0, 0);
510 if (map == MAP_FAILED) {
511 perror("test_mlock_locked mmap");
512 goto out;
513 }
514
515 *map = 'a';
516
517 if (mlock2_(map, 2 * page_size, MLOCK_ONFAULT)) {
518 if (errno == ENOSYS) {
519 printf("Cannot call new mlock family, skipping test\n");
520 _exit(0);
521 }
522 perror("mlock2(MLOCK_ONFAULT)");
523 goto unmap;
524 }
525
526 page1_flags = get_pageflags((unsigned long)map);
527 page2_flags = get_pageflags((unsigned long)map + page_size);
528 page1_flags = get_kpageflags(page1_flags & PFN_MASK);
529 page2_flags = get_kpageflags(page2_flags & PFN_MASK);
530
531 /* Page 1 should be unevictable */
532 if ((page1_flags & UNEVICTABLE_BIT) == 0) {
533 printf("Failed to make present page unevictable\n");
534 goto unmap;
535 }
536
537 if (!is_vma_lock_on_fault((unsigned long)map) ||
538 !is_vma_lock_on_fault((unsigned long)map + page_size)) {
539 printf("VMA with present pages is not marked lock on fault\n");
540 goto unmap;
541 }
542 ret = 0;
543 unmap:
544 munmap(map, 2 * page_size);
545 out:
546 return ret;
547 }
548
test_munlockall()549 static int test_munlockall()
550 {
551 char *map;
552 int ret = 1;
553 unsigned long page_size = getpagesize();
554
555 map = mmap(NULL, 2 * page_size, PROT_READ | PROT_WRITE,
556 MAP_ANONYMOUS | MAP_PRIVATE, 0, 0);
557
558 if (map == MAP_FAILED) {
559 perror("test_munlockall mmap");
560 goto out;
561 }
562
563 if (mlockall(MCL_CURRENT)) {
564 perror("mlockall(MCL_CURRENT)");
565 goto out;
566 }
567
568 if (lock_check(map))
569 goto unmap;
570
571 if (munlockall()) {
572 perror("munlockall()");
573 goto unmap;
574 }
575
576 if (unlock_lock_check(map))
577 goto unmap;
578
579 munmap(map, 2 * page_size);
580
581 map = mmap(NULL, 2 * page_size, PROT_READ | PROT_WRITE,
582 MAP_ANONYMOUS | MAP_PRIVATE, 0, 0);
583
584 if (map == MAP_FAILED) {
585 perror("test_munlockall second mmap");
586 goto out;
587 }
588
589 if (mlockall(MCL_CURRENT | MCL_ONFAULT)) {
590 perror("mlockall(MCL_CURRENT | MCL_ONFAULT)");
591 goto unmap;
592 }
593
594 if (onfault_check(map))
595 goto unmap;
596
597 if (munlockall()) {
598 perror("munlockall()");
599 goto unmap;
600 }
601
602 if (unlock_onfault_check(map))
603 goto unmap;
604
605 if (mlockall(MCL_CURRENT | MCL_FUTURE)) {
606 perror("mlockall(MCL_CURRENT | MCL_FUTURE)");
607 goto out;
608 }
609
610 if (lock_check(map))
611 goto unmap;
612
613 if (munlockall()) {
614 perror("munlockall()");
615 goto unmap;
616 }
617
618 ret = unlock_lock_check(map);
619
620 unmap:
621 munmap(map, 2 * page_size);
622 out:
623 munlockall();
624 return ret;
625 }
626
test_vma_management(bool call_mlock)627 static int test_vma_management(bool call_mlock)
628 {
629 int ret = 1;
630 void *map;
631 unsigned long page_size = getpagesize();
632 struct vm_boundaries page1;
633 struct vm_boundaries page2;
634 struct vm_boundaries page3;
635
636 map = mmap(NULL, 3 * page_size, PROT_READ | PROT_WRITE,
637 MAP_ANONYMOUS | MAP_PRIVATE, 0, 0);
638 if (map == MAP_FAILED) {
639 perror("mmap()");
640 return ret;
641 }
642
643 if (call_mlock && mlock2_(map, 3 * page_size, MLOCK_ONFAULT)) {
644 if (errno == ENOSYS) {
645 printf("Cannot call new mlock family, skipping test\n");
646 _exit(0);
647 }
648 perror("mlock(ONFAULT)\n");
649 goto out;
650 }
651
652 if (get_vm_area((unsigned long)map, &page1) ||
653 get_vm_area((unsigned long)map + page_size, &page2) ||
654 get_vm_area((unsigned long)map + page_size * 2, &page3)) {
655 printf("couldn't find mapping in /proc/self/maps\n");
656 goto out;
657 }
658
659 /*
660 * Before we unlock a portion, we need to that all three pages are in
661 * the same VMA. If they are not we abort this test (Note that this is
662 * not a failure)
663 */
664 if (page1.start != page2.start || page2.start != page3.start) {
665 printf("VMAs are not merged to start, aborting test\n");
666 ret = 0;
667 goto out;
668 }
669
670 if (munlock(map + page_size, page_size)) {
671 perror("munlock()");
672 goto out;
673 }
674
675 if (get_vm_area((unsigned long)map, &page1) ||
676 get_vm_area((unsigned long)map + page_size, &page2) ||
677 get_vm_area((unsigned long)map + page_size * 2, &page3)) {
678 printf("couldn't find mapping in /proc/self/maps\n");
679 goto out;
680 }
681
682 /* All three VMAs should be different */
683 if (page1.start == page2.start || page2.start == page3.start) {
684 printf("failed to split VMA for munlock\n");
685 goto out;
686 }
687
688 /* Now unlock the first and third page and check the VMAs again */
689 if (munlock(map, page_size * 3)) {
690 perror("munlock()");
691 goto out;
692 }
693
694 if (get_vm_area((unsigned long)map, &page1) ||
695 get_vm_area((unsigned long)map + page_size, &page2) ||
696 get_vm_area((unsigned long)map + page_size * 2, &page3)) {
697 printf("couldn't find mapping in /proc/self/maps\n");
698 goto out;
699 }
700
701 /* Now all three VMAs should be the same */
702 if (page1.start != page2.start || page2.start != page3.start) {
703 printf("failed to merge VMAs after munlock\n");
704 goto out;
705 }
706
707 ret = 0;
708 out:
709 munmap(map, 3 * page_size);
710 return ret;
711 }
712
test_mlockall(int (test_function)(bool call_mlock))713 static int test_mlockall(int (test_function)(bool call_mlock))
714 {
715 int ret = 1;
716
717 if (mlockall(MCL_CURRENT | MCL_ONFAULT | MCL_FUTURE)) {
718 perror("mlockall");
719 return ret;
720 }
721
722 ret = test_function(false);
723 munlockall();
724 return ret;
725 }
726
main(int argc,char ** argv)727 int main(int argc, char **argv)
728 {
729 int ret = 0;
730 ret += test_mlock_lock();
731 ret += test_mlock_onfault();
732 ret += test_munlockall();
733 ret += test_lock_onfault_of_present();
734 ret += test_vma_management(true);
735 ret += test_mlockall(test_vma_management);
736 return ret;
737 }
738