145 lines
3.5 KiB
C
145 lines
3.5 KiB
C
|
/*
 * Stress test for transparent huge pages, memory compaction and migration.
 *
 * Authors: Konstantin Khlebnikov <koct9i@gmail.com>
 *
 * This is free and unencumbered software released into the public domain.
 */
|
||
|
|
||
|
#include <stdlib.h>
|
||
|
#include <stdio.h>
|
||
|
#include <stdint.h>
|
||
|
#include <err.h>
|
||
|
#include <time.h>
|
||
|
#include <unistd.h>
|
||
|
#include <fcntl.h>
|
||
|
#include <string.h>
|
||
|
#include <sys/mman.h>
|
||
|
|
||
|
/*
 * Page geometry used throughout this file: base pages are 2^12 bytes
 * (4 KiB) and huge pages are 2^21 bytes (2 MiB). Both are compile-time
 * constants, not values queried from the running system.
 */
#define PAGE_SHIFT	12
#define HPAGE_SHIFT	21

#define PAGE_SIZE	(1 << (PAGE_SHIFT))
#define HPAGE_SIZE	(1 << (HPAGE_SHIFT))

/*
 * Decoding of one 64-bit pagemap entry: bit 63 is tested as the "present"
 * flag and the low 55 bits (0-54) are extracted as the page frame number.
 */
#define PAGEMAP_PRESENT_BIT	(1ull << 63)
#define PAGEMAP_PFN_MASK	((1ull << 55) - 1)

#define PAGEMAP_PRESENT(ent)	(0 != (PAGEMAP_PRESENT_BIT & (ent)))
#define PAGEMAP_PFN(ent)	(PAGEMAP_PFN_MASK & (ent))

/* Descriptor that allocate_transhuge() reads pagemap entries from. */
int pagemap_fd;
|
||
|
|
||
|
int64_t allocate_transhuge(void *ptr)
|
||
|
{
|
||
|
uint64_t ent[2];
|
||
|
|
||
|
/* drop pmd */
|
||
|
if (mmap(ptr, HPAGE_SIZE, PROT_READ | PROT_WRITE,
|
||
|
MAP_FIXED | MAP_ANONYMOUS |
|
||
|
MAP_NORESERVE | MAP_PRIVATE, -1, 0) != ptr)
|
||
|
errx(2, "mmap transhuge");
|
||
|
|
||
|
if (madvise(ptr, HPAGE_SIZE, MADV_HUGEPAGE))
|
||
|
err(2, "MADV_HUGEPAGE");
|
||
|
|
||
|
/* allocate transparent huge page */
|
||
|
*(volatile void **)ptr = ptr;
|
||
|
|
||
|
if (pread(pagemap_fd, ent, sizeof(ent),
|
||
|
(uintptr_t)ptr >> (PAGE_SHIFT - 3)) != sizeof(ent))
|
||
|
err(2, "read pagemap");
|
||
|
|
||
|
if (PAGEMAP_PRESENT(ent[0]) && PAGEMAP_PRESENT(ent[1]) &&
|
||
|
PAGEMAP_PFN(ent[0]) + 1 == PAGEMAP_PFN(ent[1]) &&
|
||
|
!(PAGEMAP_PFN(ent[0]) & ((1 << (HPAGE_SHIFT - PAGE_SHIFT)) - 1)))
|
||
|
return PAGEMAP_PFN(ent[0]);
|
||
|
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
int main(int argc, char **argv)
|
||
|
{
|
||
|
size_t ram, len;
|
||
|
void *ptr, *p;
|
||
|
struct timespec a, b;
|
||
|
double s;
|
||
|
uint8_t *map;
|
||
|
size_t map_len;
|
||
|
|
||
|
ram = sysconf(_SC_PHYS_PAGES);
|
||
|
if (ram > SIZE_MAX / sysconf(_SC_PAGESIZE) / 4)
|
||
|
ram = SIZE_MAX / 4;
|
||
|
else
|
||
|
ram *= sysconf(_SC_PAGESIZE);
|
||
|
|
||
|
if (argc == 1)
|
||
|
len = ram;
|
||
|
else if (!strcmp(argv[1], "-h"))
|
||
|
errx(1, "usage: %s [size in MiB]", argv[0]);
|
||
|
else
|
||
|
len = atoll(argv[1]) << 20;
|
||
|
|
||
|
warnx("allocate %zd transhuge pages, using %zd MiB virtual memory"
|
||
|
" and %zd MiB of ram", len >> HPAGE_SHIFT, len >> 20,
|
||
|
len >> (20 + HPAGE_SHIFT - PAGE_SHIFT - 1));
|
||
|
|
||
|
pagemap_fd = open("/proc/self/pagemap", O_RDONLY);
|
||
|
if (pagemap_fd < 0)
|
||
|
err(2, "open pagemap");
|
||
|
|
||
|
len -= len % HPAGE_SIZE;
|
||
|
ptr = mmap(NULL, len + HPAGE_SIZE, PROT_READ | PROT_WRITE,
|
||
|
MAP_ANONYMOUS | MAP_NORESERVE | MAP_PRIVATE, -1, 0);
|
||
|
if (ptr == MAP_FAILED)
|
||
|
err(2, "initial mmap");
|
||
|
ptr += HPAGE_SIZE - (uintptr_t)ptr % HPAGE_SIZE;
|
||
|
|
||
|
if (madvise(ptr, len, MADV_HUGEPAGE))
|
||
|
err(2, "MADV_HUGEPAGE");
|
||
|
|
||
|
map_len = ram >> (HPAGE_SHIFT - 1);
|
||
|
map = malloc(map_len);
|
||
|
if (!map)
|
||
|
errx(2, "map malloc");
|
||
|
|
||
|
while (1) {
|
||
|
int nr_succeed = 0, nr_failed = 0, nr_pages = 0;
|
||
|
|
||
|
memset(map, 0, map_len);
|
||
|
|
||
|
clock_gettime(CLOCK_MONOTONIC, &a);
|
||
|
for (p = ptr; p < ptr + len; p += HPAGE_SIZE) {
|
||
|
int64_t pfn;
|
||
|
|
||
|
pfn = allocate_transhuge(p);
|
||
|
|
||
|
if (pfn < 0) {
|
||
|
nr_failed++;
|
||
|
} else {
|
||
|
size_t idx = pfn >> (HPAGE_SHIFT - PAGE_SHIFT);
|
||
|
|
||
|
nr_succeed++;
|
||
|
if (idx >= map_len) {
|
||
|
map = realloc(map, idx + 1);
|
||
|
if (!map)
|
||
|
errx(2, "map realloc");
|
||
|
memset(map + map_len, 0, idx + 1 - map_len);
|
||
|
map_len = idx + 1;
|
||
|
}
|
||
|
if (!map[idx])
|
||
|
nr_pages++;
|
||
|
map[idx] = 1;
|
||
|
}
|
||
|
|
||
|
/* split transhuge page, keep last page */
|
||
|
if (madvise(p, HPAGE_SIZE - PAGE_SIZE, MADV_DONTNEED))
|
||
|
err(2, "MADV_DONTNEED");
|
||
|
}
|
||
|
clock_gettime(CLOCK_MONOTONIC, &b);
|
||
|
s = b.tv_sec - a.tv_sec + (b.tv_nsec - a.tv_nsec) / 1000000000.;
|
||
|
|
||
|
warnx("%.3f s/loop, %.3f ms/page, %10.3f MiB/s\t"
|
||
|
"%4d succeed, %4d failed, %4d different pages",
|
||
|
s, s * 1000 / (len >> HPAGE_SHIFT), len / s / (1 << 20),
|
||
|
nr_succeed, nr_failed, nr_pages);
|
||
|
}
|
||
|
}
|