mirror of
https://github.com/torvalds/linux.git
synced 2024-12-31 23:31:29 +00:00
selftests/vm: add thp collapse file and tmpfs testing
Add memory operations for file-backed and tmpfs memory. Call existing tests with these new memory operations to test collapse functionality of khugepaged and MADV_COLLAPSE on file-backed and tmpfs memory. Not all tests are reusable; for example, collapse_swapin_single_pte() which checks swap usage. Refactor test arguments. Usage is now: Usage: ./khugepaged <test type> [dir] <test type> : <context>:<mem_type> <context> : [all|khugepaged|madvise] <mem_type> : [all|anon|file] "file,all" mem_type requires [dir] argument "file,all" mem_type requires kernel built with CONFIG_READ_ONLY_THP_FOR_FS=y if [dir] is a (sub)directory of a tmpfs mount, tmpfs must be mounted with huge=madvise option for khugepaged tests to work Refactor calling tests to make it clear what collapse context / memory operations they support, but only invoke tests requested by user. Also log what test is being ran, and with what context / memory, to make test logs more human readable. A new test file is created and deleted for every test to ensure no pages remain in the page cache between tests (tests also may attempt to collapse different amount of memory). For file-backed memory where the file is stored on a block device, disable /sys/block/<device>/queue/read_ahead_kb so that pages don't find their way into the page cache without the tests faulting them in. Add file and shmem wrappers to vm_utils check for file and shmem hugepages in smaps. [zokeefe@google.com: fix "add thp collapse file and tmpfs testing" for tmpfs] Link: https://lkml.kernel.org/r/20220913212517.3163701-1-zokeefe@google.com Link: https://lkml.kernel.org/r/20220907144521.3115321-8-zokeefe@google.com Link: https://lkml.kernel.org/r/20220922224046.1143204-8-zokeefe@google.com Signed-off-by: Zach O'Keefe <zokeefe@google.com> Cc: Axel Rasmussen <axelrasmussen@google.com> Cc: Chris Kennelly <ckennelly@google.com> Cc: David Hildenbrand <david@redhat.com> Cc: David Rientjes <rientjes@google.com> Cc: Hugh Dickins <hughd@google.com> Cc: James Houghton <jthoughton@google.com> Cc: "Kirill A. Shutemov" <kirill.shutemov@linux.intel.com> Cc: Matthew Wilcox <willy@infradead.org> Cc: Miaohe Lin <linmiaohe@huawei.com> Cc: Minchan Kim <minchan@kernel.org> Cc: Pasha Tatashin <pasha.tatashin@soleen.com> Cc: Peter Xu <peterx@redhat.com> Cc: Rongwei Wang <rongwei.wang@linux.alibaba.com> Cc: SeongJae Park <sj@kernel.org> Cc: Song Liu <songliubraving@fb.com> Cc: Vlastimil Babka <vbabka@suse.cz> Cc: Yang Shi <shy828301@gmail.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
This commit is contained in:
parent
8e638707a3
commit
1b03d0d558
@ -1,7 +1,9 @@
|
|||||||
#define _GNU_SOURCE
|
#define _GNU_SOURCE
|
||||||
|
#include <ctype.h>
|
||||||
#include <errno.h>
|
#include <errno.h>
|
||||||
#include <fcntl.h>
|
#include <fcntl.h>
|
||||||
#include <limits.h>
|
#include <limits.h>
|
||||||
|
#include <dirent.h>
|
||||||
#include <signal.h>
|
#include <signal.h>
|
||||||
#include <stdio.h>
|
#include <stdio.h>
|
||||||
#include <stdlib.h>
|
#include <stdlib.h>
|
||||||
@ -11,12 +13,21 @@
|
|||||||
|
|
||||||
#include <sys/mman.h>
|
#include <sys/mman.h>
|
||||||
#include <sys/wait.h>
|
#include <sys/wait.h>
|
||||||
|
#include <sys/types.h>
|
||||||
|
#include <sys/stat.h>
|
||||||
|
#include <sys/sysmacros.h>
|
||||||
|
#include <sys/vfs.h>
|
||||||
|
|
||||||
|
#include "linux/magic.h"
|
||||||
|
|
||||||
#include "vm_util.h"
|
#include "vm_util.h"
|
||||||
|
|
||||||
#ifndef MADV_PAGEOUT
|
#ifndef MADV_PAGEOUT
|
||||||
#define MADV_PAGEOUT 21
|
#define MADV_PAGEOUT 21
|
||||||
#endif
|
#endif
|
||||||
|
#ifndef MADV_POPULATE_READ
|
||||||
|
#define MADV_POPULATE_READ 22
|
||||||
|
#endif
|
||||||
#ifndef MADV_COLLAPSE
|
#ifndef MADV_COLLAPSE
|
||||||
#define MADV_COLLAPSE 25
|
#define MADV_COLLAPSE 25
|
||||||
#endif
|
#endif
|
||||||
@ -28,20 +39,47 @@ static int hpage_pmd_nr;
|
|||||||
|
|
||||||
#define THP_SYSFS "/sys/kernel/mm/transparent_hugepage/"
|
#define THP_SYSFS "/sys/kernel/mm/transparent_hugepage/"
|
||||||
#define PID_SMAPS "/proc/self/smaps"
|
#define PID_SMAPS "/proc/self/smaps"
|
||||||
|
#define TEST_FILE "collapse_test_file"
|
||||||
|
|
||||||
|
#define MAX_LINE_LENGTH 500
|
||||||
|
|
||||||
|
enum vma_type {
|
||||||
|
VMA_ANON,
|
||||||
|
VMA_FILE,
|
||||||
|
VMA_SHMEM,
|
||||||
|
};
|
||||||
|
|
||||||
struct mem_ops {
|
struct mem_ops {
|
||||||
void *(*setup_area)(int nr_hpages);
|
void *(*setup_area)(int nr_hpages);
|
||||||
void (*cleanup_area)(void *p, unsigned long size);
|
void (*cleanup_area)(void *p, unsigned long size);
|
||||||
void (*fault)(void *p, unsigned long start, unsigned long end);
|
void (*fault)(void *p, unsigned long start, unsigned long end);
|
||||||
bool (*check_huge)(void *addr, int nr_hpages);
|
bool (*check_huge)(void *addr, int nr_hpages);
|
||||||
|
const char *name;
|
||||||
};
|
};
|
||||||
|
|
||||||
|
static struct mem_ops *file_ops;
|
||||||
|
static struct mem_ops *anon_ops;
|
||||||
|
|
||||||
struct collapse_context {
|
struct collapse_context {
|
||||||
void (*collapse)(const char *msg, char *p, int nr_hpages,
|
void (*collapse)(const char *msg, char *p, int nr_hpages,
|
||||||
struct mem_ops *ops, bool expect);
|
struct mem_ops *ops, bool expect);
|
||||||
bool enforce_pte_scan_limits;
|
bool enforce_pte_scan_limits;
|
||||||
|
const char *name;
|
||||||
};
|
};
|
||||||
|
|
||||||
|
static struct collapse_context *khugepaged_context;
|
||||||
|
static struct collapse_context *madvise_context;
|
||||||
|
|
||||||
|
struct file_info {
|
||||||
|
const char *dir;
|
||||||
|
char path[PATH_MAX];
|
||||||
|
enum vma_type type;
|
||||||
|
int fd;
|
||||||
|
char dev_queue_read_ahead_path[PATH_MAX];
|
||||||
|
};
|
||||||
|
|
||||||
|
static struct file_info finfo;
|
||||||
|
|
||||||
enum thp_enabled {
|
enum thp_enabled {
|
||||||
THP_ALWAYS,
|
THP_ALWAYS,
|
||||||
THP_MADVISE,
|
THP_MADVISE,
|
||||||
@ -107,6 +145,7 @@ struct settings {
|
|||||||
enum shmem_enabled shmem_enabled;
|
enum shmem_enabled shmem_enabled;
|
||||||
bool use_zero_page;
|
bool use_zero_page;
|
||||||
struct khugepaged_settings khugepaged;
|
struct khugepaged_settings khugepaged;
|
||||||
|
unsigned long read_ahead_kb;
|
||||||
};
|
};
|
||||||
|
|
||||||
static struct settings saved_settings;
|
static struct settings saved_settings;
|
||||||
@ -125,6 +164,11 @@ static void fail(const char *msg)
|
|||||||
exit_status++;
|
exit_status++;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static void skip(const char *msg)
|
||||||
|
{
|
||||||
|
printf(" \e[33m%s\e[0m\n", msg);
|
||||||
|
}
|
||||||
|
|
||||||
static int read_file(const char *path, char *buf, size_t buflen)
|
static int read_file(const char *path, char *buf, size_t buflen)
|
||||||
{
|
{
|
||||||
int fd;
|
int fd;
|
||||||
@ -152,13 +196,19 @@ static int write_file(const char *path, const char *buf, size_t buflen)
|
|||||||
ssize_t numwritten;
|
ssize_t numwritten;
|
||||||
|
|
||||||
fd = open(path, O_WRONLY);
|
fd = open(path, O_WRONLY);
|
||||||
if (fd == -1)
|
if (fd == -1) {
|
||||||
|
printf("open(%s)\n", path);
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
return 0;
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
numwritten = write(fd, buf, buflen - 1);
|
numwritten = write(fd, buf, buflen - 1);
|
||||||
close(fd);
|
close(fd);
|
||||||
if (numwritten < 1)
|
if (numwritten < 1) {
|
||||||
|
printf("write(%s)\n", buf);
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
return 0;
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
return (unsigned int) numwritten;
|
return (unsigned int) numwritten;
|
||||||
}
|
}
|
||||||
@ -225,20 +275,11 @@ static void write_string(const char *name, const char *val)
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
static const unsigned long read_num(const char *name)
|
static const unsigned long _read_num(const char *path)
|
||||||
{
|
{
|
||||||
char path[PATH_MAX];
|
|
||||||
char buf[21];
|
char buf[21];
|
||||||
int ret;
|
|
||||||
|
|
||||||
ret = snprintf(path, PATH_MAX, THP_SYSFS "%s", name);
|
if (read_file(path, buf, sizeof(buf)) < 0) {
|
||||||
if (ret >= PATH_MAX) {
|
|
||||||
printf("%s: Pathname is too long\n", __func__);
|
|
||||||
exit(EXIT_FAILURE);
|
|
||||||
}
|
|
||||||
|
|
||||||
ret = read_file(path, buf, sizeof(buf));
|
|
||||||
if (ret < 0) {
|
|
||||||
perror("read_file(read_num)");
|
perror("read_file(read_num)");
|
||||||
exit(EXIT_FAILURE);
|
exit(EXIT_FAILURE);
|
||||||
}
|
}
|
||||||
@ -246,10 +287,9 @@ static const unsigned long read_num(const char *name)
|
|||||||
return strtoul(buf, NULL, 10);
|
return strtoul(buf, NULL, 10);
|
||||||
}
|
}
|
||||||
|
|
||||||
static void write_num(const char *name, unsigned long num)
|
static const unsigned long read_num(const char *name)
|
||||||
{
|
{
|
||||||
char path[PATH_MAX];
|
char path[PATH_MAX];
|
||||||
char buf[21];
|
|
||||||
int ret;
|
int ret;
|
||||||
|
|
||||||
ret = snprintf(path, PATH_MAX, THP_SYSFS "%s", name);
|
ret = snprintf(path, PATH_MAX, THP_SYSFS "%s", name);
|
||||||
@ -257,6 +297,12 @@ static void write_num(const char *name, unsigned long num)
|
|||||||
printf("%s: Pathname is too long\n", __func__);
|
printf("%s: Pathname is too long\n", __func__);
|
||||||
exit(EXIT_FAILURE);
|
exit(EXIT_FAILURE);
|
||||||
}
|
}
|
||||||
|
return _read_num(path);
|
||||||
|
}
|
||||||
|
|
||||||
|
static void _write_num(const char *path, unsigned long num)
|
||||||
|
{
|
||||||
|
char buf[21];
|
||||||
|
|
||||||
sprintf(buf, "%ld", num);
|
sprintf(buf, "%ld", num);
|
||||||
if (!write_file(path, buf, strlen(buf) + 1)) {
|
if (!write_file(path, buf, strlen(buf) + 1)) {
|
||||||
@ -265,6 +311,19 @@ static void write_num(const char *name, unsigned long num)
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static void write_num(const char *name, unsigned long num)
|
||||||
|
{
|
||||||
|
char path[PATH_MAX];
|
||||||
|
int ret;
|
||||||
|
|
||||||
|
ret = snprintf(path, PATH_MAX, THP_SYSFS "%s", name);
|
||||||
|
if (ret >= PATH_MAX) {
|
||||||
|
printf("%s: Pathname is too long\n", __func__);
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
_write_num(path, num);
|
||||||
|
}
|
||||||
|
|
||||||
static void write_settings(struct settings *settings)
|
static void write_settings(struct settings *settings)
|
||||||
{
|
{
|
||||||
struct khugepaged_settings *khugepaged = &settings->khugepaged;
|
struct khugepaged_settings *khugepaged = &settings->khugepaged;
|
||||||
@ -284,6 +343,10 @@ static void write_settings(struct settings *settings)
|
|||||||
write_num("khugepaged/max_ptes_swap", khugepaged->max_ptes_swap);
|
write_num("khugepaged/max_ptes_swap", khugepaged->max_ptes_swap);
|
||||||
write_num("khugepaged/max_ptes_shared", khugepaged->max_ptes_shared);
|
write_num("khugepaged/max_ptes_shared", khugepaged->max_ptes_shared);
|
||||||
write_num("khugepaged/pages_to_scan", khugepaged->pages_to_scan);
|
write_num("khugepaged/pages_to_scan", khugepaged->pages_to_scan);
|
||||||
|
|
||||||
|
if (file_ops && finfo.type == VMA_FILE)
|
||||||
|
_write_num(finfo.dev_queue_read_ahead_path,
|
||||||
|
settings->read_ahead_kb);
|
||||||
}
|
}
|
||||||
|
|
||||||
#define MAX_SETTINGS_DEPTH 4
|
#define MAX_SETTINGS_DEPTH 4
|
||||||
@ -354,6 +417,10 @@ static void save_settings(void)
|
|||||||
.max_ptes_shared = read_num("khugepaged/max_ptes_shared"),
|
.max_ptes_shared = read_num("khugepaged/max_ptes_shared"),
|
||||||
.pages_to_scan = read_num("khugepaged/pages_to_scan"),
|
.pages_to_scan = read_num("khugepaged/pages_to_scan"),
|
||||||
};
|
};
|
||||||
|
if (file_ops && finfo.type == VMA_FILE)
|
||||||
|
saved_settings.read_ahead_kb =
|
||||||
|
_read_num(finfo.dev_queue_read_ahead_path);
|
||||||
|
|
||||||
success("OK");
|
success("OK");
|
||||||
|
|
||||||
signal(SIGTERM, restore_settings);
|
signal(SIGTERM, restore_settings);
|
||||||
@ -362,7 +429,90 @@ static void save_settings(void)
|
|||||||
signal(SIGQUIT, restore_settings);
|
signal(SIGQUIT, restore_settings);
|
||||||
}
|
}
|
||||||
|
|
||||||
#define MAX_LINE_LENGTH 500
|
static void get_finfo(const char *dir)
|
||||||
|
{
|
||||||
|
struct stat path_stat;
|
||||||
|
struct statfs fs;
|
||||||
|
char buf[1 << 10];
|
||||||
|
char path[PATH_MAX];
|
||||||
|
char *str, *end;
|
||||||
|
|
||||||
|
finfo.dir = dir;
|
||||||
|
stat(finfo.dir, &path_stat);
|
||||||
|
if (!S_ISDIR(path_stat.st_mode)) {
|
||||||
|
printf("%s: Not a directory (%s)\n", __func__, finfo.dir);
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
if (snprintf(finfo.path, sizeof(finfo.path), "%s/" TEST_FILE,
|
||||||
|
finfo.dir) >= sizeof(finfo.path)) {
|
||||||
|
printf("%s: Pathname is too long\n", __func__);
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
if (statfs(finfo.dir, &fs)) {
|
||||||
|
perror("statfs()");
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
finfo.type = fs.f_type == TMPFS_MAGIC ? VMA_SHMEM : VMA_FILE;
|
||||||
|
if (finfo.type == VMA_SHMEM)
|
||||||
|
return;
|
||||||
|
|
||||||
|
/* Find owning device's queue/read_ahead_kb control */
|
||||||
|
if (snprintf(path, sizeof(path), "/sys/dev/block/%d:%d/uevent",
|
||||||
|
major(path_stat.st_dev), minor(path_stat.st_dev))
|
||||||
|
>= sizeof(path)) {
|
||||||
|
printf("%s: Pathname is too long\n", __func__);
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
if (read_file(path, buf, sizeof(buf)) < 0) {
|
||||||
|
perror("read_file(read_num)");
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
if (strstr(buf, "DEVTYPE=disk")) {
|
||||||
|
/* Found it */
|
||||||
|
if (snprintf(finfo.dev_queue_read_ahead_path,
|
||||||
|
sizeof(finfo.dev_queue_read_ahead_path),
|
||||||
|
"/sys/dev/block/%d:%d/queue/read_ahead_kb",
|
||||||
|
major(path_stat.st_dev), minor(path_stat.st_dev))
|
||||||
|
>= sizeof(finfo.dev_queue_read_ahead_path)) {
|
||||||
|
printf("%s: Pathname is too long\n", __func__);
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
if (!strstr(buf, "DEVTYPE=partition")) {
|
||||||
|
printf("%s: Unknown device type: %s\n", __func__, path);
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
/*
|
||||||
|
* Partition of block device - need to find actual device.
|
||||||
|
* Using naming convention that devnameN is partition of
|
||||||
|
* device devname.
|
||||||
|
*/
|
||||||
|
str = strstr(buf, "DEVNAME=");
|
||||||
|
if (!str) {
|
||||||
|
printf("%s: Could not read: %s", __func__, path);
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
str += 8;
|
||||||
|
end = str;
|
||||||
|
while (*end) {
|
||||||
|
if (isdigit(*end)) {
|
||||||
|
*end = '\0';
|
||||||
|
if (snprintf(finfo.dev_queue_read_ahead_path,
|
||||||
|
sizeof(finfo.dev_queue_read_ahead_path),
|
||||||
|
"/sys/block/%s/queue/read_ahead_kb",
|
||||||
|
str) >= sizeof(finfo.dev_queue_read_ahead_path)) {
|
||||||
|
printf("%s: Pathname is too long\n", __func__);
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
++end;
|
||||||
|
}
|
||||||
|
printf("%s: Could not read: %s\n", __func__, path);
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
|
||||||
static bool check_swap(void *addr, unsigned long size)
|
static bool check_swap(void *addr, unsigned long size)
|
||||||
{
|
{
|
||||||
bool swap = false;
|
bool swap = false;
|
||||||
@ -518,11 +668,91 @@ static bool anon_check_huge(void *addr, int nr_hpages)
|
|||||||
return check_huge_anon(addr, nr_hpages, hpage_pmd_size);
|
return check_huge_anon(addr, nr_hpages, hpage_pmd_size);
|
||||||
}
|
}
|
||||||
|
|
||||||
static struct mem_ops anon_ops = {
|
static void *file_setup_area(int nr_hpages)
|
||||||
|
{
|
||||||
|
int fd;
|
||||||
|
void *p;
|
||||||
|
unsigned long size;
|
||||||
|
|
||||||
|
unlink(finfo.path); /* Cleanup from previous failed tests */
|
||||||
|
printf("Creating %s for collapse%s...", finfo.path,
|
||||||
|
finfo.type == VMA_SHMEM ? " (tmpfs)" : "");
|
||||||
|
fd = open(finfo.path, O_DSYNC | O_CREAT | O_RDWR | O_TRUNC | O_EXCL,
|
||||||
|
777);
|
||||||
|
if (fd < 0) {
|
||||||
|
perror("open()");
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
|
||||||
|
size = nr_hpages * hpage_pmd_size;
|
||||||
|
p = alloc_mapping(nr_hpages);
|
||||||
|
fill_memory(p, 0, size);
|
||||||
|
write(fd, p, size);
|
||||||
|
close(fd);
|
||||||
|
munmap(p, size);
|
||||||
|
success("OK");
|
||||||
|
|
||||||
|
printf("Opening %s read only for collapse...", finfo.path);
|
||||||
|
finfo.fd = open(finfo.path, O_RDONLY, 777);
|
||||||
|
if (finfo.fd < 0) {
|
||||||
|
perror("open()");
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
p = mmap(BASE_ADDR, size, PROT_READ | PROT_EXEC,
|
||||||
|
MAP_PRIVATE, finfo.fd, 0);
|
||||||
|
if (p == MAP_FAILED || p != BASE_ADDR) {
|
||||||
|
perror("mmap()");
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Drop page cache */
|
||||||
|
write_file("/proc/sys/vm/drop_caches", "3", 2);
|
||||||
|
success("OK");
|
||||||
|
return p;
|
||||||
|
}
|
||||||
|
|
||||||
|
static void file_cleanup_area(void *p, unsigned long size)
|
||||||
|
{
|
||||||
|
munmap(p, size);
|
||||||
|
close(finfo.fd);
|
||||||
|
unlink(finfo.path);
|
||||||
|
}
|
||||||
|
|
||||||
|
static void file_fault(void *p, unsigned long start, unsigned long end)
|
||||||
|
{
|
||||||
|
if (madvise(((char *)p) + start, end - start, MADV_POPULATE_READ)) {
|
||||||
|
perror("madvise(MADV_POPULATE_READ");
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
static bool file_check_huge(void *addr, int nr_hpages)
|
||||||
|
{
|
||||||
|
switch (finfo.type) {
|
||||||
|
case VMA_FILE:
|
||||||
|
return check_huge_file(addr, nr_hpages, hpage_pmd_size);
|
||||||
|
case VMA_SHMEM:
|
||||||
|
return check_huge_shmem(addr, nr_hpages, hpage_pmd_size);
|
||||||
|
default:
|
||||||
|
exit(EXIT_FAILURE);
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
static struct mem_ops __anon_ops = {
|
||||||
.setup_area = &anon_setup_area,
|
.setup_area = &anon_setup_area,
|
||||||
.cleanup_area = &anon_cleanup_area,
|
.cleanup_area = &anon_cleanup_area,
|
||||||
.fault = &anon_fault,
|
.fault = &anon_fault,
|
||||||
.check_huge = &anon_check_huge,
|
.check_huge = &anon_check_huge,
|
||||||
|
.name = "anon",
|
||||||
|
};
|
||||||
|
|
||||||
|
static struct mem_ops __file_ops = {
|
||||||
|
.setup_area = &file_setup_area,
|
||||||
|
.cleanup_area = &file_cleanup_area,
|
||||||
|
.fault = &file_fault,
|
||||||
|
.check_huge = &file_check_huge,
|
||||||
|
.name = "file",
|
||||||
};
|
};
|
||||||
|
|
||||||
static void __madvise_collapse(const char *msg, char *p, int nr_hpages,
|
static void __madvise_collapse(const char *msg, char *p, int nr_hpages,
|
||||||
@ -538,6 +768,7 @@ static void __madvise_collapse(const char *msg, char *p, int nr_hpages,
|
|||||||
* ignores /sys/kernel/mm/transparent_hugepage/enabled
|
* ignores /sys/kernel/mm/transparent_hugepage/enabled
|
||||||
*/
|
*/
|
||||||
settings.thp_enabled = THP_NEVER;
|
settings.thp_enabled = THP_NEVER;
|
||||||
|
settings.shmem_enabled = SHMEM_NEVER;
|
||||||
push_settings(&settings);
|
push_settings(&settings);
|
||||||
|
|
||||||
/* Clear VM_NOHUGEPAGE */
|
/* Clear VM_NOHUGEPAGE */
|
||||||
@ -608,12 +839,37 @@ static void khugepaged_collapse(const char *msg, char *p, int nr_hpages,
|
|||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* For file and shmem memory, khugepaged only retracts pte entries after
|
||||||
|
* putting the new hugepage in the page cache. The hugepage must be
|
||||||
|
* subsequently refaulted to install the pmd mapping for the mm.
|
||||||
|
*/
|
||||||
|
if (ops != &__anon_ops)
|
||||||
|
ops->fault(p, 0, nr_hpages * hpage_pmd_size);
|
||||||
|
|
||||||
if (ops->check_huge(p, expect ? nr_hpages : 0))
|
if (ops->check_huge(p, expect ? nr_hpages : 0))
|
||||||
success("OK");
|
success("OK");
|
||||||
else
|
else
|
||||||
fail("Fail");
|
fail("Fail");
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static struct collapse_context __khugepaged_context = {
|
||||||
|
.collapse = &khugepaged_collapse,
|
||||||
|
.enforce_pte_scan_limits = true,
|
||||||
|
.name = "khugepaged",
|
||||||
|
};
|
||||||
|
|
||||||
|
static struct collapse_context __madvise_context = {
|
||||||
|
.collapse = &madvise_collapse,
|
||||||
|
.enforce_pte_scan_limits = false,
|
||||||
|
.name = "madvise",
|
||||||
|
};
|
||||||
|
|
||||||
|
static bool is_tmpfs(struct mem_ops *ops)
|
||||||
|
{
|
||||||
|
return ops == &__file_ops && finfo.type == VMA_SHMEM;
|
||||||
|
}
|
||||||
|
|
||||||
static void alloc_at_fault(void)
|
static void alloc_at_fault(void)
|
||||||
{
|
{
|
||||||
struct settings settings = *current_settings();
|
struct settings settings = *current_settings();
|
||||||
@ -686,6 +942,13 @@ static void collapse_max_ptes_none(struct collapse_context *c, struct mem_ops *o
|
|||||||
|
|
||||||
p = ops->setup_area(1);
|
p = ops->setup_area(1);
|
||||||
|
|
||||||
|
if (is_tmpfs(ops)) {
|
||||||
|
/* shmem pages always in the page cache */
|
||||||
|
printf("tmpfs...");
|
||||||
|
skip("Skip");
|
||||||
|
goto skip;
|
||||||
|
}
|
||||||
|
|
||||||
ops->fault(p, 0, (hpage_pmd_nr - max_ptes_none - 1) * page_size);
|
ops->fault(p, 0, (hpage_pmd_nr - max_ptes_none - 1) * page_size);
|
||||||
c->collapse("Maybe collapse with max_ptes_none exceeded", p, 1,
|
c->collapse("Maybe collapse with max_ptes_none exceeded", p, 1,
|
||||||
ops, !c->enforce_pte_scan_limits);
|
ops, !c->enforce_pte_scan_limits);
|
||||||
@ -698,6 +961,7 @@ static void collapse_max_ptes_none(struct collapse_context *c, struct mem_ops *o
|
|||||||
validate_memory(p, 0,
|
validate_memory(p, 0,
|
||||||
(hpage_pmd_nr - max_ptes_none) * page_size);
|
(hpage_pmd_nr - max_ptes_none) * page_size);
|
||||||
}
|
}
|
||||||
|
skip:
|
||||||
ops->cleanup_area(p, hpage_pmd_size);
|
ops->cleanup_area(p, hpage_pmd_size);
|
||||||
pop_settings();
|
pop_settings();
|
||||||
}
|
}
|
||||||
@ -781,6 +1045,13 @@ static void collapse_single_pte_entry_compound(struct collapse_context *c, struc
|
|||||||
|
|
||||||
p = alloc_hpage(ops);
|
p = alloc_hpage(ops);
|
||||||
|
|
||||||
|
if (is_tmpfs(ops)) {
|
||||||
|
/* MADV_DONTNEED won't evict tmpfs pages */
|
||||||
|
printf("tmpfs...");
|
||||||
|
skip("Skip");
|
||||||
|
goto skip;
|
||||||
|
}
|
||||||
|
|
||||||
madvise(p, hpage_pmd_size, MADV_NOHUGEPAGE);
|
madvise(p, hpage_pmd_size, MADV_NOHUGEPAGE);
|
||||||
printf("Split huge page leaving single PTE mapping compound page...");
|
printf("Split huge page leaving single PTE mapping compound page...");
|
||||||
madvise(p + page_size, hpage_pmd_size - page_size, MADV_DONTNEED);
|
madvise(p + page_size, hpage_pmd_size - page_size, MADV_DONTNEED);
|
||||||
@ -792,6 +1063,7 @@ static void collapse_single_pte_entry_compound(struct collapse_context *c, struc
|
|||||||
c->collapse("Collapse PTE table with single PTE mapping compound page",
|
c->collapse("Collapse PTE table with single PTE mapping compound page",
|
||||||
p, 1, ops, true);
|
p, 1, ops, true);
|
||||||
validate_memory(p, 0, page_size);
|
validate_memory(p, 0, page_size);
|
||||||
|
skip:
|
||||||
ops->cleanup_area(p, hpage_pmd_size);
|
ops->cleanup_area(p, hpage_pmd_size);
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -1038,9 +1310,70 @@ static void madvise_collapse_existing_thps(struct collapse_context *c,
|
|||||||
ops->cleanup_area(p, hpage_pmd_size);
|
ops->cleanup_area(p, hpage_pmd_size);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static void usage(void)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "\nUsage: ./khugepaged <test type> [dir]\n\n");
|
||||||
|
fprintf(stderr, "\t<test type>\t: <context>:<mem_type>\n");
|
||||||
|
fprintf(stderr, "\t<context>\t: [all|khugepaged|madvise]\n");
|
||||||
|
fprintf(stderr, "\t<mem_type>\t: [all|anon|file]\n");
|
||||||
|
fprintf(stderr, "\n\t\"file,all\" mem_type requires [dir] argument\n");
|
||||||
|
fprintf(stderr, "\n\t\"file,all\" mem_type requires kernel built with\n");
|
||||||
|
fprintf(stderr, "\tCONFIG_READ_ONLY_THP_FOR_FS=y\n");
|
||||||
|
fprintf(stderr, "\n\tif [dir] is a (sub)directory of a tmpfs mount, tmpfs must be\n");
|
||||||
|
fprintf(stderr, "\tmounted with huge=madvise option for khugepaged tests to work\n");
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
|
||||||
|
static void parse_test_type(int argc, const char **argv)
|
||||||
|
{
|
||||||
|
char *buf;
|
||||||
|
const char *token;
|
||||||
|
|
||||||
|
if (argc == 1) {
|
||||||
|
/* Backwards compatibility */
|
||||||
|
khugepaged_context = &__khugepaged_context;
|
||||||
|
madvise_context = &__madvise_context;
|
||||||
|
anon_ops = &__anon_ops;
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
buf = strdup(argv[1]);
|
||||||
|
token = strsep(&buf, ":");
|
||||||
|
|
||||||
|
if (!strcmp(token, "all")) {
|
||||||
|
khugepaged_context = &__khugepaged_context;
|
||||||
|
madvise_context = &__madvise_context;
|
||||||
|
} else if (!strcmp(token, "khugepaged")) {
|
||||||
|
khugepaged_context = &__khugepaged_context;
|
||||||
|
} else if (!strcmp(token, "madvise")) {
|
||||||
|
madvise_context = &__madvise_context;
|
||||||
|
} else {
|
||||||
|
usage();
|
||||||
|
}
|
||||||
|
|
||||||
|
if (!buf)
|
||||||
|
usage();
|
||||||
|
|
||||||
|
if (!strcmp(buf, "all")) {
|
||||||
|
file_ops = &__file_ops;
|
||||||
|
anon_ops = &__anon_ops;
|
||||||
|
} else if (!strcmp(buf, "anon")) {
|
||||||
|
anon_ops = &__anon_ops;
|
||||||
|
} else if (!strcmp(buf, "file")) {
|
||||||
|
file_ops = &__file_ops;
|
||||||
|
} else {
|
||||||
|
usage();
|
||||||
|
}
|
||||||
|
|
||||||
|
if (!file_ops)
|
||||||
|
return;
|
||||||
|
|
||||||
|
if (argc != 3)
|
||||||
|
usage();
|
||||||
|
}
|
||||||
|
|
||||||
int main(int argc, const char **argv)
|
int main(int argc, const char **argv)
|
||||||
{
|
{
|
||||||
struct collapse_context c;
|
|
||||||
struct settings default_settings = {
|
struct settings default_settings = {
|
||||||
.thp_enabled = THP_MADVISE,
|
.thp_enabled = THP_MADVISE,
|
||||||
.thp_defrag = THP_DEFRAG_ALWAYS,
|
.thp_defrag = THP_DEFRAG_ALWAYS,
|
||||||
@ -1051,8 +1384,20 @@ int main(int argc, const char **argv)
|
|||||||
.alloc_sleep_millisecs = 10,
|
.alloc_sleep_millisecs = 10,
|
||||||
.scan_sleep_millisecs = 10,
|
.scan_sleep_millisecs = 10,
|
||||||
},
|
},
|
||||||
|
/*
|
||||||
|
* When testing file-backed memory, the collapse path
|
||||||
|
* looks at how many pages are found in the page cache, not
|
||||||
|
* what pages are mapped. Disable read ahead optimization so
|
||||||
|
* pages don't find their way into the page cache unless
|
||||||
|
* we mem_ops->fault() them in.
|
||||||
|
*/
|
||||||
|
.read_ahead_kb = 0,
|
||||||
};
|
};
|
||||||
const char *tests = argc == 1 ? "all" : argv[1];
|
|
||||||
|
parse_test_type(argc, argv);
|
||||||
|
|
||||||
|
if (file_ops)
|
||||||
|
get_finfo(argv[2]);
|
||||||
|
|
||||||
setbuf(stdout, NULL);
|
setbuf(stdout, NULL);
|
||||||
|
|
||||||
@ -1070,43 +1415,61 @@ int main(int argc, const char **argv)
|
|||||||
|
|
||||||
alloc_at_fault();
|
alloc_at_fault();
|
||||||
|
|
||||||
if (!strcmp(tests, "khugepaged") || !strcmp(tests, "all")) {
|
#define TEST(t, c, o) do { \
|
||||||
printf("\n*** Testing context: khugepaged ***\n");
|
if (c && o) { \
|
||||||
c.collapse = &khugepaged_collapse;
|
printf("\nRun test: " #t " (%s:%s)\n", c->name, o->name); \
|
||||||
c.enforce_pte_scan_limits = true;
|
t(c, o); \
|
||||||
|
} \
|
||||||
|
} while (0)
|
||||||
|
|
||||||
collapse_full(&c, &anon_ops);
|
TEST(collapse_full, khugepaged_context, anon_ops);
|
||||||
collapse_empty(&c, &anon_ops);
|
TEST(collapse_full, khugepaged_context, file_ops);
|
||||||
collapse_single_pte_entry(&c, &anon_ops);
|
TEST(collapse_full, madvise_context, anon_ops);
|
||||||
collapse_max_ptes_none(&c, &anon_ops);
|
TEST(collapse_full, madvise_context, file_ops);
|
||||||
collapse_swapin_single_pte(&c, &anon_ops);
|
|
||||||
collapse_max_ptes_swap(&c, &anon_ops);
|
|
||||||
collapse_single_pte_entry_compound(&c, &anon_ops);
|
|
||||||
collapse_full_of_compound(&c, &anon_ops);
|
|
||||||
collapse_compound_extreme(&c, &anon_ops);
|
|
||||||
collapse_fork(&c, &anon_ops);
|
|
||||||
collapse_fork_compound(&c, &anon_ops);
|
|
||||||
collapse_max_ptes_shared(&c, &anon_ops);
|
|
||||||
}
|
|
||||||
if (!strcmp(tests, "madvise") || !strcmp(tests, "all")) {
|
|
||||||
printf("\n*** Testing context: madvise ***\n");
|
|
||||||
c.collapse = &madvise_collapse;
|
|
||||||
c.enforce_pte_scan_limits = false;
|
|
||||||
|
|
||||||
collapse_full(&c, &anon_ops);
|
TEST(collapse_empty, khugepaged_context, anon_ops);
|
||||||
collapse_empty(&c, &anon_ops);
|
TEST(collapse_empty, madvise_context, anon_ops);
|
||||||
collapse_single_pte_entry(&c, &anon_ops);
|
|
||||||
collapse_max_ptes_none(&c, &anon_ops);
|
TEST(collapse_single_pte_entry, khugepaged_context, anon_ops);
|
||||||
collapse_swapin_single_pte(&c, &anon_ops);
|
TEST(collapse_single_pte_entry, khugepaged_context, file_ops);
|
||||||
collapse_max_ptes_swap(&c, &anon_ops);
|
TEST(collapse_single_pte_entry, madvise_context, anon_ops);
|
||||||
collapse_single_pte_entry_compound(&c, &anon_ops);
|
TEST(collapse_single_pte_entry, madvise_context, file_ops);
|
||||||
collapse_full_of_compound(&c, &anon_ops);
|
|
||||||
collapse_compound_extreme(&c, &anon_ops);
|
TEST(collapse_max_ptes_none, khugepaged_context, anon_ops);
|
||||||
collapse_fork(&c, &anon_ops);
|
TEST(collapse_max_ptes_none, khugepaged_context, file_ops);
|
||||||
collapse_fork_compound(&c, &anon_ops);
|
TEST(collapse_max_ptes_none, madvise_context, anon_ops);
|
||||||
collapse_max_ptes_shared(&c, &anon_ops);
|
TEST(collapse_max_ptes_none, madvise_context, file_ops);
|
||||||
madvise_collapse_existing_thps(&c, &anon_ops);
|
|
||||||
}
|
TEST(collapse_single_pte_entry_compound, khugepaged_context, anon_ops);
|
||||||
|
TEST(collapse_single_pte_entry_compound, khugepaged_context, file_ops);
|
||||||
|
TEST(collapse_single_pte_entry_compound, madvise_context, anon_ops);
|
||||||
|
TEST(collapse_single_pte_entry_compound, madvise_context, file_ops);
|
||||||
|
|
||||||
|
TEST(collapse_full_of_compound, khugepaged_context, anon_ops);
|
||||||
|
TEST(collapse_full_of_compound, khugepaged_context, file_ops);
|
||||||
|
TEST(collapse_full_of_compound, madvise_context, anon_ops);
|
||||||
|
TEST(collapse_full_of_compound, madvise_context, file_ops);
|
||||||
|
|
||||||
|
TEST(collapse_compound_extreme, khugepaged_context, anon_ops);
|
||||||
|
TEST(collapse_compound_extreme, madvise_context, anon_ops);
|
||||||
|
|
||||||
|
TEST(collapse_swapin_single_pte, khugepaged_context, anon_ops);
|
||||||
|
TEST(collapse_swapin_single_pte, madvise_context, anon_ops);
|
||||||
|
|
||||||
|
TEST(collapse_max_ptes_swap, khugepaged_context, anon_ops);
|
||||||
|
TEST(collapse_max_ptes_swap, madvise_context, anon_ops);
|
||||||
|
|
||||||
|
TEST(collapse_fork, khugepaged_context, anon_ops);
|
||||||
|
TEST(collapse_fork, madvise_context, anon_ops);
|
||||||
|
|
||||||
|
TEST(collapse_fork_compound, khugepaged_context, anon_ops);
|
||||||
|
TEST(collapse_fork_compound, madvise_context, anon_ops);
|
||||||
|
|
||||||
|
TEST(collapse_max_ptes_shared, khugepaged_context, anon_ops);
|
||||||
|
TEST(collapse_max_ptes_shared, madvise_context, anon_ops);
|
||||||
|
|
||||||
|
TEST(madvise_collapse_existing_thps, madvise_context, anon_ops);
|
||||||
|
TEST(madvise_collapse_existing_thps, madvise_context, file_ops);
|
||||||
|
|
||||||
restore_settings(0);
|
restore_settings(0);
|
||||||
}
|
}
|
||||||
|
@ -114,3 +114,13 @@ bool check_huge_anon(void *addr, int nr_hpages, uint64_t hpage_size)
|
|||||||
{
|
{
|
||||||
return __check_huge(addr, "AnonHugePages: ", nr_hpages, hpage_size);
|
return __check_huge(addr, "AnonHugePages: ", nr_hpages, hpage_size);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool check_huge_file(void *addr, int nr_hpages, uint64_t hpage_size)
|
||||||
|
{
|
||||||
|
return __check_huge(addr, "FilePmdMapped:", nr_hpages, hpage_size);
|
||||||
|
}
|
||||||
|
|
||||||
|
bool check_huge_shmem(void *addr, int nr_hpages, uint64_t hpage_size)
|
||||||
|
{
|
||||||
|
return __check_huge(addr, "ShmemPmdMapped:", nr_hpages, hpage_size);
|
||||||
|
}
|
||||||
|
@ -8,3 +8,5 @@ void clear_softdirty(void);
|
|||||||
bool check_for_pattern(FILE *fp, const char *pattern, char *buf, size_t len);
|
bool check_for_pattern(FILE *fp, const char *pattern, char *buf, size_t len);
|
||||||
uint64_t read_pmd_pagesize(void);
|
uint64_t read_pmd_pagesize(void);
|
||||||
bool check_huge_anon(void *addr, int nr_hpages, uint64_t hpage_size);
|
bool check_huge_anon(void *addr, int nr_hpages, uint64_t hpage_size);
|
||||||
|
bool check_huge_file(void *addr, int nr_hpages, uint64_t hpage_size);
|
||||||
|
bool check_huge_shmem(void *addr, int nr_hpages, uint64_t hpage_size);
|
||||||
|
Loading…
Reference in New Issue
Block a user