[RFC 2/2] selftests/powerpc: Add tests for various hash page fault paths

Anshuman Khandual khandual at linux.vnet.ibm.com
Wed Feb 17 18:00:33 AEDT 2016


This new test case tries to create virtual memory scenarios that
drive different types of hash page faults. It also uses the perf
API to capture the number of times it went through the intended
hash fault paths.

Signed-off-by: Anshuman Khandual <khandual at linux.vnet.ibm.com>
---
The test output currently looks like this. The objective is to automatically
verify the counts of these traces for the various buffer sizes and scenarios
created.

vm.nr_hugepages = 10
HugeTLB allocation::::::::
[              faults]:          1
[        major-faults]:          0
[        minor-faults]:          1
[         hash_faults]:          2
[     hash_faults_thp]:          0
[     hash_faults_64K]:          0
[      hash_faults_4K]:          0
[ hash_faults_hugetlb]:          1
THP allocation::::::::
[              faults]:          256
[        major-faults]:          0
[        minor-faults]:          256
[         hash_faults]:          256
[     hash_faults_thp]:          0
[     hash_faults_64K]:          256
[      hash_faults_4K]:          0
[ hash_faults_hugetlb]:          0
SUBPAGE protection::::
[              faults]:          0
[        major-faults]:          0
[        minor-faults]:          0
[         hash_faults]:          4096
[     hash_faults_thp]:          0
[     hash_faults_64K]:          0
[      hash_faults_4K]:          4096
[ hash_faults_hugetlb]:          0
PFN flush::::::::::::
[              faults]:          256
[        major-faults]:          0
[        minor-faults]:          256
[         hash_faults]:          4352
[     hash_faults_thp]:          0
[     hash_faults_64K]:          0
[      hash_faults_4K]:          4096
[ hash_faults_hugetlb]:          0
vm.nr_hugepages = 0

THP allocation is not happening on an otherwise idle system even after a call
to madvise(MADV_HUGEPAGE). The problem seems to be related to the NUMA memory
configuration, which I will debug further.

 tools/testing/selftests/powerpc/mm/Makefile     |   2 +-
 tools/testing/selftests/powerpc/mm/mem_perf.c   | 198 ++++++++++++++++++++++++
 tools/testing/selftests/powerpc/mm/run_mem_perf |   3 +
 3 files changed, 202 insertions(+), 1 deletion(-)
 create mode 100644 tools/testing/selftests/powerpc/mm/mem_perf.c
 create mode 100755 tools/testing/selftests/powerpc/mm/run_mem_perf

diff --git a/tools/testing/selftests/powerpc/mm/Makefile b/tools/testing/selftests/powerpc/mm/Makefile
index ee179e2..13bc5c3 100644
--- a/tools/testing/selftests/powerpc/mm/Makefile
+++ b/tools/testing/selftests/powerpc/mm/Makefile
@@ -1,7 +1,7 @@
 noarg:
 	$(MAKE) -C ../
 
-TEST_PROGS := hugetlb_vs_thp_test subpage_prot
+TEST_PROGS := hugetlb_vs_thp_test subpage_prot mem_perf
 TEST_FILES := tempfile
 
 all: $(TEST_PROGS) $(TEST_FILES)
diff --git a/tools/testing/selftests/powerpc/mm/mem_perf.c b/tools/testing/selftests/powerpc/mm/mem_perf.c
new file mode 100644
index 0000000..f5d8348
--- /dev/null
+++ b/tools/testing/selftests/powerpc/mm/mem_perf.c
@@ -0,0 +1,198 @@
+/*
+ * Copyright 2016, Anshuman Khandual, IBM Corp.
+ * Licensed under GPLv2.
+ */
+
+#include <unistd.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <sys/mman.h>
+
+#include "../pmu/event.c"
+
+#define ADDR_INPUT	0xa0000000000UL
+#define HPAGE_SIZE	0x1000000
+#define PSIZE_64K	0x10000
+#define PSIZE_4K	0x1000
+
+#define MAX_MM_EVENTS	8
+
+struct event mm_events[MAX_MM_EVENTS];
+/* Initialise @e as a disabled PERF_TYPE_SOFTWARE event with kernel, hv and idle excluded. */
+static void setup_event(struct event *e, u64 config, char *name)
+{
+	event_init_opts(e, config, PERF_TYPE_SOFTWARE, name);
+	e->attr.disabled = 1;
+	e->attr.exclude_kernel = 1;
+	e->attr.exclude_hv = 1;
+	e->attr.exclude_idle = 1;
+}
+/* Initialise @e from scratch as a disabled PERF_TYPE_TRACEPOINT event; @config goes into attr.config. */
+static void setup_event_tr(struct event *e, u64 config, char *name)
+{
+	memset(e, 0, sizeof(*e));
+	/* NOTE(review): sample_period is assigned a PERF_SAMPLE_* flag further down - confirm intent */
+	e->name = name;
+	e->attr.type = PERF_TYPE_TRACEPOINT;
+	e->attr.config = config;
+	e->attr.size = sizeof(e->attr);
+	e->attr.sample_period = PERF_SAMPLE_IDENTIFIER;
+	e->attr.inherit = 1;
+	e->attr.enable_on_exec = 1;
+	e->attr.exclude_guest = 1;
+
+	/* This has to match the structure layout in the header */
+	e->attr.read_format = PERF_FORMAT_TOTAL_TIME_ENABLED | \
+				PERF_FORMAT_TOTAL_TIME_RUNNING;
+	e->attr.disabled = 1;
+}
+
+/* Reset every event in mm_events[] and then enable them all; main() calls this before each memset(). */
+static void prepare_events(void)
+{
+	int i;
+
+	for (i = 0; i < MAX_MM_EVENTS; i++)
+		event_reset(&mm_events[i]);
+
+	for (i = 0; i < MAX_MM_EVENTS; i++)
+		event_enable(&mm_events[i]);
+}
+/* Close every event in mm_events[]. */
+static void close_events(void)
+{
+	int i;
+
+	for (i = 0; i < MAX_MM_EVENTS; i++)
+		event_close(&mm_events[i]);
+}
+/* Disable and read every event in mm_events[], then print one "[name]: value" line for each. */
+static void display_events(void)
+{
+	int i;
+
+	for (i = 0; i < MAX_MM_EVENTS; i++)
+		event_disable(&mm_events[i]);
+
+	for (i = 0; i < MAX_MM_EVENTS; i++)
+		event_read(&mm_events[i]);
+
+	for (i = 0; i < MAX_MM_EVENTS; i++)
+		printf("[%20s]: \t %llu\n", mm_events[i].name, mm_events[i].result.value);
+}
+/* Fill mm_events[]: slots 0-2 are software page fault counters, slots 3-7 are tracepoint events. */
+static void setup_events(void)
+{
+	setup_event(&mm_events[0], PERF_COUNT_SW_PAGE_FAULTS, "faults");
+	setup_event(&mm_events[1], PERF_COUNT_SW_PAGE_FAULTS_MAJ, "major-faults");
+	setup_event(&mm_events[2], PERF_COUNT_SW_PAGE_FAULTS_MIN, "minor-faults");
+	/* NOTE(review): 18-22 are hard-coded tracepoint ids; presumably they differ per kernel - verify */
+	setup_event_tr(&mm_events[3], 22 , "hash_faults");
+	setup_event_tr(&mm_events[4], 20 , "hash_faults_thp");
+	setup_event_tr(&mm_events[5], 19 , "hash_faults_64K");
+	setup_event_tr(&mm_events[6], 18 , "hash_faults_4K");
+	setup_event_tr(&mm_events[7], 21 , "hash_faults_hugetlb");
+}
+/* Open every event in mm_events[]; a failure is reported with perror() but is not fatal. */
+static void open_events(void)
+{
+	int i;
+
+	for (i = 0; i < MAX_MM_EVENTS; i++) {
+		if (event_open(&mm_events[i]))
+			perror("event_open() failed");
+	}
+}
+/* Hand an all-zero subpage protection map for [ptr, ptr + size) to subpage_prot(); exit on failure. */
+static void subpage_prot_change(char *ptr, unsigned long size)
+{
+	unsigned long npages = size / PSIZE_64K;
+	unsigned int *map;
+	long err;
+
+	/* One map word per 64K page; calloc() zeroes them and checks the size for overflow */
+	map = calloc(npages, sizeof(*map));
+	if (!map)  {
+		perror("calloc() failed");
+		exit(-1);
+	}
+
+	err = syscall(__NR_subpage_prot, ptr, size, map);
+	if (err) {
+		perror("subpage() protection failed");
+		exit(-1);
+	}
+
+	free(map);	/* not used again once the syscall has returned */
+}
+/* Call madvise(MADV_DONTNEED) on [ptr, ptr + size) and exit if it fails. */
+static void dont_need_request(char *ptr, unsigned long size)
+{
+	if (madvise(ptr, size, MADV_DONTNEED)){
+		perror("madvise");
+		exit(-1);
+	}
+}
+/* Call madvise(MADV_HUGEPAGE) on [ptr, ptr + size) and exit if it fails. */
+static void thp_request(char *ptr, unsigned long size)
+{
+	if (madvise(ptr, size, MADV_HUGEPAGE)){
+		perror("madvise");
+		exit(-1);
+	}
+}
+/* Usage: mem_perf <nr_hugepages>. Runs each scenario over that many HPAGE_SIZE pages and prints the counters. */
+int main(int argc, char *argv[])
+{
+	unsigned long size;
+	char *ptr, *htlb;
+
+	if (argc < 2) {
+		fprintf(stderr, "Usage: mem_perf <nr_hugepages>\n");
+		exit(-1);
+	}
+	size = strtoul(argv[1], NULL, 0) * HPAGE_SIZE;	/* int math would overflow from 128 pages */
+	setup_events();
+	open_events();
+
+	printf("HugeTLB allocation::::::::\n");
+	htlb = mmap(NULL, size, PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_ANONYMOUS | MAP_NORESERVE | MAP_HUGETLB, -1, 0);
+	if (htlb == MAP_FAILED) {	/* mmap() signals failure with MAP_FAILED, not NULL */
+		perror("mmap");
+		exit(-1);
+	}
+
+	prepare_events();
+	memset(htlb, 0, size);
+	display_events();
+
+	printf("THP allocation::::::::\n");
+	ptr = mmap((void *) ADDR_INPUT, size, PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_ANONYMOUS | MAP_NORESERVE, -1, 0);
+	if (ptr != (void *) ADDR_INPUT) {
+		perror("mmap");
+		exit(-1);
+	}
+
+	thp_request(ptr, size);
+	prepare_events();
+	memset(ptr, 0, size);
+	display_events();
+
+	printf("SUBPAGE protection::::\n");
+	subpage_prot_change(ptr, size);
+	prepare_events();
+	memset(ptr, 0, size);
+	display_events();
+
+	printf("PFN flush::::::::::::\n");
+	dont_need_request(ptr, size);
+	prepare_events();
+	memset(ptr, 0, size);
+	display_events();
+
+	munmap(ptr, size);
+	munmap(htlb, size);
+	close_events();
+	return 0;
+}
diff --git a/tools/testing/selftests/powerpc/mm/run_mem_perf b/tools/testing/selftests/powerpc/mm/run_mem_perf
new file mode 100755
index 0000000..ee510f5
--- /dev/null
+++ b/tools/testing/selftests/powerpc/mm/run_mem_perf
@@ -0,0 +1,7 @@
+#!/bin/sh
+# Reserve huge pages for the test, run it, then put the previous setting back.
+
+saved=$(sysctl -n vm.nr_hugepages)
+sysctl vm.nr_hugepages=10
+./mem_perf 1
+sysctl vm.nr_hugepages="$saved"
-- 
2.1.0



More information about the Linuxppc-dev mailing list