KVM: selftests: Rename perf_test_util.[ch] to memstress.[ch]
authorDavid Matlack <dmatlack@google.com>
Wed, 12 Oct 2022 16:57:27 +0000 (09:57 -0700)
committerSean Christopherson <seanjc@google.com>
Wed, 16 Nov 2022 18:57:34 +0000 (10:57 -0800)
Rename the perf_test_util.[ch] files to memstress.[ch]. Symbols are
renamed in the following commit to reduce the amount of churn here in
hopes of playing nice with git's file rename detection.

The name "memstress" was chosen to better describe the functionality
provided by this library, which is to create and run a VM that
reads/writes to guest memory on all vCPUs in parallel.

"memstress" also contains the same number of characters as "perf_test",
making it a drop-in replacement in symbols, e.g. function names, without
impacting line lengths. Also the lack of underscore between "mem" and
"stress" makes it clear "memstress" is a noun.

Signed-off-by: David Matlack <dmatlack@google.com>
Reviewed-by: Sean Christopherson <seanjc@google.com>
Link: https://lore.kernel.org/r/20221012165729.3505266-2-dmatlack@google.com
Signed-off-by: Sean Christopherson <seanjc@google.com>
tools/testing/selftests/kvm/Makefile
tools/testing/selftests/kvm/access_tracking_perf_test.c
tools/testing/selftests/kvm/demand_paging_test.c
tools/testing/selftests/kvm/dirty_log_perf_test.c
tools/testing/selftests/kvm/include/memstress.h [new file with mode: 0644]
tools/testing/selftests/kvm/include/perf_test_util.h [deleted file]
tools/testing/selftests/kvm/lib/memstress.c [new file with mode: 0644]
tools/testing/selftests/kvm/lib/perf_test_util.c [deleted file]
tools/testing/selftests/kvm/lib/x86_64/memstress.c [new file with mode: 0644]
tools/testing/selftests/kvm/lib/x86_64/perf_test_util.c [deleted file]
tools/testing/selftests/kvm/memslot_modification_stress_test.c

index 0172eb6cb6eee228cd2b3bea864abdb561f4346c..a00253b79040b3a0e038bff44e7df642a89ad369 100644 (file)
@@ -43,7 +43,7 @@ LIBKVM += lib/elf.c
 LIBKVM += lib/guest_modes.c
 LIBKVM += lib/io.c
 LIBKVM += lib/kvm_util.c
-LIBKVM += lib/perf_test_util.c
+LIBKVM += lib/memstress.c
 LIBKVM += lib/rbtree.c
 LIBKVM += lib/sparsebit.c
 LIBKVM += lib/test_util.c
@@ -52,7 +52,7 @@ LIBKVM_STRING += lib/string_override.c
 
 LIBKVM_x86_64 += lib/x86_64/apic.c
 LIBKVM_x86_64 += lib/x86_64/handlers.S
-LIBKVM_x86_64 += lib/x86_64/perf_test_util.c
+LIBKVM_x86_64 += lib/x86_64/memstress.c
 LIBKVM_x86_64 += lib/x86_64/processor.c
 LIBKVM_x86_64 += lib/x86_64/svm.c
 LIBKVM_x86_64 += lib/x86_64/ucall.c
index c0cdf07de1471c7e50c3fc605c72a6a79fb5f937..534d18cc4a6af99acefbc415f0a77f4a33ef0c1e 100644 (file)
@@ -44,7 +44,7 @@
 
 #include "kvm_util.h"
 #include "test_util.h"
-#include "perf_test_util.h"
+#include "memstress.h"
 #include "guest_modes.h"
 
 /* Global variable used to synchronize all of the vCPU threads. */
index 0c98181fa24894c13228278c7dd7641ece0fe1d6..37501e83d1d8764ad62960d81c0766cf1d1ceb73 100644 (file)
@@ -20,7 +20,7 @@
 
 #include "kvm_util.h"
 #include "test_util.h"
-#include "perf_test_util.h"
+#include "memstress.h"
 #include "guest_modes.h"
 
 #ifdef __NR_userfaultfd
index 47cbda3580fd6d161d519682372e917fe299de01..d2bac493da5dda698a4a9b6a75c6ef36bcab9508 100644 (file)
@@ -16,7 +16,7 @@
 
 #include "kvm_util.h"
 #include "test_util.h"
-#include "perf_test_util.h"
+#include "memstress.h"
 #include "guest_modes.h"
 
 #ifdef __aarch64__
diff --git a/tools/testing/selftests/kvm/include/memstress.h b/tools/testing/selftests/kvm/include/memstress.h
new file mode 100644 (file)
index 0000000..64a523e
--- /dev/null
@@ -0,0 +1,72 @@
+// SPDX-License-Identifier: GPL-2.0
+/*
+ * tools/testing/selftests/kvm/include/memstress.h
+ *
+ * Copyright (C) 2020, Google LLC.
+ */
+
+#ifndef SELFTEST_KVM_MEMSTRESS_H
+#define SELFTEST_KVM_MEMSTRESS_H
+
+#include <pthread.h>
+
+#include "kvm_util.h"
+
+/* Default guest test virtual memory offset */
+#define DEFAULT_GUEST_TEST_MEM         0xc0000000
+
+#define DEFAULT_PER_VCPU_MEM_SIZE      (1 << 30) /* 1G */
+
+#define PERF_TEST_MEM_SLOT_INDEX       1
+
+struct perf_test_vcpu_args {
+       uint64_t gpa;
+       uint64_t gva;
+       uint64_t pages;
+
+       /* Only used by the host userspace part of the vCPU thread */
+       struct kvm_vcpu *vcpu;
+       int vcpu_idx;
+};
+
+struct perf_test_args {
+       struct kvm_vm *vm;
+       /* The starting address and size of the guest test region. */
+       uint64_t gpa;
+       uint64_t size;
+       uint64_t guest_page_size;
+       uint32_t random_seed;
+       uint32_t write_percent;
+
+       /* Run vCPUs in L2 instead of L1, if the architecture supports it. */
+       bool nested;
+       /* Randomize which pages are accessed by the guest. */
+       bool random_access;
+       /* True if all vCPUs are pinned to pCPUs */
+       bool pin_vcpus;
+       /* The vCPU=>pCPU pinning map. Only valid if pin_vcpus is true. */
+       uint32_t vcpu_to_pcpu[KVM_MAX_VCPUS];
+
+       struct perf_test_vcpu_args vcpu_args[KVM_MAX_VCPUS];
+};
+
+extern struct perf_test_args perf_test_args;
+
+struct kvm_vm *perf_test_create_vm(enum vm_guest_mode mode, int nr_vcpus,
+                                  uint64_t vcpu_memory_bytes, int slots,
+                                  enum vm_mem_backing_src_type backing_src,
+                                  bool partition_vcpu_memory_access);
+void perf_test_destroy_vm(struct kvm_vm *vm);
+
+void perf_test_set_write_percent(struct kvm_vm *vm, uint32_t write_percent);
+void perf_test_set_random_seed(struct kvm_vm *vm, uint32_t random_seed);
+void perf_test_set_random_access(struct kvm_vm *vm, bool random_access);
+
+void perf_test_start_vcpu_threads(int vcpus, void (*vcpu_fn)(struct perf_test_vcpu_args *));
+void perf_test_join_vcpu_threads(int vcpus);
+void perf_test_guest_code(uint32_t vcpu_id);
+
+uint64_t perf_test_nested_pages(int nr_vcpus);
+void perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu *vcpus[]);
+
+#endif /* SELFTEST_KVM_MEMSTRESS_H */
diff --git a/tools/testing/selftests/kvm/include/perf_test_util.h b/tools/testing/selftests/kvm/include/perf_test_util.h
deleted file mode 100644 (file)
index 75ca679..0000000
+++ /dev/null
@@ -1,72 +0,0 @@
-// SPDX-License-Identifier: GPL-2.0
-/*
- * tools/testing/selftests/kvm/include/perf_test_util.h
- *
- * Copyright (C) 2020, Google LLC.
- */
-
-#ifndef SELFTEST_KVM_PERF_TEST_UTIL_H
-#define SELFTEST_KVM_PERF_TEST_UTIL_H
-
-#include <pthread.h>
-
-#include "kvm_util.h"
-
-/* Default guest test virtual memory offset */
-#define DEFAULT_GUEST_TEST_MEM         0xc0000000
-
-#define DEFAULT_PER_VCPU_MEM_SIZE      (1 << 30) /* 1G */
-
-#define PERF_TEST_MEM_SLOT_INDEX       1
-
-struct perf_test_vcpu_args {
-       uint64_t gpa;
-       uint64_t gva;
-       uint64_t pages;
-
-       /* Only used by the host userspace part of the vCPU thread */
-       struct kvm_vcpu *vcpu;
-       int vcpu_idx;
-};
-
-struct perf_test_args {
-       struct kvm_vm *vm;
-       /* The starting address and size of the guest test region. */
-       uint64_t gpa;
-       uint64_t size;
-       uint64_t guest_page_size;
-       uint32_t random_seed;
-       uint32_t write_percent;
-
-       /* Run vCPUs in L2 instead of L1, if the architecture supports it. */
-       bool nested;
-       /* Randomize which pages are accessed by the guest. */
-       bool random_access;
-       /* True if all vCPUs are pinned to pCPUs */
-       bool pin_vcpus;
-       /* The vCPU=>pCPU pinning map. Only valid if pin_vcpus is true. */
-       uint32_t vcpu_to_pcpu[KVM_MAX_VCPUS];
-
-       struct perf_test_vcpu_args vcpu_args[KVM_MAX_VCPUS];
-};
-
-extern struct perf_test_args perf_test_args;
-
-struct kvm_vm *perf_test_create_vm(enum vm_guest_mode mode, int nr_vcpus,
-                                  uint64_t vcpu_memory_bytes, int slots,
-                                  enum vm_mem_backing_src_type backing_src,
-                                  bool partition_vcpu_memory_access);
-void perf_test_destroy_vm(struct kvm_vm *vm);
-
-void perf_test_set_write_percent(struct kvm_vm *vm, uint32_t write_percent);
-void perf_test_set_random_seed(struct kvm_vm *vm, uint32_t random_seed);
-void perf_test_set_random_access(struct kvm_vm *vm, bool random_access);
-
-void perf_test_start_vcpu_threads(int vcpus, void (*vcpu_fn)(struct perf_test_vcpu_args *));
-void perf_test_join_vcpu_threads(int vcpus);
-void perf_test_guest_code(uint32_t vcpu_id);
-
-uint64_t perf_test_nested_pages(int nr_vcpus);
-void perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu *vcpus[]);
-
-#endif /* SELFTEST_KVM_PERF_TEST_UTIL_H */
diff --git a/tools/testing/selftests/kvm/lib/memstress.c b/tools/testing/selftests/kvm/lib/memstress.c
new file mode 100644 (file)
index 0000000..72f88e5
--- /dev/null
@@ -0,0 +1,322 @@
+// SPDX-License-Identifier: GPL-2.0
+/*
+ * Copyright (C) 2020, Google LLC.
+ */
+#define _GNU_SOURCE
+
+#include <inttypes.h>
+
+#include "kvm_util.h"
+#include "memstress.h"
+#include "processor.h"
+
+struct perf_test_args perf_test_args;
+
+/*
+ * Guest virtual memory offset of the testing memory slot.
+ * Must not conflict with identity mapped test code.
+ */
+static uint64_t guest_test_virt_mem = DEFAULT_GUEST_TEST_MEM;
+
+struct vcpu_thread {
+       /* The index of the vCPU. */
+       int vcpu_idx;
+
+       /* The pthread backing the vCPU. */
+       pthread_t thread;
+
+       /* Set to true once the vCPU thread is up and running. */
+       bool running;
+};
+
+/* The vCPU threads involved in this test. */
+static struct vcpu_thread vcpu_threads[KVM_MAX_VCPUS];
+
+/* The function run by each vCPU thread, as provided by the test. */
+static void (*vcpu_thread_fn)(struct perf_test_vcpu_args *);
+
+/* Set to true once all vCPU threads are up and running. */
+static bool all_vcpu_threads_running;
+
+static struct kvm_vcpu *vcpus[KVM_MAX_VCPUS];
+
+/*
+ * Continuously write to the first 8 bytes of each page in the
+ * specified region.
+ */
+void perf_test_guest_code(uint32_t vcpu_idx)
+{
+       struct perf_test_args *pta = &perf_test_args;
+       struct perf_test_vcpu_args *vcpu_args = &pta->vcpu_args[vcpu_idx];
+       struct guest_random_state rand_state;
+       uint64_t gva;
+       uint64_t pages;
+       uint64_t addr;
+       uint64_t page;
+       int i;
+
+       rand_state = new_guest_random_state(pta->random_seed + vcpu_idx);
+
+       gva = vcpu_args->gva;
+       pages = vcpu_args->pages;
+
+       /* Make sure vCPU args data structure is not corrupt. */
+       GUEST_ASSERT(vcpu_args->vcpu_idx == vcpu_idx);
+
+       while (true) {
+               for (i = 0; i < pages; i++) {
+                       if (pta->random_access)
+                               page = guest_random_u32(&rand_state) % pages;
+                       else
+                               page = i;
+
+                       addr = gva + (page * pta->guest_page_size);
+
+                       if (guest_random_u32(&rand_state) % 100 < pta->write_percent)
+                               *(uint64_t *)addr = 0x0123456789ABCDEF;
+                       else
+                               READ_ONCE(*(uint64_t *)addr);
+               }
+
+               GUEST_SYNC(1);
+       }
+}
+
+void perf_test_setup_vcpus(struct kvm_vm *vm, int nr_vcpus,
+                          struct kvm_vcpu *vcpus[],
+                          uint64_t vcpu_memory_bytes,
+                          bool partition_vcpu_memory_access)
+{
+       struct perf_test_args *pta = &perf_test_args;
+       struct perf_test_vcpu_args *vcpu_args;
+       int i;
+
+       for (i = 0; i < nr_vcpus; i++) {
+               vcpu_args = &pta->vcpu_args[i];
+
+               vcpu_args->vcpu = vcpus[i];
+               vcpu_args->vcpu_idx = i;
+
+               if (partition_vcpu_memory_access) {
+                       vcpu_args->gva = guest_test_virt_mem +
+                                        (i * vcpu_memory_bytes);
+                       vcpu_args->pages = vcpu_memory_bytes /
+                                          pta->guest_page_size;
+                       vcpu_args->gpa = pta->gpa + (i * vcpu_memory_bytes);
+               } else {
+                       vcpu_args->gva = guest_test_virt_mem;
+                       vcpu_args->pages = (nr_vcpus * vcpu_memory_bytes) /
+                                          pta->guest_page_size;
+                       vcpu_args->gpa = pta->gpa;
+               }
+
+               vcpu_args_set(vcpus[i], 1, i);
+
+               pr_debug("Added VCPU %d with test mem gpa [%lx, %lx)\n",
+                        i, vcpu_args->gpa, vcpu_args->gpa +
+                        (vcpu_args->pages * pta->guest_page_size));
+       }
+}
+
+struct kvm_vm *perf_test_create_vm(enum vm_guest_mode mode, int nr_vcpus,
+                                  uint64_t vcpu_memory_bytes, int slots,
+                                  enum vm_mem_backing_src_type backing_src,
+                                  bool partition_vcpu_memory_access)
+{
+       struct perf_test_args *pta = &perf_test_args;
+       struct kvm_vm *vm;
+       uint64_t guest_num_pages, slot0_pages = 0;
+       uint64_t backing_src_pagesz = get_backing_src_pagesz(backing_src);
+       uint64_t region_end_gfn;
+       int i;
+
+       pr_info("Testing guest mode: %s\n", vm_guest_mode_string(mode));
+
+       /* By default vCPUs will write to memory. */
+       pta->write_percent = 100;
+
+       /*
+        * Snapshot the non-huge page size.  This is used by the guest code to
+        * access/dirty pages at the logging granularity.
+        */
+       pta->guest_page_size = vm_guest_mode_params[mode].page_size;
+
+       guest_num_pages = vm_adjust_num_guest_pages(mode,
+                               (nr_vcpus * vcpu_memory_bytes) / pta->guest_page_size);
+
+       TEST_ASSERT(vcpu_memory_bytes % getpagesize() == 0,
+                   "Guest memory size is not host page size aligned.");
+       TEST_ASSERT(vcpu_memory_bytes % pta->guest_page_size == 0,
+                   "Guest memory size is not guest page size aligned.");
+       TEST_ASSERT(guest_num_pages % slots == 0,
+                   "Guest memory cannot be evenly divided into %d slots.",
+                   slots);
+
+       /*
+        * If using nested, allocate extra pages for the nested page tables and
+        * in-memory data structures.
+        */
+       if (pta->nested)
+               slot0_pages += perf_test_nested_pages(nr_vcpus);
+
+       /*
+        * Pass guest_num_pages to populate the page tables for test memory.
+        * The memory is also added to memslot 0, but that's a benign side
+        * effect as KVM allows aliasing HVAs in meslots.
+        */
+       vm = __vm_create_with_vcpus(mode, nr_vcpus, slot0_pages + guest_num_pages,
+                                   perf_test_guest_code, vcpus);
+
+       pta->vm = vm;
+
+       /* Put the test region at the top guest physical memory. */
+       region_end_gfn = vm->max_gfn + 1;
+
+#ifdef __x86_64__
+       /*
+        * When running vCPUs in L2, restrict the test region to 48 bits to
+        * avoid needing 5-level page tables to identity map L2.
+        */
+       if (pta->nested)
+               region_end_gfn = min(region_end_gfn, (1UL << 48) / pta->guest_page_size);
+#endif
+       /*
+        * If there should be more memory in the guest test region than there
+        * can be pages in the guest, it will definitely cause problems.
+        */
+       TEST_ASSERT(guest_num_pages < region_end_gfn,
+                   "Requested more guest memory than address space allows.\n"
+                   "    guest pages: %" PRIx64 " max gfn: %" PRIx64
+                   " nr_vcpus: %d wss: %" PRIx64 "]\n",
+                   guest_num_pages, region_end_gfn - 1, nr_vcpus, vcpu_memory_bytes);
+
+       pta->gpa = (region_end_gfn - guest_num_pages - 1) * pta->guest_page_size;
+       pta->gpa = align_down(pta->gpa, backing_src_pagesz);
+#ifdef __s390x__
+       /* Align to 1M (segment size) */
+       pta->gpa = align_down(pta->gpa, 1 << 20);
+#endif
+       pta->size = guest_num_pages * pta->guest_page_size;
+       pr_info("guest physical test memory: [0x%lx, 0x%lx)\n",
+               pta->gpa, pta->gpa + pta->size);
+
+       /* Add extra memory slots for testing */
+       for (i = 0; i < slots; i++) {
+               uint64_t region_pages = guest_num_pages / slots;
+               vm_paddr_t region_start = pta->gpa + region_pages * pta->guest_page_size * i;
+
+               vm_userspace_mem_region_add(vm, backing_src, region_start,
+                                           PERF_TEST_MEM_SLOT_INDEX + i,
+                                           region_pages, 0);
+       }
+
+       /* Do mapping for the demand paging memory slot */
+       virt_map(vm, guest_test_virt_mem, pta->gpa, guest_num_pages);
+
+       perf_test_setup_vcpus(vm, nr_vcpus, vcpus, vcpu_memory_bytes,
+                             partition_vcpu_memory_access);
+
+       if (pta->nested) {
+               pr_info("Configuring vCPUs to run in L2 (nested).\n");
+               perf_test_setup_nested(vm, nr_vcpus, vcpus);
+       }
+
+       ucall_init(vm, NULL);
+
+       /* Export the shared variables to the guest. */
+       sync_global_to_guest(vm, perf_test_args);
+
+       return vm;
+}
+
+void perf_test_destroy_vm(struct kvm_vm *vm)
+{
+       ucall_uninit(vm);
+       kvm_vm_free(vm);
+}
+
+void perf_test_set_write_percent(struct kvm_vm *vm, uint32_t write_percent)
+{
+       perf_test_args.write_percent = write_percent;
+       sync_global_to_guest(vm, perf_test_args.write_percent);
+}
+
+void perf_test_set_random_seed(struct kvm_vm *vm, uint32_t random_seed)
+{
+       perf_test_args.random_seed = random_seed;
+       sync_global_to_guest(vm, perf_test_args.random_seed);
+}
+
+void perf_test_set_random_access(struct kvm_vm *vm, bool random_access)
+{
+       perf_test_args.random_access = random_access;
+       sync_global_to_guest(vm, perf_test_args.random_access);
+}
+
+uint64_t __weak perf_test_nested_pages(int nr_vcpus)
+{
+       return 0;
+}
+
+void __weak perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu **vcpus)
+{
+       pr_info("%s() not support on this architecture, skipping.\n", __func__);
+       exit(KSFT_SKIP);
+}
+
+static void *vcpu_thread_main(void *data)
+{
+       struct vcpu_thread *vcpu = data;
+       int vcpu_idx = vcpu->vcpu_idx;
+
+       if (perf_test_args.pin_vcpus)
+               kvm_pin_this_task_to_pcpu(perf_test_args.vcpu_to_pcpu[vcpu_idx]);
+
+       WRITE_ONCE(vcpu->running, true);
+
+       /*
+        * Wait for all vCPU threads to be up and running before calling the test-
+        * provided vCPU thread function. This prevents thread creation (which
+        * requires taking the mmap_sem in write mode) from interfering with the
+        * guest faulting in its memory.
+        */
+       while (!READ_ONCE(all_vcpu_threads_running))
+               ;
+
+       vcpu_thread_fn(&perf_test_args.vcpu_args[vcpu_idx]);
+
+       return NULL;
+}
+
+void perf_test_start_vcpu_threads(int nr_vcpus,
+                                 void (*vcpu_fn)(struct perf_test_vcpu_args *))
+{
+       int i;
+
+       vcpu_thread_fn = vcpu_fn;
+       WRITE_ONCE(all_vcpu_threads_running, false);
+
+       for (i = 0; i < nr_vcpus; i++) {
+               struct vcpu_thread *vcpu = &vcpu_threads[i];
+
+               vcpu->vcpu_idx = i;
+               WRITE_ONCE(vcpu->running, false);
+
+               pthread_create(&vcpu->thread, NULL, vcpu_thread_main, vcpu);
+       }
+
+       for (i = 0; i < nr_vcpus; i++) {
+               while (!READ_ONCE(vcpu_threads[i].running))
+                       ;
+       }
+
+       WRITE_ONCE(all_vcpu_threads_running, true);
+}
+
+void perf_test_join_vcpu_threads(int nr_vcpus)
+{
+       int i;
+
+       for (i = 0; i < nr_vcpus; i++)
+               pthread_join(vcpu_threads[i].thread, NULL);
+}
diff --git a/tools/testing/selftests/kvm/lib/perf_test_util.c b/tools/testing/selftests/kvm/lib/perf_test_util.c
deleted file mode 100644 (file)
index 3a9a3ea..0000000
+++ /dev/null
@@ -1,322 +0,0 @@
-// SPDX-License-Identifier: GPL-2.0
-/*
- * Copyright (C) 2020, Google LLC.
- */
-#define _GNU_SOURCE
-
-#include <inttypes.h>
-
-#include "kvm_util.h"
-#include "perf_test_util.h"
-#include "processor.h"
-
-struct perf_test_args perf_test_args;
-
-/*
- * Guest virtual memory offset of the testing memory slot.
- * Must not conflict with identity mapped test code.
- */
-static uint64_t guest_test_virt_mem = DEFAULT_GUEST_TEST_MEM;
-
-struct vcpu_thread {
-       /* The index of the vCPU. */
-       int vcpu_idx;
-
-       /* The pthread backing the vCPU. */
-       pthread_t thread;
-
-       /* Set to true once the vCPU thread is up and running. */
-       bool running;
-};
-
-/* The vCPU threads involved in this test. */
-static struct vcpu_thread vcpu_threads[KVM_MAX_VCPUS];
-
-/* The function run by each vCPU thread, as provided by the test. */
-static void (*vcpu_thread_fn)(struct perf_test_vcpu_args *);
-
-/* Set to true once all vCPU threads are up and running. */
-static bool all_vcpu_threads_running;
-
-static struct kvm_vcpu *vcpus[KVM_MAX_VCPUS];
-
-/*
- * Continuously write to the first 8 bytes of each page in the
- * specified region.
- */
-void perf_test_guest_code(uint32_t vcpu_idx)
-{
-       struct perf_test_args *pta = &perf_test_args;
-       struct perf_test_vcpu_args *vcpu_args = &pta->vcpu_args[vcpu_idx];
-       struct guest_random_state rand_state;
-       uint64_t gva;
-       uint64_t pages;
-       uint64_t addr;
-       uint64_t page;
-       int i;
-
-       rand_state = new_guest_random_state(pta->random_seed + vcpu_idx);
-
-       gva = vcpu_args->gva;
-       pages = vcpu_args->pages;
-
-       /* Make sure vCPU args data structure is not corrupt. */
-       GUEST_ASSERT(vcpu_args->vcpu_idx == vcpu_idx);
-
-       while (true) {
-               for (i = 0; i < pages; i++) {
-                       if (pta->random_access)
-                               page = guest_random_u32(&rand_state) % pages;
-                       else
-                               page = i;
-
-                       addr = gva + (page * pta->guest_page_size);
-
-                       if (guest_random_u32(&rand_state) % 100 < pta->write_percent)
-                               *(uint64_t *)addr = 0x0123456789ABCDEF;
-                       else
-                               READ_ONCE(*(uint64_t *)addr);
-               }
-
-               GUEST_SYNC(1);
-       }
-}
-
-void perf_test_setup_vcpus(struct kvm_vm *vm, int nr_vcpus,
-                          struct kvm_vcpu *vcpus[],
-                          uint64_t vcpu_memory_bytes,
-                          bool partition_vcpu_memory_access)
-{
-       struct perf_test_args *pta = &perf_test_args;
-       struct perf_test_vcpu_args *vcpu_args;
-       int i;
-
-       for (i = 0; i < nr_vcpus; i++) {
-               vcpu_args = &pta->vcpu_args[i];
-
-               vcpu_args->vcpu = vcpus[i];
-               vcpu_args->vcpu_idx = i;
-
-               if (partition_vcpu_memory_access) {
-                       vcpu_args->gva = guest_test_virt_mem +
-                                        (i * vcpu_memory_bytes);
-                       vcpu_args->pages = vcpu_memory_bytes /
-                                          pta->guest_page_size;
-                       vcpu_args->gpa = pta->gpa + (i * vcpu_memory_bytes);
-               } else {
-                       vcpu_args->gva = guest_test_virt_mem;
-                       vcpu_args->pages = (nr_vcpus * vcpu_memory_bytes) /
-                                          pta->guest_page_size;
-                       vcpu_args->gpa = pta->gpa;
-               }
-
-               vcpu_args_set(vcpus[i], 1, i);
-
-               pr_debug("Added VCPU %d with test mem gpa [%lx, %lx)\n",
-                        i, vcpu_args->gpa, vcpu_args->gpa +
-                        (vcpu_args->pages * pta->guest_page_size));
-       }
-}
-
-struct kvm_vm *perf_test_create_vm(enum vm_guest_mode mode, int nr_vcpus,
-                                  uint64_t vcpu_memory_bytes, int slots,
-                                  enum vm_mem_backing_src_type backing_src,
-                                  bool partition_vcpu_memory_access)
-{
-       struct perf_test_args *pta = &perf_test_args;
-       struct kvm_vm *vm;
-       uint64_t guest_num_pages, slot0_pages = 0;
-       uint64_t backing_src_pagesz = get_backing_src_pagesz(backing_src);
-       uint64_t region_end_gfn;
-       int i;
-
-       pr_info("Testing guest mode: %s\n", vm_guest_mode_string(mode));
-
-       /* By default vCPUs will write to memory. */
-       pta->write_percent = 100;
-
-       /*
-        * Snapshot the non-huge page size.  This is used by the guest code to
-        * access/dirty pages at the logging granularity.
-        */
-       pta->guest_page_size = vm_guest_mode_params[mode].page_size;
-
-       guest_num_pages = vm_adjust_num_guest_pages(mode,
-                               (nr_vcpus * vcpu_memory_bytes) / pta->guest_page_size);
-
-       TEST_ASSERT(vcpu_memory_bytes % getpagesize() == 0,
-                   "Guest memory size is not host page size aligned.");
-       TEST_ASSERT(vcpu_memory_bytes % pta->guest_page_size == 0,
-                   "Guest memory size is not guest page size aligned.");
-       TEST_ASSERT(guest_num_pages % slots == 0,
-                   "Guest memory cannot be evenly divided into %d slots.",
-                   slots);
-
-       /*
-        * If using nested, allocate extra pages for the nested page tables and
-        * in-memory data structures.
-        */
-       if (pta->nested)
-               slot0_pages += perf_test_nested_pages(nr_vcpus);
-
-       /*
-        * Pass guest_num_pages to populate the page tables for test memory.
-        * The memory is also added to memslot 0, but that's a benign side
-        * effect as KVM allows aliasing HVAs in meslots.
-        */
-       vm = __vm_create_with_vcpus(mode, nr_vcpus, slot0_pages + guest_num_pages,
-                                   perf_test_guest_code, vcpus);
-
-       pta->vm = vm;
-
-       /* Put the test region at the top guest physical memory. */
-       region_end_gfn = vm->max_gfn + 1;
-
-#ifdef __x86_64__
-       /*
-        * When running vCPUs in L2, restrict the test region to 48 bits to
-        * avoid needing 5-level page tables to identity map L2.
-        */
-       if (pta->nested)
-               region_end_gfn = min(region_end_gfn, (1UL << 48) / pta->guest_page_size);
-#endif
-       /*
-        * If there should be more memory in the guest test region than there
-        * can be pages in the guest, it will definitely cause problems.
-        */
-       TEST_ASSERT(guest_num_pages < region_end_gfn,
-                   "Requested more guest memory than address space allows.\n"
-                   "    guest pages: %" PRIx64 " max gfn: %" PRIx64
-                   " nr_vcpus: %d wss: %" PRIx64 "]\n",
-                   guest_num_pages, region_end_gfn - 1, nr_vcpus, vcpu_memory_bytes);
-
-       pta->gpa = (region_end_gfn - guest_num_pages - 1) * pta->guest_page_size;
-       pta->gpa = align_down(pta->gpa, backing_src_pagesz);
-#ifdef __s390x__
-       /* Align to 1M (segment size) */
-       pta->gpa = align_down(pta->gpa, 1 << 20);
-#endif
-       pta->size = guest_num_pages * pta->guest_page_size;
-       pr_info("guest physical test memory: [0x%lx, 0x%lx)\n",
-               pta->gpa, pta->gpa + pta->size);
-
-       /* Add extra memory slots for testing */
-       for (i = 0; i < slots; i++) {
-               uint64_t region_pages = guest_num_pages / slots;
-               vm_paddr_t region_start = pta->gpa + region_pages * pta->guest_page_size * i;
-
-               vm_userspace_mem_region_add(vm, backing_src, region_start,
-                                           PERF_TEST_MEM_SLOT_INDEX + i,
-                                           region_pages, 0);
-       }
-
-       /* Do mapping for the demand paging memory slot */
-       virt_map(vm, guest_test_virt_mem, pta->gpa, guest_num_pages);
-
-       perf_test_setup_vcpus(vm, nr_vcpus, vcpus, vcpu_memory_bytes,
-                             partition_vcpu_memory_access);
-
-       if (pta->nested) {
-               pr_info("Configuring vCPUs to run in L2 (nested).\n");
-               perf_test_setup_nested(vm, nr_vcpus, vcpus);
-       }
-
-       ucall_init(vm, NULL);
-
-       /* Export the shared variables to the guest. */
-       sync_global_to_guest(vm, perf_test_args);
-
-       return vm;
-}
-
-void perf_test_destroy_vm(struct kvm_vm *vm)
-{
-       ucall_uninit(vm);
-       kvm_vm_free(vm);
-}
-
-void perf_test_set_write_percent(struct kvm_vm *vm, uint32_t write_percent)
-{
-       perf_test_args.write_percent = write_percent;
-       sync_global_to_guest(vm, perf_test_args.write_percent);
-}
-
-void perf_test_set_random_seed(struct kvm_vm *vm, uint32_t random_seed)
-{
-       perf_test_args.random_seed = random_seed;
-       sync_global_to_guest(vm, perf_test_args.random_seed);
-}
-
-void perf_test_set_random_access(struct kvm_vm *vm, bool random_access)
-{
-       perf_test_args.random_access = random_access;
-       sync_global_to_guest(vm, perf_test_args.random_access);
-}
-
-uint64_t __weak perf_test_nested_pages(int nr_vcpus)
-{
-       return 0;
-}
-
-void __weak perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu **vcpus)
-{
-       pr_info("%s() not support on this architecture, skipping.\n", __func__);
-       exit(KSFT_SKIP);
-}
-
-static void *vcpu_thread_main(void *data)
-{
-       struct vcpu_thread *vcpu = data;
-       int vcpu_idx = vcpu->vcpu_idx;
-
-       if (perf_test_args.pin_vcpus)
-               kvm_pin_this_task_to_pcpu(perf_test_args.vcpu_to_pcpu[vcpu_idx]);
-
-       WRITE_ONCE(vcpu->running, true);
-
-       /*
-        * Wait for all vCPU threads to be up and running before calling the test-
-        * provided vCPU thread function. This prevents thread creation (which
-        * requires taking the mmap_sem in write mode) from interfering with the
-        * guest faulting in its memory.
-        */
-       while (!READ_ONCE(all_vcpu_threads_running))
-               ;
-
-       vcpu_thread_fn(&perf_test_args.vcpu_args[vcpu_idx]);
-
-       return NULL;
-}
-
-void perf_test_start_vcpu_threads(int nr_vcpus,
-                                 void (*vcpu_fn)(struct perf_test_vcpu_args *))
-{
-       int i;
-
-       vcpu_thread_fn = vcpu_fn;
-       WRITE_ONCE(all_vcpu_threads_running, false);
-
-       for (i = 0; i < nr_vcpus; i++) {
-               struct vcpu_thread *vcpu = &vcpu_threads[i];
-
-               vcpu->vcpu_idx = i;
-               WRITE_ONCE(vcpu->running, false);
-
-               pthread_create(&vcpu->thread, NULL, vcpu_thread_main, vcpu);
-       }
-
-       for (i = 0; i < nr_vcpus; i++) {
-               while (!READ_ONCE(vcpu_threads[i].running))
-                       ;
-       }
-
-       WRITE_ONCE(all_vcpu_threads_running, true);
-}
-
-void perf_test_join_vcpu_threads(int nr_vcpus)
-{
-       int i;
-
-       for (i = 0; i < nr_vcpus; i++)
-               pthread_join(vcpu_threads[i].thread, NULL);
-}
diff --git a/tools/testing/selftests/kvm/lib/x86_64/memstress.c b/tools/testing/selftests/kvm/lib/x86_64/memstress.c
new file mode 100644 (file)
index 0000000..0bb717a
--- /dev/null
@@ -0,0 +1,111 @@
+// SPDX-License-Identifier: GPL-2.0
+/*
+ * x86_64-specific extensions to memstress.c.
+ *
+ * Copyright (C) 2022, Google, Inc.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <linux/bitmap.h>
+#include <linux/bitops.h>
+
+#include "test_util.h"
+#include "kvm_util.h"
+#include "memstress.h"
+#include "processor.h"
+#include "vmx.h"
+
+void perf_test_l2_guest_code(uint64_t vcpu_id)
+{
+       perf_test_guest_code(vcpu_id);
+       vmcall();
+}
+
+extern char perf_test_l2_guest_entry[];
+__asm__(
+"perf_test_l2_guest_entry:"
+"      mov (%rsp), %rdi;"
+"      call perf_test_l2_guest_code;"
+"      ud2;"
+);
+
+static void perf_test_l1_guest_code(struct vmx_pages *vmx, uint64_t vcpu_id)
+{
+#define L2_GUEST_STACK_SIZE 64
+       unsigned long l2_guest_stack[L2_GUEST_STACK_SIZE];
+       unsigned long *rsp;
+
+       GUEST_ASSERT(vmx->vmcs_gpa);
+       GUEST_ASSERT(prepare_for_vmx_operation(vmx));
+       GUEST_ASSERT(load_vmcs(vmx));
+       GUEST_ASSERT(ept_1g_pages_supported());
+
+       rsp = &l2_guest_stack[L2_GUEST_STACK_SIZE - 1];
+       *rsp = vcpu_id;
+       prepare_vmcs(vmx, perf_test_l2_guest_entry, rsp);
+
+       GUEST_ASSERT(!vmlaunch());
+       GUEST_ASSERT(vmreadz(VM_EXIT_REASON) == EXIT_REASON_VMCALL);
+       GUEST_DONE();
+}
+
+uint64_t perf_test_nested_pages(int nr_vcpus)
+{
+       /*
+        * 513 page tables is enough to identity-map 256 TiB of L2 with 1G
+        * pages and 4-level paging, plus a few pages per-vCPU for data
+        * structures such as the VMCS.
+        */
+       return 513 + 10 * nr_vcpus;
+}
+
+void perf_test_setup_ept(struct vmx_pages *vmx, struct kvm_vm *vm)
+{
+       uint64_t start, end;
+
+       prepare_eptp(vmx, vm, 0);
+
+       /*
+        * Identity map the first 4G and the test region with 1G pages so that
+        * KVM can shadow the EPT12 with the maximum huge page size supported
+        * by the backing source.
+        */
+       nested_identity_map_1g(vmx, vm, 0, 0x100000000ULL);
+
+       start = align_down(perf_test_args.gpa, PG_SIZE_1G);
+       end = align_up(perf_test_args.gpa + perf_test_args.size, PG_SIZE_1G);
+       nested_identity_map_1g(vmx, vm, start, end - start);
+}
+
+void perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu *vcpus[])
+{
+       struct vmx_pages *vmx, *vmx0 = NULL;
+       struct kvm_regs regs;
+       vm_vaddr_t vmx_gva;
+       int vcpu_id;
+
+       TEST_REQUIRE(kvm_cpu_has(X86_FEATURE_VMX));
+
+       for (vcpu_id = 0; vcpu_id < nr_vcpus; vcpu_id++) {
+               vmx = vcpu_alloc_vmx(vm, &vmx_gva);
+
+               if (vcpu_id == 0) {
+                       perf_test_setup_ept(vmx, vm);
+                       vmx0 = vmx;
+               } else {
+                       /* Share the same EPT table across all vCPUs. */
+                       vmx->eptp = vmx0->eptp;
+                       vmx->eptp_hva = vmx0->eptp_hva;
+                       vmx->eptp_gpa = vmx0->eptp_gpa;
+               }
+
+               /*
+                * Override the vCPU to run perf_test_l1_guest_code() which will
+                * bounce it into L2 before calling perf_test_guest_code().
+                */
+               vcpu_regs_get(vcpus[vcpu_id], &regs);
+               regs.rip = (unsigned long) perf_test_l1_guest_code;
+               vcpu_regs_set(vcpus[vcpu_id], &regs);
+               vcpu_args_set(vcpus[vcpu_id], 2, vmx_gva, vcpu_id);
+       }
+}
diff --git a/tools/testing/selftests/kvm/lib/x86_64/perf_test_util.c b/tools/testing/selftests/kvm/lib/x86_64/perf_test_util.c
deleted file mode 100644 (file)
index 0f344a7..0000000
+++ /dev/null
@@ -1,111 +0,0 @@
-// SPDX-License-Identifier: GPL-2.0
-/*
- * x86_64-specific extensions to perf_test_util.c.
- *
- * Copyright (C) 2022, Google, Inc.
- */
-#include <stdio.h>
-#include <stdlib.h>
-#include <linux/bitmap.h>
-#include <linux/bitops.h>
-
-#include "test_util.h"
-#include "kvm_util.h"
-#include "perf_test_util.h"
-#include "processor.h"
-#include "vmx.h"
-
-void perf_test_l2_guest_code(uint64_t vcpu_id)
-{
-       perf_test_guest_code(vcpu_id);
-       vmcall();
-}
-
-extern char perf_test_l2_guest_entry[];
-__asm__(
-"perf_test_l2_guest_entry:"
-"      mov (%rsp), %rdi;"
-"      call perf_test_l2_guest_code;"
-"      ud2;"
-);
-
-static void perf_test_l1_guest_code(struct vmx_pages *vmx, uint64_t vcpu_id)
-{
-#define L2_GUEST_STACK_SIZE 64
-       unsigned long l2_guest_stack[L2_GUEST_STACK_SIZE];
-       unsigned long *rsp;
-
-       GUEST_ASSERT(vmx->vmcs_gpa);
-       GUEST_ASSERT(prepare_for_vmx_operation(vmx));
-       GUEST_ASSERT(load_vmcs(vmx));
-       GUEST_ASSERT(ept_1g_pages_supported());
-
-       rsp = &l2_guest_stack[L2_GUEST_STACK_SIZE - 1];
-       *rsp = vcpu_id;
-       prepare_vmcs(vmx, perf_test_l2_guest_entry, rsp);
-
-       GUEST_ASSERT(!vmlaunch());
-       GUEST_ASSERT(vmreadz(VM_EXIT_REASON) == EXIT_REASON_VMCALL);
-       GUEST_DONE();
-}
-
-uint64_t perf_test_nested_pages(int nr_vcpus)
-{
-       /*
-        * 513 page tables is enough to identity-map 256 TiB of L2 with 1G
-        * pages and 4-level paging, plus a few pages per-vCPU for data
-        * structures such as the VMCS.
-        */
-       return 513 + 10 * nr_vcpus;
-}
-
-void perf_test_setup_ept(struct vmx_pages *vmx, struct kvm_vm *vm)
-{
-       uint64_t start, end;
-
-       prepare_eptp(vmx, vm, 0);
-
-       /*
-        * Identity map the first 4G and the test region with 1G pages so that
-        * KVM can shadow the EPT12 with the maximum huge page size supported
-        * by the backing source.
-        */
-       nested_identity_map_1g(vmx, vm, 0, 0x100000000ULL);
-
-       start = align_down(perf_test_args.gpa, PG_SIZE_1G);
-       end = align_up(perf_test_args.gpa + perf_test_args.size, PG_SIZE_1G);
-       nested_identity_map_1g(vmx, vm, start, end - start);
-}
-
-void perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu *vcpus[])
-{
-       struct vmx_pages *vmx, *vmx0 = NULL;
-       struct kvm_regs regs;
-       vm_vaddr_t vmx_gva;
-       int vcpu_id;
-
-       TEST_REQUIRE(kvm_cpu_has(X86_FEATURE_VMX));
-
-       for (vcpu_id = 0; vcpu_id < nr_vcpus; vcpu_id++) {
-               vmx = vcpu_alloc_vmx(vm, &vmx_gva);
-
-               if (vcpu_id == 0) {
-                       perf_test_setup_ept(vmx, vm);
-                       vmx0 = vmx;
-               } else {
-                       /* Share the same EPT table across all vCPUs. */
-                       vmx->eptp = vmx0->eptp;
-                       vmx->eptp_hva = vmx0->eptp_hva;
-                       vmx->eptp_gpa = vmx0->eptp_gpa;
-               }
-
-               /*
-                * Override the vCPU to run perf_test_l1_guest_code() which will
-                * bounce it into L2 before calling perf_test_guest_code().
-                */
-               vcpu_regs_get(vcpus[vcpu_id], &regs);
-               regs.rip = (unsigned long) perf_test_l1_guest_code;
-               vcpu_regs_set(vcpus[vcpu_id], &regs);
-               vcpu_args_set(vcpus[vcpu_id], 2, vmx_gva, vcpu_id);
-       }
-}
index 4bdfc910ba4d3f87d51d76b97990f68da19f4847..0490bd4606e50eface677b4518d57e53b4717277 100644 (file)
@@ -21,7 +21,7 @@
 #include <linux/bitops.h>
 #include <linux/userfaultfd.h>
 
-#include "perf_test_util.h"
+#include "memstress.h"
 #include "processor.h"
 #include "test_util.h"
 #include "guest_modes.h"
@@ -72,7 +72,7 @@ static void add_remove_memslot(struct kvm_vm *vm, useconds_t delay,
        int i;
 
        /*
-        * Add the dummy memslot just below the perf_test_util memslot, which is
+        * Add the dummy memslot just below the memstress memslot, which is
         * at the top of the guest physical address space.
         */
        gpa = perf_test_args.gpa - pages * vm->page_size;