LIBKVM += lib/guest_modes.c
LIBKVM += lib/io.c
LIBKVM += lib/kvm_util.c
-LIBKVM += lib/perf_test_util.c
+LIBKVM += lib/memstress.c
LIBKVM += lib/rbtree.c
LIBKVM += lib/sparsebit.c
LIBKVM += lib/test_util.c
LIBKVM_x86_64 += lib/x86_64/apic.c
LIBKVM_x86_64 += lib/x86_64/handlers.S
-LIBKVM_x86_64 += lib/x86_64/perf_test_util.c
+LIBKVM_x86_64 += lib/x86_64/memstress.c
LIBKVM_x86_64 += lib/x86_64/processor.c
LIBKVM_x86_64 += lib/x86_64/svm.c
LIBKVM_x86_64 += lib/x86_64/ucall.c
#include "kvm_util.h"
#include "test_util.h"
-#include "perf_test_util.h"
+#include "memstress.h"
#include "guest_modes.h"
/* Global variable used to synchronize all of the vCPU threads. */
#include "kvm_util.h"
#include "test_util.h"
-#include "perf_test_util.h"
+#include "memstress.h"
#include "guest_modes.h"
#ifdef __NR_userfaultfd
#include "kvm_util.h"
#include "test_util.h"
-#include "perf_test_util.h"
+#include "memstress.h"
#include "guest_modes.h"
#ifdef __aarch64__
--- /dev/null
+// SPDX-License-Identifier: GPL-2.0
+/*
+ * tools/testing/selftests/kvm/include/memstress.h
+ *
+ * Copyright (C) 2020, Google LLC.
+ */
+
+#ifndef SELFTEST_KVM_MEMSTRESS_H
+#define SELFTEST_KVM_MEMSTRESS_H
+
+#include <pthread.h>
+
+#include "kvm_util.h"
+
+/* Default guest test virtual memory offset */
+#define DEFAULT_GUEST_TEST_MEM 0xc0000000
+
+#define DEFAULT_PER_VCPU_MEM_SIZE (1 << 30) /* 1G */
+
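+/*
+ * Test data memslots start at slot 1; slot 0 is reserved by the selftests
+ * framework for guest code, stacks and page tables.
+ */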
+#define PERF_TEST_MEM_SLOT_INDEX 1
+
+struct perf_test_vcpu_args {
+ uint64_t gpa;
+ uint64_t gva;
+ uint64_t pages;
+
+ /* Only used by the host userspace part of the vCPU thread */
+ struct kvm_vcpu *vcpu;
+ int vcpu_idx;
+};
+
+struct perf_test_args {
+ struct kvm_vm *vm;
+ /* The starting address and size of the guest test region. */
+ uint64_t gpa;
+ uint64_t size;
+ uint64_t guest_page_size;
+ uint32_t random_seed;
+ uint32_t write_percent;
+
+ /* Run vCPUs in L2 instead of L1, if the architecture supports it. */
+ bool nested;
+ /* Randomize which pages are accessed by the guest. */
+ bool random_access;
+ /* True if all vCPUs are pinned to pCPUs */
+ bool pin_vcpus;
+ /* The vCPU=>pCPU pinning map. Only valid if pin_vcpus is true. */
+ uint32_t vcpu_to_pcpu[KVM_MAX_VCPUS];
+
+ struct perf_test_vcpu_args vcpu_args[KVM_MAX_VCPUS];
+};
+
+extern struct perf_test_args perf_test_args;
+
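+/*
+ * Typical call sequence (a sketch; "vcpu_worker" stands in for the test's
+ * own per-vCPU thread function):
+ *
+ *	vm = perf_test_create_vm(mode, nr_vcpus, vcpu_memory_bytes, 1,
+ *				 VM_MEM_SRC_ANONYMOUS, true);
+ *	perf_test_set_write_percent(vm, 50);
+ *	perf_test_start_vcpu_threads(nr_vcpus, vcpu_worker);
+ *	... run and measure the test ...
+ *	perf_test_join_vcpu_threads(nr_vcpus);
+ *	perf_test_destroy_vm(vm);
+ */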
+struct kvm_vm *perf_test_create_vm(enum vm_guest_mode mode, int nr_vcpus,
+ uint64_t vcpu_memory_bytes, int slots,
+ enum vm_mem_backing_src_type backing_src,
+ bool partition_vcpu_memory_access);
+void perf_test_destroy_vm(struct kvm_vm *vm);
+
+void perf_test_set_write_percent(struct kvm_vm *vm, uint32_t write_percent);
+void perf_test_set_random_seed(struct kvm_vm *vm, uint32_t random_seed);
+void perf_test_set_random_access(struct kvm_vm *vm, bool random_access);
+
+void perf_test_start_vcpu_threads(int vcpus, void (*vcpu_fn)(struct perf_test_vcpu_args *));
+void perf_test_join_vcpu_threads(int vcpus);
+void perf_test_guest_code(uint32_t vcpu_id);
+
+uint64_t perf_test_nested_pages(int nr_vcpus);
+void perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu *vcpus[]);
+
+#endif /* SELFTEST_KVM_MEMSTRESS_H */
+++ /dev/null
-// SPDX-License-Identifier: GPL-2.0
-/*
- * tools/testing/selftests/kvm/include/perf_test_util.h
- *
- * Copyright (C) 2020, Google LLC.
- */
-
-#ifndef SELFTEST_KVM_PERF_TEST_UTIL_H
-#define SELFTEST_KVM_PERF_TEST_UTIL_H
-
-#include <pthread.h>
-
-#include "kvm_util.h"
-
-/* Default guest test virtual memory offset */
-#define DEFAULT_GUEST_TEST_MEM 0xc0000000
-
-#define DEFAULT_PER_VCPU_MEM_SIZE (1 << 30) /* 1G */
-
-#define PERF_TEST_MEM_SLOT_INDEX 1
-
-struct perf_test_vcpu_args {
- uint64_t gpa;
- uint64_t gva;
- uint64_t pages;
-
- /* Only used by the host userspace part of the vCPU thread */
- struct kvm_vcpu *vcpu;
- int vcpu_idx;
-};
-
-struct perf_test_args {
- struct kvm_vm *vm;
- /* The starting address and size of the guest test region. */
- uint64_t gpa;
- uint64_t size;
- uint64_t guest_page_size;
- uint32_t random_seed;
- uint32_t write_percent;
-
- /* Run vCPUs in L2 instead of L1, if the architecture supports it. */
- bool nested;
- /* Randomize which pages are accessed by the guest. */
- bool random_access;
- /* True if all vCPUs are pinned to pCPUs */
- bool pin_vcpus;
- /* The vCPU=>pCPU pinning map. Only valid if pin_vcpus is true. */
- uint32_t vcpu_to_pcpu[KVM_MAX_VCPUS];
-
- struct perf_test_vcpu_args vcpu_args[KVM_MAX_VCPUS];
-};
-
-extern struct perf_test_args perf_test_args;
-
-struct kvm_vm *perf_test_create_vm(enum vm_guest_mode mode, int nr_vcpus,
- uint64_t vcpu_memory_bytes, int slots,
- enum vm_mem_backing_src_type backing_src,
- bool partition_vcpu_memory_access);
-void perf_test_destroy_vm(struct kvm_vm *vm);
-
-void perf_test_set_write_percent(struct kvm_vm *vm, uint32_t write_percent);
-void perf_test_set_random_seed(struct kvm_vm *vm, uint32_t random_seed);
-void perf_test_set_random_access(struct kvm_vm *vm, bool random_access);
-
-void perf_test_start_vcpu_threads(int vcpus, void (*vcpu_fn)(struct perf_test_vcpu_args *));
-void perf_test_join_vcpu_threads(int vcpus);
-void perf_test_guest_code(uint32_t vcpu_id);
-
-uint64_t perf_test_nested_pages(int nr_vcpus);
-void perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu *vcpus[]);
-
-#endif /* SELFTEST_KVM_PERF_TEST_UTIL_H */
--- /dev/null
+// SPDX-License-Identifier: GPL-2.0
+/*
+ * Copyright (C) 2020, Google LLC.
+ */
+#define _GNU_SOURCE
+
+#include <inttypes.h>
+
+#include "kvm_util.h"
+#include "memstress.h"
+#include "processor.h"
+
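+/* Global test parameters, exported to the guest via sync_global_to_guest(). */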
+struct perf_test_args perf_test_args;
+
+/*
+ * Guest virtual memory offset of the testing memory slot.
+ * Must not conflict with identity mapped test code.
+ */
+static uint64_t guest_test_virt_mem = DEFAULT_GUEST_TEST_MEM;
+
+struct vcpu_thread {
+ /* The index of the vCPU. */
+ int vcpu_idx;
+
+ /* The pthread backing the vCPU. */
+ pthread_t thread;
+
+ /* Set to true once the vCPU thread is up and running. */
+ bool running;
+};
+
+/* The vCPU threads involved in this test. */
+static struct vcpu_thread vcpu_threads[KVM_MAX_VCPUS];
+
+/* The function run by each vCPU thread, as provided by the test. */
+static void (*vcpu_thread_fn)(struct perf_test_vcpu_args *);
+
+/* Set to true once all vCPU threads are up and running. */
+static bool all_vcpu_threads_running;
+
+static struct kvm_vcpu *vcpus[KVM_MAX_VCPUS];
+
+/*
+ * Continuously write to the first 8 bytes of each page in the
+ * specified region.
+ */
+void perf_test_guest_code(uint32_t vcpu_idx)
+{
+ struct perf_test_args *pta = &perf_test_args;
+ struct perf_test_vcpu_args *vcpu_args = &pta->vcpu_args[vcpu_idx];
+ struct guest_random_state rand_state;
+ uint64_t gva;
+ uint64_t pages;
+ uint64_t addr;
+ uint64_t page;
+ int i;
+
+ rand_state = new_guest_random_state(pta->random_seed + vcpu_idx);
+
+ gva = vcpu_args->gva;
+ pages = vcpu_args->pages;
+
+ /* Make sure vCPU args data structure is not corrupt. */
+ GUEST_ASSERT(vcpu_args->vcpu_idx == vcpu_idx);
+
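+	/*
+	 * Each pass makes "pages" accesses, either sequentially over every
+	 * page or to randomly chosen pages, writing with probability
+	 * write_percent and reading otherwise, then returns control to the
+	 * host via GUEST_SYNC().
+	 */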
+ while (true) {
+ for (i = 0; i < pages; i++) {
+ if (pta->random_access)
+ page = guest_random_u32(&rand_state) % pages;
+ else
+ page = i;
+
+ addr = gva + (page * pta->guest_page_size);
+
+ if (guest_random_u32(&rand_state) % 100 < pta->write_percent)
+ *(uint64_t *)addr = 0x0123456789ABCDEF;
+ else
+ READ_ONCE(*(uint64_t *)addr);
+ }
+
+ GUEST_SYNC(1);
+ }
+}
+
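+/*
+ * Carve up the test region among the vCPUs: with partitioned accesses, each
+ * vCPU gets a private, contiguous slice of vcpu_memory_bytes; otherwise,
+ * every vCPU is pointed at the entire region.
+ */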
+void perf_test_setup_vcpus(struct kvm_vm *vm, int nr_vcpus,
+ struct kvm_vcpu *vcpus[],
+ uint64_t vcpu_memory_bytes,
+ bool partition_vcpu_memory_access)
+{
+ struct perf_test_args *pta = &perf_test_args;
+ struct perf_test_vcpu_args *vcpu_args;
+ int i;
+
+ for (i = 0; i < nr_vcpus; i++) {
+ vcpu_args = &pta->vcpu_args[i];
+
+ vcpu_args->vcpu = vcpus[i];
+ vcpu_args->vcpu_idx = i;
+
+ if (partition_vcpu_memory_access) {
+ vcpu_args->gva = guest_test_virt_mem +
+ (i * vcpu_memory_bytes);
+ vcpu_args->pages = vcpu_memory_bytes /
+ pta->guest_page_size;
+ vcpu_args->gpa = pta->gpa + (i * vcpu_memory_bytes);
+ } else {
+ vcpu_args->gva = guest_test_virt_mem;
+ vcpu_args->pages = (nr_vcpus * vcpu_memory_bytes) /
+ pta->guest_page_size;
+ vcpu_args->gpa = pta->gpa;
+ }
+
+ vcpu_args_set(vcpus[i], 1, i);
+
+ pr_debug("Added VCPU %d with test mem gpa [%lx, %lx)\n",
+ i, vcpu_args->gpa, vcpu_args->gpa +
+ (vcpu_args->pages * pta->guest_page_size));
+ }
+}
+
+struct kvm_vm *perf_test_create_vm(enum vm_guest_mode mode, int nr_vcpus,
+ uint64_t vcpu_memory_bytes, int slots,
+ enum vm_mem_backing_src_type backing_src,
+ bool partition_vcpu_memory_access)
+{
+ struct perf_test_args *pta = &perf_test_args;
+ struct kvm_vm *vm;
+ uint64_t guest_num_pages, slot0_pages = 0;
+ uint64_t backing_src_pagesz = get_backing_src_pagesz(backing_src);
+ uint64_t region_end_gfn;
+ int i;
+
+ pr_info("Testing guest mode: %s\n", vm_guest_mode_string(mode));
+
+ /* By default vCPUs will write to memory. */
+ pta->write_percent = 100;
+
+ /*
+ * Snapshot the non-huge page size. This is used by the guest code to
+ * access/dirty pages at the logging granularity.
+ */
+ pta->guest_page_size = vm_guest_mode_params[mode].page_size;
+
+ guest_num_pages = vm_adjust_num_guest_pages(mode,
+ (nr_vcpus * vcpu_memory_bytes) / pta->guest_page_size);
+
+ TEST_ASSERT(vcpu_memory_bytes % getpagesize() == 0,
+ "Guest memory size is not host page size aligned.");
+ TEST_ASSERT(vcpu_memory_bytes % pta->guest_page_size == 0,
+ "Guest memory size is not guest page size aligned.");
+ TEST_ASSERT(guest_num_pages % slots == 0,
+ "Guest memory cannot be evenly divided into %d slots.",
+ slots);
+
+ /*
+ * If using nested, allocate extra pages for the nested page tables and
+ * in-memory data structures.
+ */
+ if (pta->nested)
+ slot0_pages += perf_test_nested_pages(nr_vcpus);
+
+ /*
+ * Pass guest_num_pages to populate the page tables for test memory.
+ * The memory is also added to memslot 0, but that's a benign side
+ * effect as KVM allows aliasing HVAs in memslots.
+ */
+ vm = __vm_create_with_vcpus(mode, nr_vcpus, slot0_pages + guest_num_pages,
+ perf_test_guest_code, vcpus);
+
+ pta->vm = vm;
+
+	/* Put the test region at the top of guest physical memory. */
+ region_end_gfn = vm->max_gfn + 1;
+
+#ifdef __x86_64__
+ /*
+ * When running vCPUs in L2, restrict the test region to 48 bits to
+ * avoid needing 5-level page tables to identity map L2.
+ */
+ if (pta->nested)
+ region_end_gfn = min(region_end_gfn, (1UL << 48) / pta->guest_page_size);
+#endif
+ /*
+ * If there should be more memory in the guest test region than there
+ * can be pages in the guest, it will definitely cause problems.
+ */
+ TEST_ASSERT(guest_num_pages < region_end_gfn,
+ "Requested more guest memory than address space allows.\n"
+ " guest pages: %" PRIx64 " max gfn: %" PRIx64
+ " nr_vcpus: %d wss: %" PRIx64 "]\n",
+ guest_num_pages, region_end_gfn - 1, nr_vcpus, vcpu_memory_bytes);
+
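+	/*
+	 * Carve the region out of the top of the guest physical address
+	 * space, aligning its base down so that it starts on a boundary the
+	 * backing source can map with its largest page size.
+	 */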
+ pta->gpa = (region_end_gfn - guest_num_pages - 1) * pta->guest_page_size;
+ pta->gpa = align_down(pta->gpa, backing_src_pagesz);
+#ifdef __s390x__
+ /* Align to 1M (segment size) */
+ pta->gpa = align_down(pta->gpa, 1 << 20);
+#endif
+ pta->size = guest_num_pages * pta->guest_page_size;
+ pr_info("guest physical test memory: [0x%lx, 0x%lx)\n",
+ pta->gpa, pta->gpa + pta->size);
+
+ /* Add extra memory slots for testing */
+ for (i = 0; i < slots; i++) {
+ uint64_t region_pages = guest_num_pages / slots;
+ vm_paddr_t region_start = pta->gpa + region_pages * pta->guest_page_size * i;
+
+ vm_userspace_mem_region_add(vm, backing_src, region_start,
+ PERF_TEST_MEM_SLOT_INDEX + i,
+ region_pages, 0);
+ }
+
+ /* Do mapping for the demand paging memory slot */
+ virt_map(vm, guest_test_virt_mem, pta->gpa, guest_num_pages);
+
+ perf_test_setup_vcpus(vm, nr_vcpus, vcpus, vcpu_memory_bytes,
+ partition_vcpu_memory_access);
+
+ if (pta->nested) {
+ pr_info("Configuring vCPUs to run in L2 (nested).\n");
+ perf_test_setup_nested(vm, nr_vcpus, vcpus);
+ }
+
+ ucall_init(vm, NULL);
+
+ /* Export the shared variables to the guest. */
+ sync_global_to_guest(vm, perf_test_args);
+
+ return vm;
+}
+
+void perf_test_destroy_vm(struct kvm_vm *vm)
+{
+ ucall_uninit(vm);
+ kvm_vm_free(vm);
+}
+
+void perf_test_set_write_percent(struct kvm_vm *vm, uint32_t write_percent)
+{
+ perf_test_args.write_percent = write_percent;
+ sync_global_to_guest(vm, perf_test_args.write_percent);
+}
+
+void perf_test_set_random_seed(struct kvm_vm *vm, uint32_t random_seed)
+{
+ perf_test_args.random_seed = random_seed;
+ sync_global_to_guest(vm, perf_test_args.random_seed);
+}
+
+void perf_test_set_random_access(struct kvm_vm *vm, bool random_access)
+{
+ perf_test_args.random_access = random_access;
+ sync_global_to_guest(vm, perf_test_args.random_access);
+}
+
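+/*
+ * Weak stubs for architectures without nested virtualization support;
+ * x86-64 overrides them in lib/x86_64/memstress.c.
+ */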
+uint64_t __weak perf_test_nested_pages(int nr_vcpus)
+{
+ return 0;
+}
+
+void __weak perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu **vcpus)
+{
+ pr_info("%s() not support on this architecture, skipping.\n", __func__);
+ exit(KSFT_SKIP);
+}
+
+static void *vcpu_thread_main(void *data)
+{
+ struct vcpu_thread *vcpu = data;
+ int vcpu_idx = vcpu->vcpu_idx;
+
+ if (perf_test_args.pin_vcpus)
+ kvm_pin_this_task_to_pcpu(perf_test_args.vcpu_to_pcpu[vcpu_idx]);
+
+ WRITE_ONCE(vcpu->running, true);
+
+ /*
+ * Wait for all vCPU threads to be up and running before calling the test-
+ * provided vCPU thread function. This prevents thread creation (which
+ * requires taking the mmap_sem in write mode) from interfering with the
+ * guest faulting in its memory.
+ */
+ while (!READ_ONCE(all_vcpu_threads_running))
+ ;
+
+ vcpu_thread_fn(&perf_test_args.vcpu_args[vcpu_idx]);
+
+ return NULL;
+}
+
+void perf_test_start_vcpu_threads(int nr_vcpus,
+ void (*vcpu_fn)(struct perf_test_vcpu_args *))
+{
+ int i;
+
+ vcpu_thread_fn = vcpu_fn;
+ WRITE_ONCE(all_vcpu_threads_running, false);
+
+ for (i = 0; i < nr_vcpus; i++) {
+ struct vcpu_thread *vcpu = &vcpu_threads[i];
+
+ vcpu->vcpu_idx = i;
+ WRITE_ONCE(vcpu->running, false);
+
+ pthread_create(&vcpu->thread, NULL, vcpu_thread_main, vcpu);
+ }
+
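+	/*
+	 * Wait for every thread to check in via vcpu->running, then release
+	 * them into vcpu_fn all at once by setting all_vcpu_threads_running.
+	 */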
+ for (i = 0; i < nr_vcpus; i++) {
+ while (!READ_ONCE(vcpu_threads[i].running))
+ ;
+ }
+
+ WRITE_ONCE(all_vcpu_threads_running, true);
+}
+
+void perf_test_join_vcpu_threads(int nr_vcpus)
+{
+ int i;
+
+ for (i = 0; i < nr_vcpus; i++)
+ pthread_join(vcpu_threads[i].thread, NULL);
+}
+++ /dev/null
-// SPDX-License-Identifier: GPL-2.0
-/*
- * Copyright (C) 2020, Google LLC.
- */
-#define _GNU_SOURCE
-
-#include <inttypes.h>
-
-#include "kvm_util.h"
-#include "perf_test_util.h"
-#include "processor.h"
-
-struct perf_test_args perf_test_args;
-
-/*
- * Guest virtual memory offset of the testing memory slot.
- * Must not conflict with identity mapped test code.
- */
-static uint64_t guest_test_virt_mem = DEFAULT_GUEST_TEST_MEM;
-
-struct vcpu_thread {
- /* The index of the vCPU. */
- int vcpu_idx;
-
- /* The pthread backing the vCPU. */
- pthread_t thread;
-
- /* Set to true once the vCPU thread is up and running. */
- bool running;
-};
-
-/* The vCPU threads involved in this test. */
-static struct vcpu_thread vcpu_threads[KVM_MAX_VCPUS];
-
-/* The function run by each vCPU thread, as provided by the test. */
-static void (*vcpu_thread_fn)(struct perf_test_vcpu_args *);
-
-/* Set to true once all vCPU threads are up and running. */
-static bool all_vcpu_threads_running;
-
-static struct kvm_vcpu *vcpus[KVM_MAX_VCPUS];
-
-/*
- * Continuously write to the first 8 bytes of each page in the
- * specified region.
- */
-void perf_test_guest_code(uint32_t vcpu_idx)
-{
- struct perf_test_args *pta = &perf_test_args;
- struct perf_test_vcpu_args *vcpu_args = &pta->vcpu_args[vcpu_idx];
- struct guest_random_state rand_state;
- uint64_t gva;
- uint64_t pages;
- uint64_t addr;
- uint64_t page;
- int i;
-
- rand_state = new_guest_random_state(pta->random_seed + vcpu_idx);
-
- gva = vcpu_args->gva;
- pages = vcpu_args->pages;
-
- /* Make sure vCPU args data structure is not corrupt. */
- GUEST_ASSERT(vcpu_args->vcpu_idx == vcpu_idx);
-
- while (true) {
- for (i = 0; i < pages; i++) {
- if (pta->random_access)
- page = guest_random_u32(&rand_state) % pages;
- else
- page = i;
-
- addr = gva + (page * pta->guest_page_size);
-
- if (guest_random_u32(&rand_state) % 100 < pta->write_percent)
- *(uint64_t *)addr = 0x0123456789ABCDEF;
- else
- READ_ONCE(*(uint64_t *)addr);
- }
-
- GUEST_SYNC(1);
- }
-}
-
-void perf_test_setup_vcpus(struct kvm_vm *vm, int nr_vcpus,
- struct kvm_vcpu *vcpus[],
- uint64_t vcpu_memory_bytes,
- bool partition_vcpu_memory_access)
-{
- struct perf_test_args *pta = &perf_test_args;
- struct perf_test_vcpu_args *vcpu_args;
- int i;
-
- for (i = 0; i < nr_vcpus; i++) {
- vcpu_args = &pta->vcpu_args[i];
-
- vcpu_args->vcpu = vcpus[i];
- vcpu_args->vcpu_idx = i;
-
- if (partition_vcpu_memory_access) {
- vcpu_args->gva = guest_test_virt_mem +
- (i * vcpu_memory_bytes);
- vcpu_args->pages = vcpu_memory_bytes /
- pta->guest_page_size;
- vcpu_args->gpa = pta->gpa + (i * vcpu_memory_bytes);
- } else {
- vcpu_args->gva = guest_test_virt_mem;
- vcpu_args->pages = (nr_vcpus * vcpu_memory_bytes) /
- pta->guest_page_size;
- vcpu_args->gpa = pta->gpa;
- }
-
- vcpu_args_set(vcpus[i], 1, i);
-
- pr_debug("Added VCPU %d with test mem gpa [%lx, %lx)\n",
- i, vcpu_args->gpa, vcpu_args->gpa +
- (vcpu_args->pages * pta->guest_page_size));
- }
-}
-
-struct kvm_vm *perf_test_create_vm(enum vm_guest_mode mode, int nr_vcpus,
- uint64_t vcpu_memory_bytes, int slots,
- enum vm_mem_backing_src_type backing_src,
- bool partition_vcpu_memory_access)
-{
- struct perf_test_args *pta = &perf_test_args;
- struct kvm_vm *vm;
- uint64_t guest_num_pages, slot0_pages = 0;
- uint64_t backing_src_pagesz = get_backing_src_pagesz(backing_src);
- uint64_t region_end_gfn;
- int i;
-
- pr_info("Testing guest mode: %s\n", vm_guest_mode_string(mode));
-
- /* By default vCPUs will write to memory. */
- pta->write_percent = 100;
-
- /*
- * Snapshot the non-huge page size. This is used by the guest code to
- * access/dirty pages at the logging granularity.
- */
- pta->guest_page_size = vm_guest_mode_params[mode].page_size;
-
- guest_num_pages = vm_adjust_num_guest_pages(mode,
- (nr_vcpus * vcpu_memory_bytes) / pta->guest_page_size);
-
- TEST_ASSERT(vcpu_memory_bytes % getpagesize() == 0,
- "Guest memory size is not host page size aligned.");
- TEST_ASSERT(vcpu_memory_bytes % pta->guest_page_size == 0,
- "Guest memory size is not guest page size aligned.");
- TEST_ASSERT(guest_num_pages % slots == 0,
- "Guest memory cannot be evenly divided into %d slots.",
- slots);
-
- /*
- * If using nested, allocate extra pages for the nested page tables and
- * in-memory data structures.
- */
- if (pta->nested)
- slot0_pages += perf_test_nested_pages(nr_vcpus);
-
- /*
- * Pass guest_num_pages to populate the page tables for test memory.
- * The memory is also added to memslot 0, but that's a benign side
- * effect as KVM allows aliasing HVAs in meslots.
- */
- vm = __vm_create_with_vcpus(mode, nr_vcpus, slot0_pages + guest_num_pages,
- perf_test_guest_code, vcpus);
-
- pta->vm = vm;
-
- /* Put the test region at the top guest physical memory. */
- region_end_gfn = vm->max_gfn + 1;
-
-#ifdef __x86_64__
- /*
- * When running vCPUs in L2, restrict the test region to 48 bits to
- * avoid needing 5-level page tables to identity map L2.
- */
- if (pta->nested)
- region_end_gfn = min(region_end_gfn, (1UL << 48) / pta->guest_page_size);
-#endif
- /*
- * If there should be more memory in the guest test region than there
- * can be pages in the guest, it will definitely cause problems.
- */
- TEST_ASSERT(guest_num_pages < region_end_gfn,
- "Requested more guest memory than address space allows.\n"
- " guest pages: %" PRIx64 " max gfn: %" PRIx64
- " nr_vcpus: %d wss: %" PRIx64 "]\n",
- guest_num_pages, region_end_gfn - 1, nr_vcpus, vcpu_memory_bytes);
-
- pta->gpa = (region_end_gfn - guest_num_pages - 1) * pta->guest_page_size;
- pta->gpa = align_down(pta->gpa, backing_src_pagesz);
-#ifdef __s390x__
- /* Align to 1M (segment size) */
- pta->gpa = align_down(pta->gpa, 1 << 20);
-#endif
- pta->size = guest_num_pages * pta->guest_page_size;
- pr_info("guest physical test memory: [0x%lx, 0x%lx)\n",
- pta->gpa, pta->gpa + pta->size);
-
- /* Add extra memory slots for testing */
- for (i = 0; i < slots; i++) {
- uint64_t region_pages = guest_num_pages / slots;
- vm_paddr_t region_start = pta->gpa + region_pages * pta->guest_page_size * i;
-
- vm_userspace_mem_region_add(vm, backing_src, region_start,
- PERF_TEST_MEM_SLOT_INDEX + i,
- region_pages, 0);
- }
-
- /* Do mapping for the demand paging memory slot */
- virt_map(vm, guest_test_virt_mem, pta->gpa, guest_num_pages);
-
- perf_test_setup_vcpus(vm, nr_vcpus, vcpus, vcpu_memory_bytes,
- partition_vcpu_memory_access);
-
- if (pta->nested) {
- pr_info("Configuring vCPUs to run in L2 (nested).\n");
- perf_test_setup_nested(vm, nr_vcpus, vcpus);
- }
-
- ucall_init(vm, NULL);
-
- /* Export the shared variables to the guest. */
- sync_global_to_guest(vm, perf_test_args);
-
- return vm;
-}
-
-void perf_test_destroy_vm(struct kvm_vm *vm)
-{
- ucall_uninit(vm);
- kvm_vm_free(vm);
-}
-
-void perf_test_set_write_percent(struct kvm_vm *vm, uint32_t write_percent)
-{
- perf_test_args.write_percent = write_percent;
- sync_global_to_guest(vm, perf_test_args.write_percent);
-}
-
-void perf_test_set_random_seed(struct kvm_vm *vm, uint32_t random_seed)
-{
- perf_test_args.random_seed = random_seed;
- sync_global_to_guest(vm, perf_test_args.random_seed);
-}
-
-void perf_test_set_random_access(struct kvm_vm *vm, bool random_access)
-{
- perf_test_args.random_access = random_access;
- sync_global_to_guest(vm, perf_test_args.random_access);
-}
-
-uint64_t __weak perf_test_nested_pages(int nr_vcpus)
-{
- return 0;
-}
-
-void __weak perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu **vcpus)
-{
- pr_info("%s() not support on this architecture, skipping.\n", __func__);
- exit(KSFT_SKIP);
-}
-
-static void *vcpu_thread_main(void *data)
-{
- struct vcpu_thread *vcpu = data;
- int vcpu_idx = vcpu->vcpu_idx;
-
- if (perf_test_args.pin_vcpus)
- kvm_pin_this_task_to_pcpu(perf_test_args.vcpu_to_pcpu[vcpu_idx]);
-
- WRITE_ONCE(vcpu->running, true);
-
- /*
- * Wait for all vCPU threads to be up and running before calling the test-
- * provided vCPU thread function. This prevents thread creation (which
- * requires taking the mmap_sem in write mode) from interfering with the
- * guest faulting in its memory.
- */
- while (!READ_ONCE(all_vcpu_threads_running))
- ;
-
- vcpu_thread_fn(&perf_test_args.vcpu_args[vcpu_idx]);
-
- return NULL;
-}
-
-void perf_test_start_vcpu_threads(int nr_vcpus,
- void (*vcpu_fn)(struct perf_test_vcpu_args *))
-{
- int i;
-
- vcpu_thread_fn = vcpu_fn;
- WRITE_ONCE(all_vcpu_threads_running, false);
-
- for (i = 0; i < nr_vcpus; i++) {
- struct vcpu_thread *vcpu = &vcpu_threads[i];
-
- vcpu->vcpu_idx = i;
- WRITE_ONCE(vcpu->running, false);
-
- pthread_create(&vcpu->thread, NULL, vcpu_thread_main, vcpu);
- }
-
- for (i = 0; i < nr_vcpus; i++) {
- while (!READ_ONCE(vcpu_threads[i].running))
- ;
- }
-
- WRITE_ONCE(all_vcpu_threads_running, true);
-}
-
-void perf_test_join_vcpu_threads(int nr_vcpus)
-{
- int i;
-
- for (i = 0; i < nr_vcpus; i++)
- pthread_join(vcpu_threads[i].thread, NULL);
-}
--- /dev/null
+// SPDX-License-Identifier: GPL-2.0
+/*
+ * x86_64-specific extensions to memstress.c.
+ *
+ * Copyright (C) 2022, Google, Inc.
+ */
+#include <stdio.h>
+#include <stdlib.h>
+#include <linux/bitmap.h>
+#include <linux/bitops.h>
+
+#include "test_util.h"
+#include "kvm_util.h"
+#include "memstress.h"
+#include "processor.h"
+#include "vmx.h"
+
+void perf_test_l2_guest_code(uint64_t vcpu_id)
+{
+ perf_test_guest_code(vcpu_id);
+ vmcall();
+}
+
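+/*
+ * L1 places the vcpu_id at the top of L2's stack; this stub loads it into
+ * %rdi, the first integer argument in the SysV ABI, before calling the C
+ * entry point.  The ud2 traps if perf_test_l2_guest_code() ever returns.
+ */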
+extern char perf_test_l2_guest_entry[];
+__asm__(
+"perf_test_l2_guest_entry:"
+" mov (%rsp), %rdi;"
+" call perf_test_l2_guest_code;"
+" ud2;"
+);
+
+static void perf_test_l1_guest_code(struct vmx_pages *vmx, uint64_t vcpu_id)
+{
+#define L2_GUEST_STACK_SIZE 64
+ unsigned long l2_guest_stack[L2_GUEST_STACK_SIZE];
+ unsigned long *rsp;
+
+ GUEST_ASSERT(vmx->vmcs_gpa);
+ GUEST_ASSERT(prepare_for_vmx_operation(vmx));
+ GUEST_ASSERT(load_vmcs(vmx));
+ GUEST_ASSERT(ept_1g_pages_supported());
+
+ rsp = &l2_guest_stack[L2_GUEST_STACK_SIZE - 1];
+ *rsp = vcpu_id;
+ prepare_vmcs(vmx, perf_test_l2_guest_entry, rsp);
+
+ GUEST_ASSERT(!vmlaunch());
+ GUEST_ASSERT(vmreadz(VM_EXIT_REASON) == EXIT_REASON_VMCALL);
+ GUEST_DONE();
+}
+
+uint64_t perf_test_nested_pages(int nr_vcpus)
+{
+ /*
+ * 513 page tables is enough to identity-map 256 TiB of L2 with 1G
+ * pages and 4-level paging, plus a few pages per-vCPU for data
+ * structures such as the VMCS.
+ */
+ return 513 + 10 * nr_vcpus;
+}
+
+void perf_test_setup_ept(struct vmx_pages *vmx, struct kvm_vm *vm)
+{
+ uint64_t start, end;
+
+ prepare_eptp(vmx, vm, 0);
+
+ /*
+ * Identity map the first 4G and the test region with 1G pages so that
+ * KVM can shadow the EPT12 with the maximum huge page size supported
+ * by the backing source.
+ */
+ nested_identity_map_1g(vmx, vm, 0, 0x100000000ULL);
+
+ start = align_down(perf_test_args.gpa, PG_SIZE_1G);
+ end = align_up(perf_test_args.gpa + perf_test_args.size, PG_SIZE_1G);
+ nested_identity_map_1g(vmx, vm, start, end - start);
+}
+
+void perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu *vcpus[])
+{
+ struct vmx_pages *vmx, *vmx0 = NULL;
+ struct kvm_regs regs;
+ vm_vaddr_t vmx_gva;
+ int vcpu_id;
+
+ TEST_REQUIRE(kvm_cpu_has(X86_FEATURE_VMX));
+
+ for (vcpu_id = 0; vcpu_id < nr_vcpus; vcpu_id++) {
+ vmx = vcpu_alloc_vmx(vm, &vmx_gva);
+
+ if (vcpu_id == 0) {
+ perf_test_setup_ept(vmx, vm);
+ vmx0 = vmx;
+ } else {
+ /* Share the same EPT table across all vCPUs. */
+ vmx->eptp = vmx0->eptp;
+ vmx->eptp_hva = vmx0->eptp_hva;
+ vmx->eptp_gpa = vmx0->eptp_gpa;
+ }
+
+ /*
+ * Override the vCPU to run perf_test_l1_guest_code() which will
+ * bounce it into L2 before calling perf_test_guest_code().
+ */
+		vcpu_regs_get(vcpus[vcpu_id], &regs);
+		regs.rip = (unsigned long) perf_test_l1_guest_code;
+		vcpu_regs_set(vcpus[vcpu_id], &regs);
+ vcpu_args_set(vcpus[vcpu_id], 2, vmx_gva, vcpu_id);
+ }
+}
+++ /dev/null
-// SPDX-License-Identifier: GPL-2.0
-/*
- * x86_64-specific extensions to perf_test_util.c.
- *
- * Copyright (C) 2022, Google, Inc.
- */
-#include <stdio.h>
-#include <stdlib.h>
-#include <linux/bitmap.h>
-#include <linux/bitops.h>
-
-#include "test_util.h"
-#include "kvm_util.h"
-#include "perf_test_util.h"
-#include "processor.h"
-#include "vmx.h"
-
-void perf_test_l2_guest_code(uint64_t vcpu_id)
-{
- perf_test_guest_code(vcpu_id);
- vmcall();
-}
-
-extern char perf_test_l2_guest_entry[];
-__asm__(
-"perf_test_l2_guest_entry:"
-" mov (%rsp), %rdi;"
-" call perf_test_l2_guest_code;"
-" ud2;"
-);
-
-static void perf_test_l1_guest_code(struct vmx_pages *vmx, uint64_t vcpu_id)
-{
-#define L2_GUEST_STACK_SIZE 64
- unsigned long l2_guest_stack[L2_GUEST_STACK_SIZE];
- unsigned long *rsp;
-
- GUEST_ASSERT(vmx->vmcs_gpa);
- GUEST_ASSERT(prepare_for_vmx_operation(vmx));
- GUEST_ASSERT(load_vmcs(vmx));
- GUEST_ASSERT(ept_1g_pages_supported());
-
- rsp = &l2_guest_stack[L2_GUEST_STACK_SIZE - 1];
- *rsp = vcpu_id;
- prepare_vmcs(vmx, perf_test_l2_guest_entry, rsp);
-
- GUEST_ASSERT(!vmlaunch());
- GUEST_ASSERT(vmreadz(VM_EXIT_REASON) == EXIT_REASON_VMCALL);
- GUEST_DONE();
-}
-
-uint64_t perf_test_nested_pages(int nr_vcpus)
-{
- /*
- * 513 page tables is enough to identity-map 256 TiB of L2 with 1G
- * pages and 4-level paging, plus a few pages per-vCPU for data
- * structures such as the VMCS.
- */
- return 513 + 10 * nr_vcpus;
-}
-
-void perf_test_setup_ept(struct vmx_pages *vmx, struct kvm_vm *vm)
-{
- uint64_t start, end;
-
- prepare_eptp(vmx, vm, 0);
-
- /*
- * Identity map the first 4G and the test region with 1G pages so that
- * KVM can shadow the EPT12 with the maximum huge page size supported
- * by the backing source.
- */
- nested_identity_map_1g(vmx, vm, 0, 0x100000000ULL);
-
- start = align_down(perf_test_args.gpa, PG_SIZE_1G);
- end = align_up(perf_test_args.gpa + perf_test_args.size, PG_SIZE_1G);
- nested_identity_map_1g(vmx, vm, start, end - start);
-}
-
-void perf_test_setup_nested(struct kvm_vm *vm, int nr_vcpus, struct kvm_vcpu *vcpus[])
-{
- struct vmx_pages *vmx, *vmx0 = NULL;
- struct kvm_regs regs;
- vm_vaddr_t vmx_gva;
- int vcpu_id;
-
- TEST_REQUIRE(kvm_cpu_has(X86_FEATURE_VMX));
-
- for (vcpu_id = 0; vcpu_id < nr_vcpus; vcpu_id++) {
- vmx = vcpu_alloc_vmx(vm, &vmx_gva);
-
- if (vcpu_id == 0) {
- perf_test_setup_ept(vmx, vm);
- vmx0 = vmx;
- } else {
- /* Share the same EPT table across all vCPUs. */
- vmx->eptp = vmx0->eptp;
- vmx->eptp_hva = vmx0->eptp_hva;
- vmx->eptp_gpa = vmx0->eptp_gpa;
- }
-
- /*
- * Override the vCPU to run perf_test_l1_guest_code() which will
- * bounce it into L2 before calling perf_test_guest_code().
- */
-		vcpu_regs_get(vcpus[vcpu_id], &regs);
-		regs.rip = (unsigned long) perf_test_l1_guest_code;
-		vcpu_regs_set(vcpus[vcpu_id], &regs);
- vcpu_args_set(vcpus[vcpu_id], 2, vmx_gva, vcpu_id);
- }
-}
#include <linux/bitops.h>
#include <linux/userfaultfd.h>
-#include "perf_test_util.h"
+#include "memstress.h"
#include "processor.h"
#include "test_util.h"
#include "guest_modes.h"
int i;
/*
- * Add the dummy memslot just below the perf_test_util memslot, which is
+ * Add the dummy memslot just below the memstress memslot, which is
* at the top of the guest physical address space.
*/
gpa = perf_test_args.gpa - pages * vm->page_size;