overcommit: introduce mem-lock=on-fault

author Daniil Tatianin <d-tatianin@yandex-team.ru>

Wed, 12 Feb 2025 14:39:20 +0000 (17:39 +0300)

committer Peter Xu <peterx@redhat.com>

Wed, 12 Feb 2025 16:36:13 +0000 (11:36 -0500)
author Daniil Tatianin <d-tatianin@yandex-team.ru>
Wed, 12 Feb 2025 14:39:20 +0000 (17:39 +0300)
committer Peter Xu <peterx@redhat.com>
Wed, 12 Feb 2025 16:36:13 +0000 (11:36 -0500)
diff --git a/include/system/system.h b/include/system/system.h

index dc7628357abf5b4dce3bf0827eebb9f8db44c5af..a7effe7dfd8b2b9b015a55ffd2c0794ed8d32b4e 100644 (file)
--- a/include/system/system.h
+++ b/include/system/system.h
@@ -50,9 +50,11 @@ extern QEMUClockType rtc_clock;
  typedef enum {
      MLOCK_OFF = 0,
      MLOCK_ON,
+    MLOCK_ON_FAULT,
  } MlockState;
  
  bool should_mlock(MlockState);
+bool is_mlock_on_fault(MlockState);
  
  extern MlockState mlock_state;
  
diff --git a/migration/postcopy-ram.c b/migration/postcopy-ram.c

index 04068ee0394d50833540e35b6247acf440fa3dbb..5d3edfcfec73d1559d1257fbf16727449f45d39c 100644 (file)
--- a/migration/postcopy-ram.c
+++ b/migration/postcopy-ram.c
@@ -652,7 +652,7 @@ int postcopy_ram_incoming_cleanup(MigrationIncomingState *mis)
      }
  
      if (should_mlock(mlock_state)) {
-        if (os_mlock(false) < 0) {
+        if (os_mlock(is_mlock_on_fault(mlock_state)) < 0) {
              error_report("mlock: %s", strerror(errno));
              /*
               * It doesn't feel right to fail at this point, we have a valid
diff --git a/qemu-options.hx b/qemu-options.hx

index 1b26ad53bda760b3762e8bf23f706901798d22ff..61270e3206701d840c5bc68c219eec80b44bfef8 100644 (file)
--- a/qemu-options.hx
+++ b/qemu-options.hx
@@ -4632,21 +4632,25 @@ SRST
  ERST
  
  DEF("overcommit", HAS_ARG, QEMU_OPTION_overcommit,
-    "-overcommit [mem-lock=on|off][cpu-pm=on|off]\n"
+    "-overcommit [mem-lock=on|off|on-fault][cpu-pm=on|off]\n"
      "                run qemu with overcommit hints\n"
-    "                mem-lock=on|off controls memory lock support (default: off)\n"
+    "                mem-lock=on|off|on-fault controls memory lock support (default: off)\n"
      "                cpu-pm=on|off controls cpu power management (default: off)\n",
      QEMU_ARCH_ALL)
  SRST
-``-overcommit mem-lock=on|off``
+``-overcommit mem-lock=on|off|on-fault``
    \ 
  ``-overcommit cpu-pm=on|off``
      Run qemu with hints about host resource overcommit. The default is
      to assume that host overcommits all resources.
  
      Locking qemu and guest memory can be enabled via ``mem-lock=on``
-    (disabled by default). This works when host memory is not
-    overcommitted and reduces the worst-case latency for guest.
+    or ``mem-lock=on-fault`` (disabled by default). This works when
+    host memory is not overcommitted and reduces the worst-case latency for
+    guest. The on-fault option is better for reducing the memory footprint
+    since it makes allocations lazy, but the pages still get locked in place
+    once faulted by the guest or QEMU. Note that ``mem-lock=on`` and
+    ``mem-lock=on-fault`` are mutually exclusive.
  
      Guest ability to manage power state of host cpus (increasing latency
      for other processes on the same host cpu, but decreasing latency for
diff --git a/system/globals.c b/system/globals.c

index adeff383484648f499c0552d963bbb64d065f6ec..316623bd20af32840d0f2d7740804c25af86b850 100644 (file)
--- a/system/globals.c
+++ b/system/globals.c
@@ -33,7 +33,12 @@
  
  bool should_mlock(MlockState state)
  {
-    return state == MLOCK_ON;
+    return state == MLOCK_ON || state == MLOCK_ON_FAULT;
+}
+
+bool is_mlock_on_fault(MlockState state)
+{
+    return state == MLOCK_ON_FAULT;
  }
  
  enum vga_retrace_method vga_retrace_method = VGA_RETRACE_DUMB;
diff --git a/system/vl.c b/system/vl.c

index 2895824c1ad65fe9f35b81fde82add721e95c22f..3c0fa2ff642ccc1d6c85fd7223ea0e143913f219 100644 (file)
--- a/system/vl.c
+++ b/system/vl.c
@@ -351,7 +351,7 @@ static QemuOptsList qemu_overcommit_opts = {
      .desc = {
          {
              .name = "mem-lock",
-            .type = QEMU_OPT_BOOL,
+            .type = QEMU_OPT_STRING,
          },
          {
              .name = "cpu-pm",
@@ -797,7 +797,7 @@ static QemuOptsList qemu_run_with_opts = {
  static void realtime_init(void)
  {
      if (should_mlock(mlock_state)) {
-        if (os_mlock(false) < 0) {
+        if (os_mlock(is_mlock_on_fault(mlock_state)) < 0) {
              error_report("locking memory failed");
              exit(1);
          }
@@ -1878,7 +1878,7 @@ static void object_option_parse(const char *str)
  static void overcommit_parse(const char *str)
  {
      QemuOpts *opts;
-    bool enable_mlock;
+    const char *mem_lock_opt;
  
      opts = qemu_opts_parse_noisily(qemu_find_opts("overcommit"),
                                     str, false);
@@ -1886,11 +1886,31 @@ static void overcommit_parse(const char *str)
          exit(1);
      }
  
-    enable_mlock = qemu_opt_get_bool(opts, "mem-lock",
-                                     should_mlock(mlock_state));
-    mlock_state = enable_mlock ? MLOCK_ON : MLOCK_OFF;
-
      enable_cpu_pm = qemu_opt_get_bool(opts, "cpu-pm", enable_cpu_pm);
+
+    mem_lock_opt = qemu_opt_get(opts, "mem-lock");
+    if (!mem_lock_opt) {
+        return;
+    }
+
+    if (strcmp(mem_lock_opt, "on") == 0) {
+        mlock_state = MLOCK_ON;
+        return;
+    }
+
+    if (strcmp(mem_lock_opt, "off") == 0) {
+        mlock_state = MLOCK_OFF;
+        return;
+    }
+
+    if (strcmp(mem_lock_opt, "on-fault") == 0) {
+        mlock_state = MLOCK_ON_FAULT;
+        return;
+    }
+
+    error_report("parameter 'mem-lock' expects one of "
+                 "'on', 'off', 'on-fault'");
+    exit(1);
  }
  
  /*
author	Daniil Tatianin <d-tatianin@yandex-team.ru>
	Wed, 12 Feb 2025 14:39:20 +0000 (17:39 +0300)
committer	Peter Xu <peterx@redhat.com>
	Wed, 12 Feb 2025 16:36:13 +0000 (11:36 -0500)
include/system/system.h		patch | blob | history
migration/postcopy-ram.c		patch | blob | history
qemu-options.hx		patch | blob | history
system/globals.c		patch | blob | history
system/vl.c		patch | blob | history