cpu-exec: simplify jump cache management

author Paolo Bonzini <pbonzini@redhat.com>

Mon, 22 Jan 2024 15:34:09 +0000 (16:34 +0100)

committer Richard Henderson <richard.henderson@linaro.org>

Sun, 28 Jan 2024 21:06:03 +0000 (07:06 +1000)
author Paolo Bonzini <pbonzini@redhat.com>
Mon, 22 Jan 2024 15:34:09 +0000 (16:34 +0100)
committer Richard Henderson <richard.henderson@linaro.org>
Sun, 28 Jan 2024 21:06:03 +0000 (07:06 +1000)
diff --git a/accel/tcg/cpu-exec.c b/accel/tcg/cpu-exec.c

index 67eda9865ee2a89f7d5a4f3a4142efb1a869d4fd..40c268bfa1f3060eda62061b3263ab3c4af3abda 100644 (file)
--- a/accel/tcg/cpu-exec.c
+++ b/accel/tcg/cpu-exec.c
@@ -253,43 +253,29 @@ static inline TranslationBlock *tb_lookup(CPUState *cpu, vaddr pc,
      hash = tb_jmp_cache_hash_func(pc);
      jc = cpu->tb_jmp_cache;
  
-    if (cflags & CF_PCREL) {
-        /* Use acquire to ensure current load of pc from jc. */
-        tb = qatomic_load_acquire(&jc->array[hash].tb);
-
-        if (likely(tb &&
-                   jc->array[hash].pc == pc &&
-                   tb->cs_base == cs_base &&
-                   tb->flags == flags &&
-                   tb_cflags(tb) == cflags)) {
-            return tb;
-        }
-        tb = tb_htable_lookup(cpu, pc, cs_base, flags, cflags);
-        if (tb == NULL) {
-            return NULL;
-        }
-        jc->array[hash].pc = pc;
-        /* Ensure pc is written first. */
-        qatomic_store_release(&jc->array[hash].tb, tb);
-    } else {
-        /* Use rcu_read to ensure current load of pc from *tb. */
-        tb = qatomic_rcu_read(&jc->array[hash].tb);
-
-        if (likely(tb &&
-                   tb->pc == pc &&
-                   tb->cs_base == cs_base &&
-                   tb->flags == flags &&
-                   tb_cflags(tb) == cflags)) {
-            return tb;
-        }
-        tb = tb_htable_lookup(cpu, pc, cs_base, flags, cflags);
-        if (tb == NULL) {
-            return NULL;
-        }
-        /* Use the pc value already stored in tb->pc. */
-        qatomic_set(&jc->array[hash].tb, tb);
+    tb = qatomic_read(&jc->array[hash].tb);
+    if (likely(tb &&
+               jc->array[hash].pc == pc &&
+               tb->cs_base == cs_base &&
+               tb->flags == flags &&
+               tb_cflags(tb) == cflags)) {
+        goto hit;
      }
  
+    tb = tb_htable_lookup(cpu, pc, cs_base, flags, cflags);
+    if (tb == NULL) {
+        return NULL;
+    }
+
+    jc->array[hash].pc = pc;
+    qatomic_set(&jc->array[hash].tb, tb);
+
+hit:
+    /*
+     * As long as tb is not NULL, the contents are consistent.  Therefore,
+     * the virtual PC has to match for non-CF_PCREL translations.
+     */
+    assert((tb_cflags(tb) & CF_PCREL) || tb->pc == pc);
      return tb;
  }
  
@@ -1012,14 +998,8 @@ cpu_exec_loop(CPUState *cpu, SyncClocks *sc)
                   */
                  h = tb_jmp_cache_hash_func(pc);
                  jc = cpu->tb_jmp_cache;
-                if (cflags & CF_PCREL) {
-                    jc->array[h].pc = pc;
-                    /* Ensure pc is written first. */
-                    qatomic_store_release(&jc->array[h].tb, tb);
-                } else {
-                    /* Use the pc value already stored in tb->pc. */
-                    qatomic_set(&jc->array[h].tb, tb);
-                }
+                jc->array[h].pc = pc;
+                qatomic_set(&jc->array[h].tb, tb);
              }
  
  #ifndef CONFIG_USER_ONLY
diff --git a/accel/tcg/tb-jmp-cache.h b/accel/tcg/tb-jmp-cache.h

index bb424c8a05b75c47e99ffe9bbe5c849725b6a549..4ab8553afcc02ff2cc754d1ff545bda9b29830f9 100644 (file)
--- a/accel/tcg/tb-jmp-cache.h
+++ b/accel/tcg/tb-jmp-cache.h
@@ -13,9 +13,11 @@
  #define TB_JMP_CACHE_SIZE (1 << TB_JMP_CACHE_BITS)
  
  /*
- * Accessed in parallel; all accesses to 'tb' must be atomic.
- * For CF_PCREL, accesses to 'pc' must be protected by a
- * load_acquire/store_release to 'tb'.
+ * Invalidated in parallel; all accesses to 'tb' must be atomic.
+ * A valid entry is read/written by a single CPU, therefore there is
+ * no need for qatomic_rcu_read() and pc is always consistent with a
+ * non-NULL value of 'tb'.  Strictly speaking, pc is only needed for
+ * CF_PCREL, but it is always used for simplicity.
   */
  struct CPUJumpCache {
      struct rcu_head rcu;
author	Paolo Bonzini <pbonzini@redhat.com>
	Mon, 22 Jan 2024 15:34:09 +0000 (16:34 +0100)
committer	Richard Henderson <richard.henderson@linaro.org>
	Sun, 28 Jan 2024 21:06:03 +0000 (07:06 +1000)
accel/tcg/cpu-exec.c		patch \| blob \| history
accel/tcg/tb-jmp-cache.h		patch \| blob \| history