thebeanogamer / rpms / qemu-kvm

Forked from rpms/qemu-kvm 5 months ago
Clone

Blame SOURCES/kvm-qemu-thread-posix-cleanup-fix-document-QemuEvent.patch

ed5979
From aa61e4c437d29a791ea09a01f7230231f1e53356 Mon Sep 17 00:00:00 2001
ed5979
From: Emanuele Giuseppe Esposito <eesposit@redhat.com>
ed5979
Date: Thu, 9 Mar 2023 08:24:36 -0500
ed5979
Subject: [PATCH 05/12] qemu-thread-posix: cleanup, fix, document QemuEvent
ed5979
ed5979
RH-Author: Emanuele Giuseppe Esposito <eesposit@redhat.com>
ed5979
RH-MergeRequest: 158: qatomic: add smp_mb__before/after_rmw()
ed5979
RH-Bugzilla: 2175660
ed5979
RH-Acked-by: Paolo Bonzini <pbonzini@redhat.com>
ed5979
RH-Acked-by: Cornelia Huck <cohuck@redhat.com>
ed5979
RH-Acked-by: David Hildenbrand <david@redhat.com>
ed5979
RH-Acked-by: Eric Auger <eric.auger@redhat.com>
ed5979
RH-Commit: [2/9] c3bdf75f884e137c667316aaac96bb4a0b9ec2d9 (eesposit/qemu-kvm)
ed5979
ed5979
Bugzilla: https://bugzilla.redhat.com/show_bug.cgi?id=2175660
ed5979
ed5979
commit 9586a1329f5dce6c1d7f4de53cf0536644d7e593
ed5979
Author: Paolo Bonzini <pbonzini@redhat.com>
ed5979
Date:   Thu Mar 2 11:19:52 2023 +0100
ed5979
ed5979
    qemu-thread-posix: cleanup, fix, document QemuEvent
ed5979
ed5979
    QemuEvent is currently broken on ARM due to missing memory barriers
ed5979
    after qatomic_*().  Apart from adding the memory barrier, a closer look
ed5979
    reveals some unpaired memory barriers too.  Document more clearly what
ed5979
    is going on.
ed5979
ed5979
    Reviewed-by: Richard Henderson <richard.henderson@linaro.org>
ed5979
    Reviewed-by: David Hildenbrand <david@redhat.com>
ed5979
    Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
ed5979
ed5979
Signed-off-by: Emanuele Giuseppe Esposito <eesposit@redhat.com>
ed5979
---
ed5979
 util/qemu-thread-posix.c | 69 ++++++++++++++++++++++++++++------------
ed5979
 1 file changed, 49 insertions(+), 20 deletions(-)
ed5979
ed5979
diff --git a/util/qemu-thread-posix.c b/util/qemu-thread-posix.c
ed5979
index bae938c670..cc74f4ede0 100644
ed5979
--- a/util/qemu-thread-posix.c
ed5979
+++ b/util/qemu-thread-posix.c
ed5979
@@ -379,13 +379,21 @@ void qemu_event_destroy(QemuEvent *ev)
ed5979
 
ed5979
 void qemu_event_set(QemuEvent *ev)
ed5979
 {
ed5979
-    /* qemu_event_set has release semantics, but because it *loads*
ed5979
+    assert(ev->initialized);
ed5979
+
ed5979
+    /*
ed5979
+     * Pairs with both qemu_event_reset() and qemu_event_wait().
ed5979
+     *
ed5979
+     * qemu_event_set has release semantics, but because it *loads*
ed5979
      * ev->value we need a full memory barrier here.
ed5979
      */
ed5979
-    assert(ev->initialized);
ed5979
     smp_mb();
ed5979
     if (qatomic_read(&ev->value) != EV_SET) {
ed5979
-        if (qatomic_xchg(&ev->value, EV_SET) == EV_BUSY) {
ed5979
+        int old = qatomic_xchg(&ev->value, EV_SET);
ed5979
+
ed5979
+        /* Pairs with memory barrier in kernel futex_wait system call.  */
ed5979
+        smp_mb__after_rmw();
ed5979
+        if (old == EV_BUSY) {
ed5979
             /* There were waiters, wake them up.  */
ed5979
             qemu_futex_wake(ev, INT_MAX);
ed5979
         }
ed5979
@@ -394,18 +402,19 @@ void qemu_event_set(QemuEvent *ev)
ed5979
 
ed5979
 void qemu_event_reset(QemuEvent *ev)
ed5979
 {
ed5979
-    unsigned value;
ed5979
-
ed5979
     assert(ev->initialized);
ed5979
-    value = qatomic_read(&ev->value);
ed5979
-    smp_mb_acquire();
ed5979
-    if (value == EV_SET) {
ed5979
-        /*
ed5979
-         * If there was a concurrent reset (or even reset+wait),
ed5979
-         * do nothing.  Otherwise change EV_SET->EV_FREE.
ed5979
-         */
ed5979
-        qatomic_or(&ev->value, EV_FREE);
ed5979
-    }
ed5979
+
ed5979
+    /*
ed5979
+     * If there was a concurrent reset (or even reset+wait),
ed5979
+     * do nothing.  Otherwise change EV_SET->EV_FREE.
ed5979
+     */
ed5979
+    qatomic_or(&ev->value, EV_FREE);
ed5979
+
ed5979
+    /*
ed5979
+     * Order reset before checking the condition in the caller.
ed5979
+     * Pairs with the first memory barrier in qemu_event_set().
ed5979
+     */
ed5979
+    smp_mb__after_rmw();
ed5979
 }
ed5979
 
ed5979
 void qemu_event_wait(QemuEvent *ev)
ed5979
@@ -413,20 +422,40 @@ void qemu_event_wait(QemuEvent *ev)
ed5979
     unsigned value;
ed5979
 
ed5979
     assert(ev->initialized);
ed5979
-    value = qatomic_read(&ev->value);
ed5979
-    smp_mb_acquire();
ed5979
+
ed5979
+    /*
ed5979
+     * qemu_event_wait must synchronize with qemu_event_set even if it does
ed5979
+     * not go down the slow path, so a load-acquire is needed here; it
ed5979
+     * synchronizes with the first memory barrier in qemu_event_set().
ed5979
+     *
ed5979
+     * If we do go down the slow path, there is no requirement at all: we
ed5979
+     * might miss a qemu_event_set() here but ultimately the memory barrier in
ed5979
+     * qemu_futex_wait() will ensure the check is done correctly.
ed5979
+     */
ed5979
+    value = qatomic_load_acquire(&ev->value);
ed5979
     if (value != EV_SET) {
ed5979
         if (value == EV_FREE) {
ed5979
             /*
ed5979
-             * Leave the event reset and tell qemu_event_set that there
ed5979
-             * are waiters.  No need to retry, because there cannot be
ed5979
-             * a concurrent busy->free transition.  After the CAS, the
ed5979
-             * event will be either set or busy.
ed5979
+             * Leave the event reset and tell qemu_event_set that there are
ed5979
+             * waiters.  No need to retry, because there cannot be a concurrent
ed5979
+             * busy->free transition.  After the CAS, the event will be either
ed5979
+             * set or busy.
ed5979
+             *
ed5979
+             * This cmpxchg doesn't have particular ordering requirements if it
ed5979
+             * succeeds (moving the store earlier can only cause qemu_event_set()
ed5979
+             * to issue _more_ wakeups); the failing case needs acquire semantics
ed5979
+             * like the load above.
ed5979
              */
ed5979
             if (qatomic_cmpxchg(&ev->value, EV_FREE, EV_BUSY) == EV_SET) {
ed5979
                 return;
ed5979
             }
ed5979
         }
ed5979
+
ed5979
+        /*
ed5979
+         * This is the final check for a concurrent set, so it does need
ed5979
+         * a smp_mb() pairing with the second barrier of qemu_event_set().
ed5979
+         * The barrier is inside the FUTEX_WAIT system call.
ed5979
+         */
ed5979
         qemu_futex_wait(ev, EV_BUSY);
ed5979
     }
ed5979
 }
ed5979
-- 
ed5979
2.39.1
ed5979