Drivers: hv: vmbus: Don't bind the offer&rescind works to a specific CPU
authorAndrea Parri (Microsoft) <parri.andrea@gmail.com>
Mon, 6 Apr 2020 00:15:05 +0000 (02:15 +0200)
committerWei Liu <wei.liu@kernel.org>
Thu, 23 Apr 2020 13:17:11 +0000 (13:17 +0000)
The offer and rescind works are currently scheduled on the so called
"connect CPU".  However, this is not really needed: we can synchronize
the works by relying on the usage of the offer_in_progress counter and
of the channel_mutex mutex.  This synchronization is already in place.
So, remove this unnecessary "bind to the connect CPU" constraint and
update the inline comments accordingly.

Suggested-by: Dexuan Cui <decui@microsoft.com>
Signed-off-by: Andrea Parri (Microsoft) <parri.andrea@gmail.com>
Link: https://lore.kernel.org/r/20200406001514.19876-3-parri.andrea@gmail.com
Reviewed-by: Michael Kelley <mikelley@microsoft.com>
Signed-off-by: Wei Liu <wei.liu@kernel.org>
drivers/hv/channel_mgmt.c
drivers/hv/vmbus_drv.c

index 3a5700c8486afe0ca48509d4daf25ebd1a3779af..0ced32ef2715a54a6bcabc91b61037fdc71fa99c 100644 (file)
@@ -1028,11 +1028,22 @@ static void vmbus_onoffer_rescind(struct vmbus_channel_message_header *hdr)
         * offer comes in first and then the rescind.
         * Since we process these events in work elements,
         * and with preemption, we may end up processing
-        * the events out of order. Given that we handle these
-        * work elements on the same CPU, this is possible only
-        * in the case of preemption. In any case wait here
-        * until the offer processing has moved beyond the
-        * point where the channel is discoverable.
+        * the events out of order.  We rely on the synchronization
+        * provided by offer_in_progress and by channel_mutex for
+        * ordering these events:
+        *
+        * { Initially: offer_in_progress = 1 }
+        *
+        * CPU1                         CPU2
+        *
+        * [vmbus_process_offer()]      [vmbus_onoffer_rescind()]
+        *
+        * LOCK channel_mutex           WAIT_ON offer_in_progress == 0
+        * DECREMENT offer_in_progress  LOCK channel_mutex
+        * INSERT chn_list              SEARCH chn_list
+        * UNLOCK channel_mutex         UNLOCK channel_mutex
+        *
+        * Forbids: CPU2's SEARCH from *not* seeing CPU1's INSERT
         */
 
        while (atomic_read(&vmbus_connection.offer_in_progress) != 0) {
index 495337ec68f13d419a48caac5504ba10a91838ba..1f3e69d18d3563e91262aad9ec1ee39b9e783fb8 100644 (file)
@@ -1101,8 +1101,9 @@ void vmbus_on_msg_dpc(unsigned long data)
                /*
                 * The host can generate a rescind message while we
                 * may still be handling the original offer. We deal with
-                * this condition by ensuring the processing is done on the
-                * same CPU.
+                * this condition by relying on the synchronization provided
+                * by offer_in_progress and by channel_mutex.  See also the
+                * inline comments in vmbus_onoffer_rescind().
                 */
                switch (hdr->msgtype) {
                case CHANNELMSG_RESCIND_CHANNELOFFER:
@@ -1124,16 +1125,34 @@ void vmbus_on_msg_dpc(unsigned long data)
                         * work queue: the RESCIND handler can not start to
                         * run before the OFFER handler finishes.
                         */
-                       schedule_work_on(VMBUS_CONNECT_CPU,
-                                        &ctx->work);
+                       schedule_work(&ctx->work);
                        break;
 
                case CHANNELMSG_OFFERCHANNEL:
+                       /*
+                        * The host sends the offer message of a given channel
+                        * before sending the rescind message of the same
+                        * channel.  These messages are sent to the guest's
+                        * connect CPU; the guest then starts processing them
+                        * in the tasklet handler on this CPU:
+                        *
+                        * VMBUS_CONNECT_CPU
+                        *
+                        * [vmbus_on_msg_dpc()]
+                        * atomic_inc()  // CHANNELMSG_OFFERCHANNEL
+                        * queue_work()
+                        * ...
+                        * [vmbus_on_msg_dpc()]
+                        * schedule_work()  // CHANNELMSG_RESCIND_CHANNELOFFER
+                        *
+                        * We rely on the memory-ordering properties of the
+                        * queue_work() and schedule_work() primitives, which
+                        * guarantee that the atomic increment will be visible
+                        * to the CPUs which will execute the offer & rescind
+                        * works by the time these works will start execution.
+                        */
                        atomic_inc(&vmbus_connection.offer_in_progress);
-                       queue_work_on(VMBUS_CONNECT_CPU,
-                                     vmbus_connection.work_queue,
-                                     &ctx->work);
-                       break;
+                       fallthrough;
 
                default:
                        queue_work(vmbus_connection.work_queue, &ctx->work);
@@ -1178,9 +1197,7 @@ static void vmbus_force_channel_rescinded(struct vmbus_channel *channel)
 
        INIT_WORK(&ctx->work, vmbus_onmessage_work);
 
-       queue_work_on(VMBUS_CONNECT_CPU,
-                     vmbus_connection.work_queue,
-                     &ctx->work);
+       queue_work(vmbus_connection.work_queue, &ctx->work);
 }
 #endif /* CONFIG_PM_SLEEP */