coroutine-lock: add mutex argument to CoQueue APIs

author Paolo Bonzini <pbonzini@redhat.com>

Mon, 13 Feb 2017 18:12:43 +0000 (19:12 +0100)

committer Stefan Hajnoczi <stefanha@redhat.com>

Tue, 21 Feb 2017 11:39:40 +0000 (11:39 +0000)
author Paolo Bonzini <pbonzini@redhat.com>
Mon, 13 Feb 2017 18:12:43 +0000 (19:12 +0100)
committer Stefan Hajnoczi <stefanha@redhat.com>
Tue, 21 Feb 2017 11:39:40 +0000 (11:39 +0000)
diff --git a/block/backup.c b/block/backup.c

index ea387338495f145ddac3cc2899ed4c701ea60d11..fe010e78e33cbb9c232e90a7ac38850bdf6905d4 100644 (file)
--- a/block/backup.c
+++ b/block/backup.c
@@ -64,7 +64,7 @@ static void coroutine_fn wait_for_overlapping_requests(BackupBlockJob *job,
          retry = false;
          QLIST_FOREACH(req, &job->inflight_reqs, list) {
              if (end > req->start && start < req->end) {
-                qemu_co_queue_wait(&req->wait_queue);
+                qemu_co_queue_wait(&req->wait_queue, NULL);
                  retry = true;
                  break;
              }
diff --git a/block/io.c b/block/io.c

index a5c7d36d8c28a0a3c27c9d649b4d892914fec228..d5c45447fd4d0d195e53cc57348a0ae0dd960fe9 100644 (file)
--- a/block/io.c
+++ b/block/io.c
@@ -539,7 +539,7 @@ static bool coroutine_fn wait_serialising_requests(BdrvTrackedRequest *self)
                   * (instead of producing a deadlock in the former case). */
                  if (!req->waiting_for) {
                      self->waiting_for = req;
-                    qemu_co_queue_wait(&req->wait_queue);
+                    qemu_co_queue_wait(&req->wait_queue, NULL);
                      self->waiting_for = NULL;
                      retry = true;
                      waited = true;
@@ -2275,7 +2275,7 @@ int coroutine_fn bdrv_co_flush(BlockDriverState *bs)
  
      /* Wait until any previous flushes are completed */
      while (bs->active_flush_req) {
-        qemu_co_queue_wait(&bs->flush_queue);
+        qemu_co_queue_wait(&bs->flush_queue, NULL);
      }
  
      bs->active_flush_req = true;
diff --git a/block/nbd-client.c b/block/nbd-client.c

index 10fcc9e81d93f9011fe72aef2de98b3cc80af95f..0dc12c2d671898c7a6fdc50ad55a1f1dd07658dd 100644 (file)
--- a/block/nbd-client.c
+++ b/block/nbd-client.c
@@ -182,7 +182,7 @@ static void nbd_coroutine_start(NBDClientSession *s,
      /* Poor man semaphore.  The free_sema is locked when no other request
       * can be accepted, and unlocked after receiving one reply.  */
      if (s->in_flight == MAX_NBD_REQUESTS) {
-        qemu_co_queue_wait(&s->free_sema);
+        qemu_co_queue_wait(&s->free_sema, NULL);
          assert(s->in_flight < MAX_NBD_REQUESTS);
      }
      s->in_flight++;
diff --git a/block/qcow2-cluster.c b/block/qcow2-cluster.c

index 928c1e298d572fe70fd9be19a10c28491934d004..78c11d494895bcf300889c641c4521c011f562fc 100644 (file)
--- a/block/qcow2-cluster.c
+++ b/block/qcow2-cluster.c
@@ -932,9 +932,7 @@ static int handle_dependencies(BlockDriverState *bs, uint64_t guest_offset,
              if (bytes == 0) {
                  /* Wait for the dependency to complete. We need to recheck
                   * the free/allocated clusters when we continue. */
-                qemu_co_mutex_unlock(&s->lock);
-                qemu_co_queue_wait(&old_alloc->dependent_requests);
-                qemu_co_mutex_lock(&s->lock);
+                qemu_co_queue_wait(&old_alloc->dependent_requests, &s->lock);
                  return -EAGAIN;
              }
          }
diff --git a/block/sheepdog.c b/block/sheepdog.c

index 32c4e4c5073eb0acc4f124572c297be46c0e133b..860ba6150247116e8be58d460942f5927973afae 100644 (file)
--- a/block/sheepdog.c
+++ b/block/sheepdog.c
@@ -486,7 +486,7 @@ static void wait_for_overlapping_aiocb(BDRVSheepdogState *s, SheepdogAIOCB *acb)
  retry:
      QLIST_FOREACH(cb, &s->inflight_aiocb_head, aiocb_siblings) {
          if (AIOCBOverlapping(acb, cb)) {
-            qemu_co_queue_wait(&s->overlapping_queue);
+            qemu_co_queue_wait(&s->overlapping_queue, NULL);
              goto retry;
          }
      }
diff --git a/block/throttle-groups.c b/block/throttle-groups.c

index aade5def399a8a80934be7fe6d759deb551b5e88..b73e7a800b7140cac356e23457375147c2582a50 100644 (file)
--- a/block/throttle-groups.c
+++ b/block/throttle-groups.c
@@ -326,7 +326,7 @@ void coroutine_fn throttle_group_co_io_limits_intercept(BlockBackend *blk,
      if (must_wait || blkp->pending_reqs[is_write]) {
          blkp->pending_reqs[is_write]++;
          qemu_mutex_unlock(&tg->lock);
-        qemu_co_queue_wait(&blkp->throttled_reqs[is_write]);
+        qemu_co_queue_wait(&blkp->throttled_reqs[is_write], NULL);
          qemu_mutex_lock(&tg->lock);
          blkp->pending_reqs[is_write]--;
      }
diff --git a/hw/9pfs/9p.c b/hw/9pfs/9p.c

index 99e94723b9de110403a9e3388157def8585a6987..3af1c93dc87dd2a1d96f29bfdcfb3ecee5812618 100644 (file)
--- a/hw/9pfs/9p.c
+++ b/hw/9pfs/9p.c
@@ -2374,7 +2374,7 @@ static void coroutine_fn v9fs_flush(void *opaque)
          /*
           * Wait for pdu to complete.
           */
-        qemu_co_queue_wait(&cancel_pdu->complete);
+        qemu_co_queue_wait(&cancel_pdu->complete, NULL);
          cancel_pdu->cancelled = 0;
          pdu_free(cancel_pdu);
      }
diff --git a/include/qemu/coroutine.h b/include/qemu/coroutine.h

index 9f685794d2914f21cd0484b0aa88330e72b59003..d2de268981fb9dc1427313c44e96a9300073df5f 100644 (file)
--- a/include/qemu/coroutine.h
+++ b/include/qemu/coroutine.h
@@ -160,7 +160,8 @@ void coroutine_fn qemu_co_mutex_unlock(CoMutex *mutex);
  
  /**
   * CoQueues are a mechanism to queue coroutines in order to continue executing
- * them later.
+ * them later.  They are similar to condition variables, but they need help
+ * from an external mutex in order to maintain thread-safety.
   */
  typedef struct CoQueue {
      QSIMPLEQ_HEAD(, Coroutine) entries;
@@ -174,9 +175,10 @@ void qemu_co_queue_init(CoQueue *queue);
  
  /**
   * Adds the current coroutine to the CoQueue and transfers control to the
- * caller of the coroutine.
+ * caller of the coroutine.  The mutex is unlocked during the wait and
+ * locked again afterwards.
   */
-void coroutine_fn qemu_co_queue_wait(CoQueue *queue);
+void coroutine_fn qemu_co_queue_wait(CoQueue *queue, CoMutex *mutex);
  
  /**
   * Restarts the next coroutine in the CoQueue and removes it from the queue.
diff --git a/util/qemu-coroutine-lock.c b/util/qemu-coroutine-lock.c

index 73fe77cc8044079be53ae7f86c9e9e21150e6625..b0a554f40d4af9a36329a30c937ad393513dead0 100644 (file)
--- a/util/qemu-coroutine-lock.c
+++ b/util/qemu-coroutine-lock.c
@@ -40,12 +40,30 @@ void qemu_co_queue_init(CoQueue *queue)
      QSIMPLEQ_INIT(&queue->entries);
  }
  
-void coroutine_fn qemu_co_queue_wait(CoQueue *queue)
+void coroutine_fn qemu_co_queue_wait(CoQueue *queue, CoMutex *mutex)
  {
      Coroutine *self = qemu_coroutine_self();
      QSIMPLEQ_INSERT_TAIL(&queue->entries, self, co_queue_next);
+
+    if (mutex) {
+        qemu_co_mutex_unlock(mutex);
+    }
+
+    /* There is no race condition here.  Other threads will call
+     * aio_co_schedule on our AioContext, which can reenter this
+     * coroutine but only after this yield and after the main loop
+     * has gone through the next iteration.
+     */
      qemu_coroutine_yield();
      assert(qemu_in_coroutine());
+
+    /* TODO: OSv implements wait morphing here, where the wakeup
+     * primitive automatically places the woken coroutine on the
+     * mutex's queue.  This avoids the thundering herd effect.
+     */
+    if (mutex) {
+        qemu_co_mutex_lock(mutex);
+    }
  }
  
  /**
@@ -335,7 +353,7 @@ void qemu_co_rwlock_rdlock(CoRwlock *lock)
      Coroutine *self = qemu_coroutine_self();
  
      while (lock->writer) {
-        qemu_co_queue_wait(&lock->queue);
+        qemu_co_queue_wait(&lock->queue, NULL);
      }
      lock->reader++;
      self->locks_held++;
@@ -365,7 +383,7 @@ void qemu_co_rwlock_wrlock(CoRwlock *lock)
      Coroutine *self = qemu_coroutine_self();
  
      while (lock->writer || lock->reader) {
-        qemu_co_queue_wait(&lock->queue);
+        qemu_co_queue_wait(&lock->queue, NULL);
      }
      lock->writer = true;
      self->locks_held++;
author	Paolo Bonzini <pbonzini@redhat.com>
	Mon, 13 Feb 2017 18:12:43 +0000 (19:12 +0100)
committer	Stefan Hajnoczi <stefanha@redhat.com>
	Tue, 21 Feb 2017 11:39:40 +0000 (11:39 +0000)
block/backup.c		patch \| blob \| history
block/io.c		patch \| blob \| history
block/nbd-client.c		patch \| blob \| history
block/qcow2-cluster.c		patch \| blob \| history
block/sheepdog.c		patch \| blob \| history
block/throttle-groups.c		patch \| blob \| history
hw/9pfs/9p.c		patch \| blob \| history
include/qemu/coroutine.h		patch \| blob \| history
util/qemu-coroutine-lock.c		patch \| blob \| history