9de5f2b408
* checkpatch: fix g_malloc check * fix mremap() and RDMA detection * confine igd-passthrough-isa-bridge to Xen-enabled builds * cover PCI in arm-virt machine qtests * add -M boot and -M mem compound properties * bump SLIRP submodule * support CFI with system libslirp (>= 4.7) * clean up CoQueue wakeup functions * fix vhost-vsock regression * fix --disable-vnc compilation * other minor bugfixes -----BEGIN PGP SIGNATURE----- iQFIBAABCAAyFiEE8TM4V0tmI4mGbHaCv/vSX3jHroMFAmJ8/KMUHHBib256aW5p QHJlZGhhdC5jb20ACgkQv/vSX3jHroNTTAf9Et1C8iZn+OlZi99wMEeMy8a4mIE5 CpkBpFphhkBvt3AH7XNsCyL4Gea4QgsI7nOIEVUwvW7gPf85PiBUX8mjrIVg3x1k bmMEwMKSTYPmDieAnYBP9zCqZQXNYP8L8WxVs2jFY2GXZ2ZogODYFbvCY4yEEB72 UR6uIvQRdpiB6BEj8UZ+5i+sDtb0zxqrjzUz8T/PJC9/2JSNgi+sAWWQoQT3PPU7 R7z2nmEa1VeVLPP6mUHvJKhBltVXF+LyIjQHvo+Tp9tSqp9JwXfFBNQ5W/MFes2D skF47N7PdgKRH9Dp4r0j+MqBwoAq86+ao+MKsbQ1Gb91HhoCWt/MrVrVyg== =1E6P -----END PGP SIGNATURE----- Merge tag 'for-upstream' of https://gitlab.com/bonzini/qemu into staging * small cleanups for pc-bios/optionrom Makefiles * checkpatch: fix g_malloc check * fix mremap() and RDMA detection * confine igd-passthrough-isa-bridge to Xen-enabled builds * cover PCI in arm-virt machine qtests * add -M boot and -M mem compound properties * bump SLIRP submodule * support CFI with system libslirp (>= 4.7) * clean up CoQueue wakeup functions * fix vhost-vsock regression * fix --disable-vnc compilation * other minor bugfixes # -----BEGIN PGP SIGNATURE----- # # iQFIBAABCAAyFiEE8TM4V0tmI4mGbHaCv/vSX3jHroMFAmJ8/KMUHHBib256aW5p # QHJlZGhhdC5jb20ACgkQv/vSX3jHroNTTAf9Et1C8iZn+OlZi99wMEeMy8a4mIE5 # CpkBpFphhkBvt3AH7XNsCyL4Gea4QgsI7nOIEVUwvW7gPf85PiBUX8mjrIVg3x1k # bmMEwMKSTYPmDieAnYBP9zCqZQXNYP8L8WxVs2jFY2GXZ2ZogODYFbvCY4yEEB72 # UR6uIvQRdpiB6BEj8UZ+5i+sDtb0zxqrjzUz8T/PJC9/2JSNgi+sAWWQoQT3PPU7 # R7z2nmEa1VeVLPP6mUHvJKhBltVXF+LyIjQHvo+Tp9tSqp9JwXfFBNQ5W/MFes2D # skF47N7PdgKRH9Dp4r0j+MqBwoAq86+ao+MKsbQ1Gb91HhoCWt/MrVrVyg== # =1E6P # -----END PGP SIGNATURE----- # gpg: Signature made Thu 12 
May 2022 05:25:07 AM PDT # gpg: using RSA key F13338574B662389866C7682BFFBD25F78C7AE83 # gpg: issuer "pbonzini@redhat.com" # gpg: Good signature from "Paolo Bonzini <bonzini@gnu.org>" [undefined] # gpg: aka "Paolo Bonzini <pbonzini@redhat.com>" [undefined] # gpg: WARNING: This key is not certified with a trusted signature! # gpg: There is no indication that the signature belongs to the owner. # Primary key fingerprint: 46F5 9FBD 57D6 12E7 BFD4 E2F7 7E15 100C CD36 69B1 # Subkey fingerprint: F133 3857 4B66 2389 866C 7682 BFFB D25F 78C7 AE83 * tag 'for-upstream' of https://gitlab.com/bonzini/qemu: (27 commits) vmxcap: add tertiary execution controls vl: make machine type deprecation a warning meson: link libpng independent of vnc vhost-backend: do not depend on CONFIG_VHOST_VSOCK coroutine-lock: qemu_co_queue_restart_all is a coroutine-only qemu_co_enter_all coroutine-lock: introduce qemu_co_queue_enter_all coroutine-lock: qemu_co_queue_next is a coroutine-only qemu_co_enter_next net: slirp: allow CFI with libslirp >= 4.7 net: slirp: add support for CFI-friendly timer API net: slirp: switch to slirp_new net: slirp: introduce a wrapper struct for QemuTimer slirp: bump submodule past 4.7 release machine: move more memory validation to Machine object machine: make memory-backend a link property machine: add mem compound property machine: add boot compound property machine: use QAPI struct for boot configuration tests/qtest/libqos: Add generic pci host bridge in arm-virt machine tests/qtest/libqos: Skip hotplug tests if pci root bus is not hotpluggable tests/qtest/libqos/pci: Introduce pio_limit ... Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
385 lines
12 KiB
C
385 lines
12 KiB
C
/*
|
|
* QEMU coroutine implementation
|
|
*
|
|
* Copyright IBM, Corp. 2011
|
|
*
|
|
* Authors:
|
|
* Stefan Hajnoczi <stefanha@linux.vnet.ibm.com>
|
|
* Kevin Wolf <kwolf@redhat.com>
|
|
*
|
|
* This work is licensed under the terms of the GNU LGPL, version 2 or later.
|
|
* See the COPYING.LIB file in the top-level directory.
|
|
*
|
|
*/
|
|
|
|
#ifndef QEMU_COROUTINE_H
|
|
#define QEMU_COROUTINE_H
|
|
|
|
#include "qemu/queue.h"
|
|
#include "qemu/timer.h"
|
|
|
|
/**
|
|
* Coroutines are a mechanism for stack switching and can be used for
|
|
* cooperative userspace threading. These functions provide a simple but
|
|
* useful flavor of coroutines that is suitable for writing sequential code,
|
|
* rather than callbacks, for operations that need to give up control while
|
|
* waiting for events to complete.
|
|
*
|
|
* These functions are re-entrant and may be used outside the global mutex.
|
|
*/
|
|
|
|
/**
|
|
* Mark a function that executes in coroutine context
|
|
*
|
|
* Functions that execute in coroutine context cannot be called directly from
|
|
* normal functions. In the future it would be nice to enable compiler or
|
|
* static checker support for catching such errors. This annotation might make
|
|
* it possible and in the meantime it serves as documentation.
|
|
*
|
|
* For example:
|
|
*
|
|
* static void coroutine_fn foo(void) {
|
|
* ....
|
|
* }
|
|
*/
|
|
#define coroutine_fn
|
|
|
|
typedef struct Coroutine Coroutine;
|
|
|
|
/**
|
|
* Coroutine entry point
|
|
*
|
|
* When the coroutine is entered for the first time, opaque is passed in as an
|
|
* argument.
|
|
*
|
|
* When this function returns, the coroutine is destroyed automatically and
|
|
* execution continues in the caller who last entered the coroutine.
|
|
*/
|
|
typedef void coroutine_fn CoroutineEntry(void *opaque);
|
|
|
|
/**
|
|
* Create a new coroutine
|
|
*
|
|
* Use qemu_coroutine_enter() to actually transfer control to the coroutine.
|
|
* The opaque argument is passed as the argument to the entry point.
|
|
*/
|
|
Coroutine *qemu_coroutine_create(CoroutineEntry *entry, void *opaque);
|
|
|
|
/**
|
|
* Transfer control to a coroutine
|
|
*/
|
|
void qemu_coroutine_enter(Coroutine *coroutine);
|
|
|
|
/**
|
|
* Transfer control to a coroutine if it's not active (i.e. part of the call
|
|
* stack of the running coroutine). Otherwise, do nothing.
|
|
*/
|
|
void qemu_coroutine_enter_if_inactive(Coroutine *co);
|
|
|
|
/**
|
|
* Transfer control to a coroutine and associate it with ctx
|
|
*/
|
|
void qemu_aio_coroutine_enter(AioContext *ctx, Coroutine *co);
|
|
|
|
/**
|
|
* Transfer control back to a coroutine's caller
|
|
*
|
|
* This function does not return until the coroutine is re-entered using
|
|
* qemu_coroutine_enter().
|
|
*/
|
|
void coroutine_fn qemu_coroutine_yield(void);
|
|
|
|
/**
|
|
* Get the AioContext of the given coroutine
|
|
*/
|
|
AioContext *coroutine_fn qemu_coroutine_get_aio_context(Coroutine *co);
|
|
|
|
/**
|
|
* Get the currently executing coroutine
|
|
*/
|
|
Coroutine *coroutine_fn qemu_coroutine_self(void);
|
|
|
|
/**
|
|
* Return whether or not currently inside a coroutine
|
|
*
|
|
* This can be used to write functions that work both when in coroutine context
|
|
* and when not in coroutine context. Note that such functions cannot use the
|
|
* coroutine_fn annotation since they work outside coroutine context.
|
|
*/
|
|
bool qemu_in_coroutine(void);
|
|
|
|
/**
|
|
* Return true if the coroutine is currently entered
|
|
*
|
|
* A coroutine is "entered" if it has not yielded from the current
|
|
* qemu_coroutine_enter() call used to run it. This does not mean that the
|
|
* coroutine is currently executing code since it may have transferred control
|
|
* to another coroutine using qemu_coroutine_enter().
|
|
*
|
|
* When several coroutines enter each other there may be no way to know which
|
|
* ones have already been entered. In such situations this function can be
|
|
* used to avoid recursively entering coroutines.
|
|
*/
|
|
bool qemu_coroutine_entered(Coroutine *co);
|
|
|
|
/**
|
|
* Provides a mutex that can be used to synchronise coroutines
|
|
*/
|
|
struct CoWaitRecord;
|
|
struct CoMutex {
|
|
/* Count of pending lockers; 0 for a free mutex, 1 for an
|
|
* uncontended mutex.
|
|
*/
|
|
unsigned locked;
|
|
|
|
/* Context that is holding the lock. Useful to avoid spinning
|
|
* when two coroutines on the same AioContext try to get the lock. :)
|
|
*/
|
|
AioContext *ctx;
|
|
|
|
/* A queue of waiters. Elements are added atomically in front of
|
|
* from_push. to_pop is only populated, and popped from, by whoever
|
|
* is in charge of the next wakeup. This can be an unlocker or,
|
|
* through the handoff protocol, a locker that is about to go to sleep.
|
|
*/
|
|
QSLIST_HEAD(, CoWaitRecord) from_push, to_pop;
|
|
|
|
unsigned handoff, sequence;
|
|
|
|
Coroutine *holder;
|
|
};
|
|
|
|
/**
|
|
* Initialises a CoMutex. This must be called before any other operation is used
|
|
* on the CoMutex.
|
|
*/
|
|
void qemu_co_mutex_init(CoMutex *mutex);
|
|
|
|
/**
|
|
* Locks the mutex. If the lock cannot be taken immediately, control is
|
|
* transferred to the caller of the current coroutine.
|
|
*/
|
|
void coroutine_fn qemu_co_mutex_lock(CoMutex *mutex);
|
|
|
|
/**
|
|
* Unlocks the mutex and schedules the next coroutine that was waiting for this
|
|
* lock to be run.
|
|
*/
|
|
void coroutine_fn qemu_co_mutex_unlock(CoMutex *mutex);
|
|
|
|
/**
|
|
* Assert that the current coroutine holds @mutex.
|
|
*/
|
|
static inline coroutine_fn void qemu_co_mutex_assert_locked(CoMutex *mutex)
|
|
{
|
|
/*
|
|
* mutex->holder doesn't need any synchronisation if the assertion holds
|
|
* true because the mutex protects it. If it doesn't hold true, we still
|
|
* don't mind if another thread takes or releases mutex behind our back,
|
|
* because the condition will be false no matter whether we read NULL or
|
|
* the pointer for any other coroutine.
|
|
*/
|
|
assert(qatomic_read(&mutex->locked) &&
|
|
mutex->holder == qemu_coroutine_self());
|
|
}
|
|
|
|
/**
|
|
* CoQueues are a mechanism to queue coroutines in order to continue executing
|
|
* them later. They are similar to condition variables, but they need help
|
|
* from an external mutex in order to maintain thread-safety.
|
|
*/
|
|
typedef struct CoQueue {
|
|
QSIMPLEQ_HEAD(, Coroutine) entries;
|
|
} CoQueue;
|
|
|
|
/**
|
|
* Initialise a CoQueue. This must be called before any other operation is used
|
|
* on the CoQueue.
|
|
*/
|
|
void qemu_co_queue_init(CoQueue *queue);
|
|
|
|
/**
|
|
* Adds the current coroutine to the CoQueue and transfers control to the
|
|
* caller of the coroutine. The mutex is unlocked during the wait and
|
|
* locked again afterwards.
|
|
*/
|
|
#define qemu_co_queue_wait(queue, lock) \
|
|
qemu_co_queue_wait_impl(queue, QEMU_MAKE_LOCKABLE(lock))
|
|
void coroutine_fn qemu_co_queue_wait_impl(CoQueue *queue, QemuLockable *lock);
|
|
|
|
/**
|
|
* Removes the next coroutine from the CoQueue, and queues it to run after
|
|
* the currently-running coroutine yields.
|
|
* Returns true if a coroutine was removed, false if the queue is empty.
|
|
* Used from coroutine context, use qemu_co_enter_next outside.
|
|
*/
|
|
bool coroutine_fn qemu_co_queue_next(CoQueue *queue);
|
|
|
|
/**
|
|
* Empties the CoQueue and queues all of its coroutines to run after
|
|
* the currently-running coroutine yields.
|
|
* Used from coroutine context, use qemu_co_enter_all outside.
|
|
*/
|
|
void coroutine_fn qemu_co_queue_restart_all(CoQueue *queue);
|
|
|
|
/**
|
|
* Removes the next coroutine from the CoQueue, and wake it up. Unlike
|
|
* qemu_co_queue_next, this function releases the lock during aio_co_wake
|
|
* because it is meant to be used outside coroutine context; in that case, the
|
|
* coroutine is entered immediately, before qemu_co_enter_next returns.
|
|
*
|
|
* If used in coroutine context, qemu_co_enter_next is equivalent to
|
|
* qemu_co_queue_next.
|
|
*/
|
|
#define qemu_co_enter_next(queue, lock) \
|
|
qemu_co_enter_next_impl(queue, QEMU_MAKE_LOCKABLE(lock))
|
|
bool qemu_co_enter_next_impl(CoQueue *queue, QemuLockable *lock);
|
|
|
|
/**
|
|
* Empties the CoQueue, waking the waiting coroutines one at a time. Unlike
|
|
* qemu_co_queue_restart_all, this function releases the lock during aio_co_wake
|
|
* because it is meant to be used outside coroutine context; in that case, the
|
|
* coroutine is entered immediately, before qemu_co_enter_all returns.
|
|
*
|
|
* If used in coroutine context, qemu_co_enter_all is equivalent to
|
|
* qemu_co_queue_restart_all.
|
|
*/
|
|
#define qemu_co_enter_all(queue, lock) \
|
|
qemu_co_enter_all_impl(queue, QEMU_MAKE_LOCKABLE(lock))
|
|
void qemu_co_enter_all_impl(CoQueue *queue, QemuLockable *lock);
|
|
|
|
/**
|
|
* Checks if the CoQueue is empty.
|
|
*/
|
|
bool qemu_co_queue_empty(CoQueue *queue);
|
|
|
|
|
|
typedef struct CoRwTicket CoRwTicket;
|
|
typedef struct CoRwlock {
|
|
CoMutex mutex;
|
|
|
|
/* Number of readers, or -1 if owned for writing. */
|
|
int owners;
|
|
|
|
/* Waiting coroutines. */
|
|
QSIMPLEQ_HEAD(, CoRwTicket) tickets;
|
|
} CoRwlock;
|
|
|
|
/**
|
|
* Initialises a CoRwlock. This must be called before any other operation
|
|
* is used on the CoRwlock
|
|
*/
|
|
void qemu_co_rwlock_init(CoRwlock *lock);
|
|
|
|
/**
|
|
* Read locks the CoRwlock. If the lock cannot be taken immediately because
|
|
* of a parallel writer, control is transferred to the caller of the current
|
|
* coroutine.
|
|
*/
|
|
void qemu_co_rwlock_rdlock(CoRwlock *lock);
|
|
|
|
/**
|
|
* Write Locks the CoRwlock from a reader. This is a bit more efficient than
|
|
* @qemu_co_rwlock_unlock followed by a separate @qemu_co_rwlock_wrlock.
|
|
* Note that if the lock cannot be upgraded immediately, control is transferred
|
|
* to the caller of the current coroutine; another writer might run while
|
|
* @qemu_co_rwlock_upgrade blocks.
|
|
*/
|
|
void qemu_co_rwlock_upgrade(CoRwlock *lock);
|
|
|
|
/**
|
|
* Downgrades a write-side critical section to a reader. Downgrading with
|
|
* @qemu_co_rwlock_downgrade never blocks, unlike @qemu_co_rwlock_unlock
|
|
* followed by @qemu_co_rwlock_rdlock. This makes it more efficient, but
|
|
* may also sometimes be necessary for correctness.
|
|
*/
|
|
void qemu_co_rwlock_downgrade(CoRwlock *lock);
|
|
|
|
/**
|
|
* Write Locks the mutex. If the lock cannot be taken immediately because
|
|
* of a parallel reader, control is transferred to the caller of the current
|
|
* coroutine.
|
|
*/
|
|
void qemu_co_rwlock_wrlock(CoRwlock *lock);
|
|
|
|
/**
|
|
* Unlocks the read/write lock and schedules the next coroutine that was
|
|
* waiting for this lock to be run.
|
|
*/
|
|
void qemu_co_rwlock_unlock(CoRwlock *lock);
|
|
|
|
typedef struct QemuCoSleep {
|
|
Coroutine *to_wake;
|
|
} QemuCoSleep;
|
|
|
|
/**
|
|
* Yield the coroutine for a given duration. Initializes @w so that,
|
|
* during this yield, it can be passed to qemu_co_sleep_wake() to
|
|
* terminate the sleep.
|
|
*/
|
|
void coroutine_fn qemu_co_sleep_ns_wakeable(QemuCoSleep *w,
|
|
QEMUClockType type, int64_t ns);
|
|
|
|
/**
|
|
* Yield the coroutine until the next call to qemu_co_sleep_wake.
|
|
*/
|
|
void coroutine_fn qemu_co_sleep(QemuCoSleep *w);
|
|
|
|
/**
 * Yield the coroutine for the duration @ns, measured on clock @type.
 *
 * This is qemu_co_sleep_ns_wakeable() with a QemuCoSleep that is private
 * to this function, so callers have no handle to pass to
 * qemu_co_sleep_wake().
 */
static inline void coroutine_fn qemu_co_sleep_ns(QEMUClockType type, int64_t ns)
{
    QemuCoSleep private_sleep = { .to_wake = NULL };

    qemu_co_sleep_ns_wakeable(&private_sleep, type, ns);
}
|
|
|
|
/**
|
|
* Wake a coroutine if it is sleeping in qemu_co_sleep_ns_wakeable() or
* qemu_co_sleep(). The timer will be deleted. @w must be the variable
* whose address was given to qemu_co_sleep_ns_wakeable() or qemu_co_sleep()
* and should be checked to be non-NULL before calling qemu_co_sleep_wake().
|
|
*/
|
|
void qemu_co_sleep_wake(QemuCoSleep *w);
|
|
|
|
/**
|
|
* Yield until a file descriptor becomes readable
|
|
*
|
|
* Note that this function clobbers the handlers for the file descriptor.
|
|
*/
|
|
void coroutine_fn yield_until_fd_readable(int fd);
|
|
|
|
/**
|
|
* Increase coroutine pool size
|
|
*/
|
|
void qemu_coroutine_inc_pool_size(unsigned int additional_pool_size);
|
|
|
|
/**
|
|
* Decrease coroutine pool size
|
|
*/
|
|
void qemu_coroutine_dec_pool_size(unsigned int additional_pool_size);
|
|
|
|
#include "qemu/lockable.h"
|
|
|
|
/**
|
|
* Sends a (part of) iovec down a socket, yielding when the socket is full, or
|
|
* Receives data into a (part of) iovec from a socket,
|
|
* yielding when there is no data in the socket.
|
|
* The same interface as qemu_sendv_recvv(), with added yielding.
|
|
* XXX should mark these as coroutine_fn
|
|
*/
|
|
ssize_t qemu_co_sendv_recvv(int sockfd, struct iovec *iov, unsigned iov_cnt,
|
|
size_t offset, size_t bytes, bool do_send);
|
|
#define qemu_co_recvv(sockfd, iov, iov_cnt, offset, bytes) \
|
|
qemu_co_sendv_recvv(sockfd, iov, iov_cnt, offset, bytes, false)
|
|
#define qemu_co_sendv(sockfd, iov, iov_cnt, offset, bytes) \
|
|
qemu_co_sendv_recvv(sockfd, iov, iov_cnt, offset, bytes, true)
|
|
|
|
/**
|
|
* The same as above, but with just a single buffer
|
|
*/
|
|
ssize_t qemu_co_send_recv(int sockfd, void *buf, size_t bytes, bool do_send);
|
|
#define qemu_co_recv(sockfd, buf, bytes) \
|
|
qemu_co_send_recv(sockfd, buf, bytes, false)
|
|
#define qemu_co_send(sockfd, buf, bytes) \
|
|
qemu_co_send_recv(sockfd, buf, bytes, true)
|
|
|
|
#endif /* QEMU_COROUTINE_H */
|