These functions assume that the job lock is held by the caller, to avoid TOC/TOU conditions.
Introduce also additional helpers that define _locked functions (useful when the job_mutex is globally applied). Signed-off-by: Emanuele Giuseppe Esposito <eespo...@redhat.com> --- include/qemu/job-monitor.h | 61 ++++++++++++++++++++++++++++++++++++++ job.c | 22 ++++++++++++-- 2 files changed, 81 insertions(+), 2 deletions(-) diff --git a/include/qemu/job-monitor.h b/include/qemu/job-monitor.h index b5b41a7548..d92bc4f39d 100644 --- a/include/qemu/job-monitor.h +++ b/include/qemu/job-monitor.h @@ -28,6 +28,21 @@ #include "job-common.h" +/* + * Job monitor API. + * + * These functions use are used by the QEMU monitor, for example + * to execute QMP commands. The monitor is aware of the job_mutex + * presence, so these functions assume it is held by the caller + * to protect job fields (see job-common.h). + * This prevents TOC/TOU bugs, allowing the caller to hold the + * lock between a check in the job state and the actual action. + * + * Therefore, each function in this API that needs protection + * must have the comment + * "Called between job_lock and job_unlock." + */ + /** * Allocate and return a new job transaction. Jobs can be added to the * transaction using job_txn_add_job(). @@ -56,18 +71,24 @@ void job_txn_unref(JobTxn *txn); * the reference that is automatically grabbed here. * * If @txn is NULL, the function does nothing. + * + * Called between job_lock and job_unlock. */ void job_txn_add_job(JobTxn *txn, Job *job); /** * Add a reference to Job refcnt, it will be decreased with job_unref, and then * be freed if it comes to be the last reference. + * + * Called between job_lock and job_unlock. */ void job_ref(Job *job); /** * Release a reference that was previously acquired with job_ref() or * job_create(). If it's the last reference to the object, it will be freed. + * + * Called between job_lock and job_unlock. */ void job_unref(Job *job); @@ -75,6 +96,8 @@ void job_unref(Job *job); * Conditionally enter the job coroutine if the job is ready to run, not * already busy and fn() returns true. fn() is called while under the job_lock * critical section. + * + * Called between job_lock and job_unlock, but it releases the lock temporarly. */ void job_enter_cond(Job *job, bool(*fn)(Job *job)); @@ -85,6 +108,7 @@ bool job_is_internal(Job *job); /** * Returns whether the job is in a completed state. + * Called between job_lock and job_unlock. */ bool job_is_completed(Job *job); @@ -92,28 +116,36 @@ bool job_is_completed(Job *job); * Request @job to pause at the next pause point. Must be paired with * job_resume(). If the job is supposed to be resumed by user action, call * job_user_pause() instead. + * + * Called between job_lock and job_unlock. */ void job_pause(Job *job); /** * Resumes a @job paused with job_pause. + * Called between job_lock and job_unlock. */ void job_resume(Job *job); /** * Asynchronously pause the specified @job. * Do not allow a resume until a matching call to job_user_resume. + * + * Called between job_lock and job_unlock. */ void job_user_pause(Job *job, Error **errp); /** * Returns true if the job is user-paused. + * Called between job_lock and job_unlock. */ bool job_user_paused(Job *job); /** * Resume the specified @job. * Must be paired with a preceding job_user_pause. + * + * Called between job_lock and job_unlock. */ void job_user_resume(Job *job, Error **errp); @@ -122,6 +154,8 @@ void job_user_resume(Job *job, Error **errp); * first one if @job is %NULL. * * Returns the requested job, or %NULL if there are no more jobs left. + * + * Called between job_lock and job_unlock. */ Job *job_next(Job *job); @@ -129,6 +163,8 @@ Job *job_next(Job *job); * Get the job identified by @id (which must not be %NULL). * * Returns the requested job, or %NULL if it doesn't exist. + * + * Called between job_lock and job_unlock. */ Job *job_get(const char *id); @@ -136,23 +172,30 @@ Job *job_get(const char *id); * Check whether the verb @verb can be applied to @job in its current state. * Returns 0 if the verb can be applied; otherwise errp is set and -EPERM * returned. + * + * Called between job_lock and job_unlock. */ int job_apply_verb(Job *job, JobVerb verb, Error **errp); /** * Asynchronously complete the specified @job. + * Called between job_lock and job_unlock, but it releases the lock temporarly. */ void job_complete(Job *job, Error **errp); /** * Asynchronously cancel the specified @job. If @force is true, the job should * be cancelled immediately without waiting for a consistent state. + * + * Called between job_lock and job_unlock. */ void job_cancel(Job *job, bool force); /** * Cancels the specified job like job_cancel(), but may refuse to do so if the * operation isn't meaningful in the current state of the job. + * + * Called between job_lock and job_unlock. */ void job_user_cancel(Job *job, bool force, Error **errp); @@ -171,6 +214,10 @@ int job_cancel_sync(Job *job, bool force); /** * Synchronously force-cancels all jobs using job_cancel_sync(). + * + * Called with job_lock *not* held, unlike most other APIs consumed + * by the monitor! This is primarly to avoid adding unnecessary lock-unlock + * patterns in the caller. */ void job_cancel_sync_all(void); @@ -187,6 +234,8 @@ void job_cancel_sync_all(void); * Returns the return value from the job. * * Callers must hold the AioContext lock of job->aio_context. + * + * Called between job_lock and job_unlock. */ int job_complete_sync(Job *job, Error **errp); @@ -197,12 +246,16 @@ int job_complete_sync(Job *job, Error **errp); * FIXME: Make the below statement universally true: * For jobs that support the manual workflow mode, all graph changes that occur * as a result will occur after this command and before a successful reply. + * + * Called between job_lock and job_unlock. */ void job_finalize(Job *job, Error **errp); /** * Remove the concluded @job from the query list and resets the passed pointer * to %NULL. Returns an error if the job is not actually concluded. + * + * Called between job_lock and job_unlock. */ void job_dismiss(Job **job, Error **errp); @@ -214,7 +267,15 @@ void job_dismiss(Job **job, Error **errp); * cancelled before completing, and -errno in other error cases. * * Callers must hold the AioContext lock of job->aio_context. + * + * Called between job_lock and job_unlock, but it releases the lock temporarly. */ int job_finish_sync(Job *job, void (*finish)(Job *, Error **errp), Error **errp); +/** Same as job_is_ready(), but assumes job_lock is held. */ +bool job_is_ready_locked(Job *job); + +/** Same as job_early_fail(), but assumes job_lock is held. */ +void job_early_fail_locked(Job *job); + #endif diff --git a/job.c b/job.c index e003f136f0..b66d59b746 100644 --- a/job.c +++ b/job.c @@ -225,7 +225,8 @@ bool job_cancel_requested(Job *job) return job->cancelled; } -bool job_is_ready(Job *job) +/* Called with job_mutex held. */ +bool job_is_ready_locked(Job *job) { switch (job->status) { case JOB_STATUS_UNDEFINED: @@ -247,6 +248,16 @@ bool job_is_ready(Job *job) return false; } +/* Called with job_mutex lock *not* held */ +bool job_is_ready(Job *job) +{ + bool res; + job_lock(); + res = job_is_ready_locked(job); + job_unlock(); + return res; +} + bool job_is_completed(Job *job) { switch (job->status) { @@ -642,12 +653,19 @@ void job_dismiss(Job **jobptr, Error **errp) *jobptr = NULL; } -void job_early_fail(Job *job) +void job_early_fail_locked(Job *job) { assert(job->status == JOB_STATUS_CREATED); job_do_dismiss(job); } +void job_early_fail(Job *job) +{ + job_lock(); + job_early_fail_locked(job); + job_unlock(); +} + static void job_conclude(Job *job) { job_state_transition(job, JOB_STATUS_CONCLUDED); -- 2.27.0