]> git.proxmox.com Git - mirror_qemu.git/blame - blockjob.c
blockjobs: add commit, abort, clean helpers
[mirror_qemu.git] / blockjob.c
CommitLineData
2f0c9fe6
PB
1/*
2 * QEMU System Emulator block driver
3 *
4 * Copyright (c) 2011 IBM Corp.
5 * Copyright (c) 2012 Red Hat, Inc.
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a copy
8 * of this software and associated documentation files (the "Software"), to deal
9 * in the Software without restriction, including without limitation the rights
10 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
11 * copies of the Software, and to permit persons to whom the Software is
12 * furnished to do so, subject to the following conditions:
13 *
14 * The above copyright notice and this permission notice shall be included in
15 * all copies or substantial portions of the Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
23 * THE SOFTWARE.
24 */
25
d38ea87a 26#include "qemu/osdep.h"
2f0c9fe6 27#include "qemu-common.h"
737e150e 28#include "block/block.h"
c87621ea 29#include "block/blockjob_int.h"
737e150e 30#include "block/block_int.h"
c9de4050 31#include "block/trace.h"
373340b2 32#include "sysemu/block-backend.h"
e688df6b 33#include "qapi/error.h"
9af23989 34#include "qapi/qapi-events-block-core.h"
cc7a8ea7 35#include "qapi/qmp/qerror.h"
10817bf0 36#include "qemu/coroutine.h"
7f0317cf 37#include "qemu/id.h"
1de7afc9 38#include "qemu/timer.h"
2f0c9fe6 39
fc24908e
PB
40/* Right now, this mutex is only needed to synchronize accesses to job->busy
41 * and job->sleep_timer, such as concurrent calls to block_job_do_yield and
42 * block_job_enter. */
43static QemuMutex block_job_mutex;
44
c9de4050
JS
45/* BlockJob State Transition Table */
46bool BlockJobSTT[BLOCK_JOB_STATUS__MAX][BLOCK_JOB_STATUS__MAX] = {
3925cd3b
JS
47 /* U, C, R, P, Y, S, X, E, N */
48 /* U: */ [BLOCK_JOB_STATUS_UNDEFINED] = {0, 1, 0, 0, 0, 0, 0, 0, 0},
49 /* C: */ [BLOCK_JOB_STATUS_CREATED] = {0, 0, 1, 0, 0, 0, 1, 0, 1},
50 /* R: */ [BLOCK_JOB_STATUS_RUNNING] = {0, 0, 0, 1, 1, 0, 1, 1, 0},
51 /* P: */ [BLOCK_JOB_STATUS_PAUSED] = {0, 0, 1, 0, 0, 0, 0, 0, 0},
52 /* Y: */ [BLOCK_JOB_STATUS_READY] = {0, 0, 0, 0, 0, 1, 1, 1, 0},
53 /* S: */ [BLOCK_JOB_STATUS_STANDBY] = {0, 0, 0, 0, 1, 0, 0, 0, 0},
35d6b368 54 /* X: */ [BLOCK_JOB_STATUS_ABORTING] = {0, 0, 0, 0, 0, 0, 1, 1, 0},
3925cd3b
JS
55 /* E: */ [BLOCK_JOB_STATUS_CONCLUDED] = {0, 0, 0, 0, 0, 0, 0, 0, 1},
56 /* N: */ [BLOCK_JOB_STATUS_NULL] = {0, 0, 0, 0, 0, 0, 0, 0, 0},
c9de4050
JS
57};
58
0ec4dfb8 59bool BlockJobVerbTable[BLOCK_JOB_VERB__MAX][BLOCK_JOB_STATUS__MAX] = {
3925cd3b
JS
60 /* U, C, R, P, Y, S, X, E, N */
61 [BLOCK_JOB_VERB_CANCEL] = {0, 1, 1, 1, 1, 1, 0, 0, 0},
62 [BLOCK_JOB_VERB_PAUSE] = {0, 1, 1, 1, 1, 1, 0, 0, 0},
63 [BLOCK_JOB_VERB_RESUME] = {0, 1, 1, 1, 1, 1, 0, 0, 0},
64 [BLOCK_JOB_VERB_SET_SPEED] = {0, 1, 1, 1, 1, 1, 0, 0, 0},
65 [BLOCK_JOB_VERB_COMPLETE] = {0, 0, 0, 0, 1, 0, 0, 0, 0},
75f71059 66 [BLOCK_JOB_VERB_DISMISS] = {0, 0, 0, 0, 0, 0, 0, 1, 0},
0ec4dfb8
JS
67};
68
c9de4050
JS
69static void block_job_state_transition(BlockJob *job, BlockJobStatus s1)
70{
71 BlockJobStatus s0 = job->status;
72 assert(s1 >= 0 && s1 <= BLOCK_JOB_STATUS__MAX);
73 trace_block_job_state_transition(job, job->ret, BlockJobSTT[s0][s1] ?
74 "allowed" : "disallowed",
75 qapi_enum_lookup(&BlockJobStatus_lookup,
76 s0),
77 qapi_enum_lookup(&BlockJobStatus_lookup,
78 s1));
79 assert(BlockJobSTT[s0][s1]);
80 job->status = s1;
81}
82
0ec4dfb8
JS
83static int block_job_apply_verb(BlockJob *job, BlockJobVerb bv, Error **errp)
84{
85 assert(bv >= 0 && bv <= BLOCK_JOB_VERB__MAX);
86 trace_block_job_apply_verb(job, qapi_enum_lookup(&BlockJobStatus_lookup,
87 job->status),
88 qapi_enum_lookup(&BlockJobVerb_lookup, bv),
89 BlockJobVerbTable[bv][job->status] ?
90 "allowed" : "prohibited");
91 if (BlockJobVerbTable[bv][job->status]) {
92 return 0;
93 }
94 error_setg(errp, "Job '%s' in state '%s' cannot accept command verb '%s'",
95 job->id, qapi_enum_lookup(&BlockJobStatus_lookup, job->status),
96 qapi_enum_lookup(&BlockJobVerb_lookup, bv));
97 return -EPERM;
98}
99
fc24908e
PB
100static void block_job_lock(void)
101{
102 qemu_mutex_lock(&block_job_mutex);
103}
104
105static void block_job_unlock(void)
106{
107 qemu_mutex_unlock(&block_job_mutex);
108}
109
110static void __attribute__((__constructor__)) block_job_init(void)
111{
112 qemu_mutex_init(&block_job_mutex);
113}
114
8254b6d9
JS
115static void block_job_event_cancelled(BlockJob *job);
116static void block_job_event_completed(BlockJob *job, const char *msg);
aa9ef2e6 117static void block_job_enter_cond(BlockJob *job, bool(*fn)(BlockJob *job));
8254b6d9 118
c55a832f
FZ
119/* Transactional group of block jobs */
120struct BlockJobTxn {
121
122 /* Is this txn being cancelled? */
123 bool aborting;
124
125 /* List of jobs */
126 QLIST_HEAD(, BlockJob) jobs;
127
128 /* Reference count */
129 int refcnt;
130};
131
a7112795
AG
132static QLIST_HEAD(, BlockJob) block_jobs = QLIST_HEAD_INITIALIZER(block_jobs);
133
88691b37
PB
134/*
135 * The block job API is composed of two categories of functions.
136 *
137 * The first includes functions used by the monitor. The monitor is
138 * peculiar in that it accesses the block job list with block_job_get, and
139 * therefore needs consistency across block_job_get and the actual operation
140 * (e.g. block_job_set_speed). The consistency is achieved with
141 * aio_context_acquire/release. These functions are declared in blockjob.h.
142 *
143 * The second includes functions used by the block job drivers and sometimes
144 * by the core block layer. These do not care about locking, because the
145 * whole coroutine runs under the AioContext lock, and are declared in
146 * blockjob_int.h.
147 */
148
a7112795
AG
149BlockJob *block_job_next(BlockJob *job)
150{
151 if (!job) {
152 return QLIST_FIRST(&block_jobs);
153 }
154 return QLIST_NEXT(job, job_list);
155}
156
ffb1f10c
AG
157BlockJob *block_job_get(const char *id)
158{
159 BlockJob *job;
160
161 QLIST_FOREACH(job, &block_jobs, job_list) {
559b935f 162 if (job->id && !strcmp(id, job->id)) {
ffb1f10c
AG
163 return job;
164 }
165 }
166
167 return NULL;
168}
169
c8ab5c2d
PB
170BlockJobTxn *block_job_txn_new(void)
171{
172 BlockJobTxn *txn = g_new0(BlockJobTxn, 1);
173 QLIST_INIT(&txn->jobs);
174 txn->refcnt = 1;
175 return txn;
176}
177
178static void block_job_txn_ref(BlockJobTxn *txn)
179{
180 txn->refcnt++;
181}
182
183void block_job_txn_unref(BlockJobTxn *txn)
184{
185 if (txn && --txn->refcnt == 0) {
186 g_free(txn);
187 }
188}
189
190void block_job_txn_add_job(BlockJobTxn *txn, BlockJob *job)
191{
192 if (!txn) {
193 return;
194 }
195
196 assert(!job->txn);
197 job->txn = txn;
198
199 QLIST_INSERT_HEAD(&txn->jobs, job, txn_list);
200 block_job_txn_ref(txn);
201}
202
f321dcb5
PB
203static void block_job_pause(BlockJob *job)
204{
205 job->pause_count++;
206}
207
208static void block_job_resume(BlockJob *job)
209{
210 assert(job->pause_count > 0);
211 job->pause_count--;
212 if (job->pause_count) {
213 return;
214 }
215 block_job_enter(job);
216}
217
4172a003 218void block_job_ref(BlockJob *job)
05b0d8e3
PB
219{
220 ++job->refcnt;
221}
222
223static void block_job_attached_aio_context(AioContext *new_context,
224 void *opaque);
225static void block_job_detach_aio_context(void *opaque);
226
4172a003 227void block_job_unref(BlockJob *job)
05b0d8e3
PB
228{
229 if (--job->refcnt == 0) {
3925cd3b 230 assert(job->status == BLOCK_JOB_STATUS_NULL);
05b0d8e3 231 BlockDriverState *bs = blk_bs(job->blk);
0a3e155f 232 QLIST_REMOVE(job, job_list);
05b0d8e3
PB
233 bs->job = NULL;
234 block_job_remove_all_bdrv(job);
235 blk_remove_aio_context_notifier(job->blk,
236 block_job_attached_aio_context,
237 block_job_detach_aio_context, job);
238 blk_unref(job->blk);
239 error_free(job->blocker);
240 g_free(job->id);
fc24908e 241 assert(!timer_pending(&job->sleep_timer));
05b0d8e3
PB
242 g_free(job);
243 }
244}
245
463e0be1
SH
246static void block_job_attached_aio_context(AioContext *new_context,
247 void *opaque)
248{
249 BlockJob *job = opaque;
250
251 if (job->driver->attached_aio_context) {
252 job->driver->attached_aio_context(job, new_context);
253 }
254
255 block_job_resume(job);
256}
257
bae8196d
PB
258static void block_job_drain(BlockJob *job)
259{
260 /* If job is !job->busy this kicks it into the next pause point. */
261 block_job_enter(job);
262
263 blk_drain(job->blk);
264 if (job->driver->drain) {
265 job->driver->drain(job);
266 }
267}
268
463e0be1
SH
269static void block_job_detach_aio_context(void *opaque)
270{
271 BlockJob *job = opaque;
272
273 /* In case the job terminates during aio_poll()... */
274 block_job_ref(job);
275
276 block_job_pause(job);
277
463e0be1 278 while (!job->paused && !job->completed) {
bae8196d 279 block_job_drain(job);
463e0be1
SH
280 }
281
282 block_job_unref(job);
283}
284
f321dcb5
PB
285static char *child_job_get_parent_desc(BdrvChild *c)
286{
287 BlockJob *job = c->opaque;
288 return g_strdup_printf("%s job '%s'",
977c736f 289 BlockJobType_str(job->driver->job_type),
f321dcb5
PB
290 job->id);
291}
292
ad90feba 293static void child_job_drained_begin(BdrvChild *c)
f321dcb5 294{
ad90feba 295 BlockJob *job = c->opaque;
f321dcb5
PB
296 block_job_pause(job);
297}
298
ad90feba 299static void child_job_drained_end(BdrvChild *c)
f321dcb5 300{
ad90feba 301 BlockJob *job = c->opaque;
f321dcb5
PB
302 block_job_resume(job);
303}
304
ad90feba
KW
305static const BdrvChildRole child_job = {
306 .get_parent_desc = child_job_get_parent_desc,
307 .drained_begin = child_job_drained_begin,
308 .drained_end = child_job_drained_end,
309 .stay_at_node = true,
f321dcb5
PB
310};
311
bbc02b90
KW
312void block_job_remove_all_bdrv(BlockJob *job)
313{
314 GSList *l;
315 for (l = job->nodes; l; l = l->next) {
316 BdrvChild *c = l->data;
317 bdrv_op_unblock_all(c->bs, job->blocker);
318 bdrv_root_unref_child(c);
319 }
320 g_slist_free(job->nodes);
321 job->nodes = NULL;
322}
323
76d554e2
KW
324int block_job_add_bdrv(BlockJob *job, const char *name, BlockDriverState *bs,
325 uint64_t perm, uint64_t shared_perm, Error **errp)
23d402d4 326{
76d554e2
KW
327 BdrvChild *c;
328
329 c = bdrv_root_attach_child(bs, name, &child_job, perm, shared_perm,
330 job, errp);
331 if (c == NULL) {
332 return -EPERM;
333 }
334
335 job->nodes = g_slist_prepend(job->nodes, c);
23d402d4
AG
336 bdrv_ref(bs);
337 bdrv_op_block_all(bs, job->blocker);
76d554e2
KW
338
339 return 0;
23d402d4
AG
340}
341
559b935f
JS
342bool block_job_is_internal(BlockJob *job)
343{
344 return (job->id == NULL);
345}
346
5ccac6f1
JS
347static bool block_job_started(BlockJob *job)
348{
349 return job->co;
350}
351
e3796a24
JS
352/**
353 * All jobs must allow a pause point before entering their job proper. This
354 * ensures that jobs can be paused prior to being started, then resumed later.
355 */
356static void coroutine_fn block_job_co_entry(void *opaque)
357{
358 BlockJob *job = opaque;
359
360 assert(job && job->driver && job->driver->start);
361 block_job_pause_point(job);
362 job->driver->start(job);
363}
364
fc24908e
PB
365static void block_job_sleep_timer_cb(void *opaque)
366{
367 BlockJob *job = opaque;
368
369 block_job_enter(job);
370}
371
5ccac6f1
JS
372void block_job_start(BlockJob *job)
373{
374 assert(job && !block_job_started(job) && job->paused &&
e3796a24
JS
375 job->driver && job->driver->start);
376 job->co = qemu_coroutine_create(block_job_co_entry, job);
377 job->pause_count--;
378 job->busy = true;
379 job->paused = false;
c9de4050 380 block_job_state_transition(job, BLOCK_JOB_STATUS_RUNNING);
aef4278c 381 bdrv_coroutine_enter(blk_bs(job->blk), job->co);
5ccac6f1
JS
382}
383
3925cd3b
JS
384static void block_job_decommission(BlockJob *job)
385{
386 assert(job);
387 job->completed = true;
388 job->busy = false;
389 job->paused = false;
390 job->deferred_to_main_loop = true;
391 block_job_state_transition(job, BLOCK_JOB_STATUS_NULL);
392 block_job_unref(job);
393}
394
75f71059
JS
395static void block_job_do_dismiss(BlockJob *job)
396{
397 block_job_decommission(job);
398}
399
e0cf0364
JS
400static void block_job_conclude(BlockJob *job)
401{
402 block_job_state_transition(job, BLOCK_JOB_STATUS_CONCLUDED);
75f71059
JS
403 if (job->auto_dismiss || !block_job_started(job)) {
404 block_job_do_dismiss(job);
405 }
e0cf0364
JS
406}
407
35d6b368
JS
408static void block_job_update_rc(BlockJob *job)
409{
410 if (!job->ret && block_job_is_cancelled(job)) {
411 job->ret = -ECANCELED;
412 }
413 if (job->ret) {
414 block_job_state_transition(job, BLOCK_JOB_STATUS_ABORTING);
415 }
416}
417
43628d93
JS
418static void block_job_commit(BlockJob *job)
419{
420 assert(!job->ret);
421 if (job->driver->commit) {
422 job->driver->commit(job);
423 }
424}
425
426static void block_job_abort(BlockJob *job)
427{
428 assert(job->ret);
429 if (job->driver->abort) {
430 job->driver->abort(job);
431 }
432}
433
434static void block_job_clean(BlockJob *job)
435{
436 if (job->driver->clean) {
437 job->driver->clean(job);
438 }
439}
440
c55a832f
FZ
441static void block_job_completed_single(BlockJob *job)
442{
4fb588e9
PB
443 assert(job->completed);
444
35d6b368
JS
445 /* Ensure abort is called for late-transactional failures */
446 block_job_update_rc(job);
10a3fbb0 447
c55a832f 448 if (!job->ret) {
43628d93 449 block_job_commit(job);
c55a832f 450 } else {
43628d93 451 block_job_abort(job);
e8a40bf7 452 }
43628d93 453 block_job_clean(job);
8254b6d9
JS
454
455 if (job->cb) {
456 job->cb(job->opaque, job->ret);
457 }
5ccac6f1
JS
458
459 /* Emit events only if we actually started */
460 if (block_job_started(job)) {
461 if (block_job_is_cancelled(job)) {
462 block_job_event_cancelled(job);
463 } else {
464 const char *msg = NULL;
465 if (job->ret < 0) {
466 msg = strerror(-job->ret);
467 }
468 block_job_event_completed(job, msg);
8254b6d9 469 }
8254b6d9
JS
470 }
471
75859b94
JS
472 QLIST_REMOVE(job, txn_list);
473 block_job_txn_unref(job->txn);
e0cf0364 474 block_job_conclude(job);
c55a832f
FZ
475}
476
4c241cf5
PB
477static void block_job_cancel_async(BlockJob *job)
478{
479 if (job->iostatus != BLOCK_DEVICE_IO_STATUS_OK) {
480 block_job_iostatus_reset(job);
481 }
482 if (job->user_paused) {
483 /* Do not call block_job_enter here, the caller will handle it. */
484 job->user_paused = false;
485 job->pause_count--;
486 }
487 job->cancelled = true;
488}
489
c8ab5c2d
PB
490static int block_job_finish_sync(BlockJob *job,
491 void (*finish)(BlockJob *, Error **errp),
492 Error **errp)
493{
494 Error *local_err = NULL;
495 int ret;
496
497 assert(blk_bs(job->blk)->job == job);
498
499 block_job_ref(job);
500
4fb588e9
PB
501 if (finish) {
502 finish(job, &local_err);
503 }
c8ab5c2d
PB
504 if (local_err) {
505 error_propagate(errp, local_err);
506 block_job_unref(job);
507 return -EBUSY;
508 }
509 /* block_job_drain calls block_job_enter, and it should be enough to
510 * induce progress until the job completes or moves to the main thread.
511 */
512 while (!job->deferred_to_main_loop && !job->completed) {
513 block_job_drain(job);
514 }
515 while (!job->completed) {
516 aio_poll(qemu_get_aio_context(), true);
517 }
518 ret = (job->cancelled && job->ret == 0) ? -ECANCELED : job->ret;
519 block_job_unref(job);
520 return ret;
521}
522
c55a832f
FZ
523static void block_job_completed_txn_abort(BlockJob *job)
524{
525 AioContext *ctx;
526 BlockJobTxn *txn = job->txn;
4fb588e9 527 BlockJob *other_job;
c55a832f
FZ
528
529 if (txn->aborting) {
530 /*
531 * We are cancelled by another job, which will handle everything.
532 */
533 return;
534 }
535 txn->aborting = true;
4fb588e9
PB
536 block_job_txn_ref(txn);
537
c55a832f
FZ
538 /* We are the first failed job. Cancel other jobs. */
539 QLIST_FOREACH(other_job, &txn->jobs, txn_list) {
b6d2e599 540 ctx = blk_get_aio_context(other_job->blk);
c55a832f
FZ
541 aio_context_acquire(ctx);
542 }
4fb588e9
PB
543
544 /* Other jobs are effectively cancelled by us, set the status for
545 * them; this job, however, may or may not be cancelled, depending
546 * on the caller, so leave it. */
c55a832f 547 QLIST_FOREACH(other_job, &txn->jobs, txn_list) {
4fb588e9
PB
548 if (other_job != job) {
549 block_job_cancel_async(other_job);
c55a832f 550 }
c55a832f 551 }
4fb588e9
PB
552 while (!QLIST_EMPTY(&txn->jobs)) {
553 other_job = QLIST_FIRST(&txn->jobs);
b6d2e599 554 ctx = blk_get_aio_context(other_job->blk);
4fb588e9
PB
555 if (!other_job->completed) {
556 assert(other_job->cancelled);
557 block_job_finish_sync(other_job, NULL, NULL);
558 }
c55a832f
FZ
559 block_job_completed_single(other_job);
560 aio_context_release(ctx);
561 }
4fb588e9
PB
562
563 block_job_txn_unref(txn);
c55a832f
FZ
564}
565
566static void block_job_completed_txn_success(BlockJob *job)
567{
568 AioContext *ctx;
569 BlockJobTxn *txn = job->txn;
570 BlockJob *other_job, *next;
571 /*
572 * Successful completion, see if there are other running jobs in this
573 * txn.
574 */
575 QLIST_FOREACH(other_job, &txn->jobs, txn_list) {
576 if (!other_job->completed) {
577 return;
578 }
579 }
580 /* We are the last completed job, commit the transaction. */
581 QLIST_FOREACH_SAFE(other_job, &txn->jobs, txn_list, next) {
b6d2e599 582 ctx = blk_get_aio_context(other_job->blk);
c55a832f
FZ
583 aio_context_acquire(ctx);
584 assert(other_job->ret == 0);
585 block_job_completed_single(other_job);
586 aio_context_release(ctx);
587 }
588}
589
aa9ef2e6
JS
590/* Assumes the block_job_mutex is held */
591static bool block_job_timer_pending(BlockJob *job)
592{
593 return timer_pending(&job->sleep_timer);
594}
595
2f0c9fe6
PB
596void block_job_set_speed(BlockJob *job, int64_t speed, Error **errp)
597{
598 Error *local_err = NULL;
aa9ef2e6 599 int64_t old_speed = job->speed;
2f0c9fe6 600
3fc4b10a 601 if (!job->driver->set_speed) {
c6bd8c70 602 error_setg(errp, QERR_UNSUPPORTED);
2f0c9fe6
PB
603 return;
604 }
0ec4dfb8
JS
605 if (block_job_apply_verb(job, BLOCK_JOB_VERB_SET_SPEED, errp)) {
606 return;
607 }
3fc4b10a 608 job->driver->set_speed(job, speed, &local_err);
84d18f06 609 if (local_err) {
2f0c9fe6
PB
610 error_propagate(errp, local_err);
611 return;
612 }
613
614 job->speed = speed;
d4fce188 615 if (speed && speed <= old_speed) {
aa9ef2e6
JS
616 return;
617 }
618
619 /* kick only if a timer is pending */
620 block_job_enter_cond(job, block_job_timer_pending);
2f0c9fe6
PB
621}
622
aeae883b
PB
623void block_job_complete(BlockJob *job, Error **errp)
624{
559b935f
JS
625 /* Should not be reachable via external interface for internal jobs */
626 assert(job->id);
0ec4dfb8
JS
627 if (block_job_apply_verb(job, BLOCK_JOB_VERB_COMPLETE, errp)) {
628 return;
629 }
630 if (job->pause_count || job->cancelled || !job->driver->complete) {
9df229c3
AG
631 error_setg(errp, "The active block job '%s' cannot be completed",
632 job->id);
aeae883b
PB
633 return;
634 }
635
3fc4b10a 636 job->driver->complete(job, errp);
aeae883b
PB
637}
638
75f71059
JS
639void block_job_dismiss(BlockJob **jobptr, Error **errp)
640{
641 BlockJob *job = *jobptr;
642 /* similarly to _complete, this is QMP-interface only. */
643 assert(job->id);
644 if (block_job_apply_verb(job, BLOCK_JOB_VERB_DISMISS, errp)) {
645 return;
646 }
647
648 block_job_do_dismiss(job);
649 *jobptr = NULL;
650}
651
0ec4dfb8 652void block_job_user_pause(BlockJob *job, Error **errp)
0df4ba58 653{
0ec4dfb8
JS
654 if (block_job_apply_verb(job, BLOCK_JOB_VERB_PAUSE, errp)) {
655 return;
656 }
657 if (job->user_paused) {
658 error_setg(errp, "Job is already paused");
659 return;
660 }
0df4ba58
JS
661 job->user_paused = true;
662 block_job_pause(job);
663}
664
0df4ba58
JS
665bool block_job_user_paused(BlockJob *job)
666{
6573d9c6 667 return job->user_paused;
0df4ba58
JS
668}
669
0ec4dfb8 670void block_job_user_resume(BlockJob *job, Error **errp)
0df4ba58 671{
0ec4dfb8
JS
672 assert(job);
673 if (!job->user_paused || job->pause_count <= 0) {
674 error_setg(errp, "Can't resume a job that was not paused");
675 return;
0df4ba58 676 }
0ec4dfb8
JS
677 if (block_job_apply_verb(job, BLOCK_JOB_VERB_RESUME, errp)) {
678 return;
679 }
680 block_job_iostatus_reset(job);
681 job->user_paused = false;
682 block_job_resume(job);
0df4ba58
JS
683}
684
8acc72a4
PB
685void block_job_cancel(BlockJob *job)
686{
e0cf0364 687 if (job->status == BLOCK_JOB_STATUS_CONCLUDED) {
75f71059 688 block_job_do_dismiss(job);
e0cf0364 689 } else if (block_job_started(job)) {
4c241cf5 690 block_job_cancel_async(job);
5ccac6f1
JS
691 block_job_enter(job);
692 } else {
693 block_job_completed(job, -ECANCELED);
694 }
8acc72a4
PB
695}
696
0ec4dfb8
JS
697void block_job_user_cancel(BlockJob *job, Error **errp)
698{
699 if (block_job_apply_verb(job, BLOCK_JOB_VERB_CANCEL, errp)) {
700 return;
701 }
702 block_job_cancel(job);
703}
704
345f9e1b
HR
705/* A wrapper around block_job_cancel() taking an Error ** parameter so it may be
706 * used with block_job_finish_sync() without the need for (rather nasty)
707 * function pointer casts there. */
708static void block_job_cancel_err(BlockJob *job, Error **errp)
709{
710 block_job_cancel(job);
711}
712
713int block_job_cancel_sync(BlockJob *job)
714{
715 return block_job_finish_sync(job, &block_job_cancel_err, NULL);
716}
717
a1a2af07
KW
718void block_job_cancel_sync_all(void)
719{
720 BlockJob *job;
721 AioContext *aio_context;
722
723 while ((job = QLIST_FIRST(&block_jobs))) {
b6d2e599 724 aio_context = blk_get_aio_context(job->blk);
a1a2af07
KW
725 aio_context_acquire(aio_context);
726 block_job_cancel_sync(job);
727 aio_context_release(aio_context);
728 }
729}
730
345f9e1b
HR
731int block_job_complete_sync(BlockJob *job, Error **errp)
732{
733 return block_job_finish_sync(job, &block_job_complete, errp);
734}
735
559b935f 736BlockJobInfo *block_job_query(BlockJob *job, Error **errp)
30e628b7 737{
559b935f
JS
738 BlockJobInfo *info;
739
740 if (block_job_is_internal(job)) {
741 error_setg(errp, "Cannot query QEMU internal jobs");
742 return NULL;
743 }
744 info = g_new0(BlockJobInfo, 1);
977c736f 745 info->type = g_strdup(BlockJobType_str(job->driver->job_type));
8ccb9569 746 info->device = g_strdup(job->id);
32c81a4a 747 info->len = job->len;
fc24908e 748 info->busy = atomic_read(&job->busy);
751ebd76 749 info->paused = job->pause_count > 0;
32c81a4a
PB
750 info->offset = job->offset;
751 info->speed = job->speed;
752 info->io_status = job->iostatus;
ef6dbf1e 753 info->ready = job->ready;
58b295ba 754 info->status = job->status;
30e628b7
PB
755 return info;
756}
32c81a4a
PB
757
758static void block_job_iostatus_set_err(BlockJob *job, int error)
759{
760 if (job->iostatus == BLOCK_DEVICE_IO_STATUS_OK) {
761 job->iostatus = error == ENOSPC ? BLOCK_DEVICE_IO_STATUS_NOSPACE :
762 BLOCK_DEVICE_IO_STATUS_FAILED;
763 }
764}
765
8254b6d9 766static void block_job_event_cancelled(BlockJob *job)
bcada37b 767{
559b935f
JS
768 if (block_job_is_internal(job)) {
769 return;
770 }
771
bcada37b 772 qapi_event_send_block_job_cancelled(job->driver->job_type,
8ccb9569 773 job->id,
bcada37b
WX
774 job->len,
775 job->offset,
776 job->speed,
777 &error_abort);
778}
32c81a4a 779
8254b6d9 780static void block_job_event_completed(BlockJob *job, const char *msg)
a66a2a36 781{
559b935f
JS
782 if (block_job_is_internal(job)) {
783 return;
784 }
785
bcada37b 786 qapi_event_send_block_job_completed(job->driver->job_type,
8ccb9569 787 job->id,
bcada37b
WX
788 job->len,
789 job->offset,
790 job->speed,
791 !!msg,
792 msg,
793 &error_abort);
a66a2a36
PB
794}
795
88691b37
PB
796/*
797 * API for block job drivers and the block layer. These functions are
798 * declared in blockjob_int.h.
799 */
800
801void *block_job_create(const char *job_id, const BlockJobDriver *driver,
75859b94 802 BlockJobTxn *txn, BlockDriverState *bs, uint64_t perm,
88691b37
PB
803 uint64_t shared_perm, int64_t speed, int flags,
804 BlockCompletionFunc *cb, void *opaque, Error **errp)
805{
806 BlockBackend *blk;
807 BlockJob *job;
808 int ret;
809
810 if (bs->job) {
811 error_setg(errp, QERR_DEVICE_IN_USE, bdrv_get_device_name(bs));
812 return NULL;
813 }
814
815 if (job_id == NULL && !(flags & BLOCK_JOB_INTERNAL)) {
816 job_id = bdrv_get_device_name(bs);
817 if (!*job_id) {
818 error_setg(errp, "An explicit job ID is required for this node");
819 return NULL;
820 }
821 }
822
823 if (job_id) {
824 if (flags & BLOCK_JOB_INTERNAL) {
825 error_setg(errp, "Cannot specify job ID for internal block job");
826 return NULL;
827 }
828
829 if (!id_wellformed(job_id)) {
830 error_setg(errp, "Invalid job ID '%s'", job_id);
831 return NULL;
832 }
833
834 if (block_job_get(job_id)) {
835 error_setg(errp, "Job ID '%s' already in use", job_id);
836 return NULL;
837 }
838 }
839
840 blk = blk_new(perm, shared_perm);
841 ret = blk_insert_bs(blk, bs, errp);
842 if (ret < 0) {
843 blk_unref(blk);
844 return NULL;
845 }
846
847 job = g_malloc0(driver->instance_size);
848 job->driver = driver;
849 job->id = g_strdup(job_id);
850 job->blk = blk;
851 job->cb = cb;
852 job->opaque = opaque;
853 job->busy = false;
854 job->paused = true;
855 job->pause_count = 1;
856 job->refcnt = 1;
75f71059 857 job->auto_dismiss = !(flags & BLOCK_JOB_MANUAL_DISMISS);
c9de4050 858 block_job_state_transition(job, BLOCK_JOB_STATUS_CREATED);
fc24908e
PB
859 aio_timer_init(qemu_get_aio_context(), &job->sleep_timer,
860 QEMU_CLOCK_REALTIME, SCALE_NS,
861 block_job_sleep_timer_cb, job);
88691b37
PB
862
863 error_setg(&job->blocker, "block device is in use by block job: %s",
977c736f 864 BlockJobType_str(driver->job_type));
88691b37
PB
865 block_job_add_bdrv(job, "main node", bs, 0, BLK_PERM_ALL, &error_abort);
866 bs->job = job;
867
88691b37
PB
868 bdrv_op_unblock(bs, BLOCK_OP_TYPE_DATAPLANE, job->blocker);
869
870 QLIST_INSERT_HEAD(&block_jobs, job, job_list);
871
872 blk_add_aio_context_notifier(blk, block_job_attached_aio_context,
873 block_job_detach_aio_context, job);
874
875 /* Only set speed when necessary to avoid NotSupported error */
876 if (speed != 0) {
877 Error *local_err = NULL;
878
879 block_job_set_speed(job, speed, &local_err);
880 if (local_err) {
3925cd3b 881 block_job_early_fail(job);
88691b37
PB
882 error_propagate(errp, local_err);
883 return NULL;
884 }
885 }
75859b94
JS
886
887 /* Single jobs are modeled as single-job transactions for sake of
888 * consolidating the job management logic */
889 if (!txn) {
890 txn = block_job_txn_new();
891 block_job_txn_add_job(txn, job);
892 block_job_txn_unref(txn);
893 } else {
894 block_job_txn_add_job(txn, job);
895 }
896
88691b37
PB
897 return job;
898}
899
f321dcb5
PB
900void block_job_pause_all(void)
901{
902 BlockJob *job = NULL;
903 while ((job = block_job_next(job))) {
904 AioContext *aio_context = blk_get_aio_context(job->blk);
905
906 aio_context_acquire(aio_context);
3d5d319e 907 block_job_ref(job);
f321dcb5
PB
908 block_job_pause(job);
909 aio_context_release(aio_context);
910 }
911}
912
88691b37
PB
913void block_job_early_fail(BlockJob *job)
914{
3925cd3b
JS
915 assert(job->status == BLOCK_JOB_STATUS_CREATED);
916 block_job_decommission(job);
88691b37
PB
917}
918
919void block_job_completed(BlockJob *job, int ret)
920{
75859b94 921 assert(job && job->txn && !job->completed);
88691b37 922 assert(blk_bs(job->blk)->job == job);
88691b37
PB
923 job->completed = true;
924 job->ret = ret;
35d6b368
JS
925 block_job_update_rc(job);
926 trace_block_job_completed(job, ret, job->ret);
927 if (job->ret) {
88691b37
PB
928 block_job_completed_txn_abort(job);
929 } else {
930 block_job_completed_txn_success(job);
931 }
932}
933
934static bool block_job_should_pause(BlockJob *job)
935{
936 return job->pause_count > 0;
937}
938
fc24908e
PB
939/* Yield, and schedule a timer to reenter the coroutine after @ns nanoseconds.
940 * Reentering the job coroutine with block_job_enter() before the timer has
941 * expired is allowed and cancels the timer.
942 *
943 * If @ns is (uint64_t) -1, no timer is scheduled and block_job_enter() must be
944 * called explicitly. */
945static void block_job_do_yield(BlockJob *job, uint64_t ns)
356f59b8 946{
fc24908e
PB
947 block_job_lock();
948 if (ns != -1) {
949 timer_mod(&job->sleep_timer, ns);
950 }
356f59b8 951 job->busy = false;
fc24908e 952 block_job_unlock();
356f59b8
PB
953 qemu_coroutine_yield();
954
955 /* Set by block_job_enter before re-entering the coroutine. */
956 assert(job->busy);
957}
958
88691b37
PB
959void coroutine_fn block_job_pause_point(BlockJob *job)
960{
961 assert(job && block_job_started(job));
962
963 if (!block_job_should_pause(job)) {
964 return;
965 }
966 if (block_job_is_cancelled(job)) {
967 return;
968 }
969
970 if (job->driver->pause) {
971 job->driver->pause(job);
972 }
973
974 if (block_job_should_pause(job) && !block_job_is_cancelled(job)) {
58b295ba 975 BlockJobStatus status = job->status;
c9de4050
JS
976 block_job_state_transition(job, status == BLOCK_JOB_STATUS_READY ? \
977 BLOCK_JOB_STATUS_STANDBY : \
978 BLOCK_JOB_STATUS_PAUSED);
88691b37 979 job->paused = true;
fc24908e 980 block_job_do_yield(job, -1);
88691b37 981 job->paused = false;
c9de4050 982 block_job_state_transition(job, status);
88691b37
PB
983 }
984
985 if (job->driver->resume) {
986 job->driver->resume(job);
987 }
988}
989
f321dcb5
PB
990void block_job_resume_all(void)
991{
3d5d319e
AG
992 BlockJob *job, *next;
993
994 QLIST_FOREACH_SAFE(job, &block_jobs, job_list, next) {
f321dcb5
PB
995 AioContext *aio_context = blk_get_aio_context(job->blk);
996
997 aio_context_acquire(aio_context);
998 block_job_resume(job);
3d5d319e 999 block_job_unref(job);
f321dcb5
PB
1000 aio_context_release(aio_context);
1001 }
1002}
1003
aa9ef2e6
JS
1004/*
1005 * Conditionally enter a block_job pending a call to fn() while
1006 * under the block_job_lock critical section.
1007 */
1008static void block_job_enter_cond(BlockJob *job, bool(*fn)(BlockJob *job))
88691b37 1009{
eb05e011
PB
1010 if (!block_job_started(job)) {
1011 return;
1012 }
1013 if (job->deferred_to_main_loop) {
1014 return;
1015 }
1016
fc24908e 1017 block_job_lock();
356f59b8 1018 if (job->busy) {
fc24908e 1019 block_job_unlock();
356f59b8 1020 return;
88691b37 1021 }
356f59b8 1022
aa9ef2e6
JS
1023 if (fn && !fn(job)) {
1024 block_job_unlock();
1025 return;
1026 }
1027
fc24908e
PB
1028 assert(!job->deferred_to_main_loop);
1029 timer_del(&job->sleep_timer);
356f59b8 1030 job->busy = true;
fc24908e 1031 block_job_unlock();
356f59b8 1032 aio_co_wake(job->co);
88691b37
PB
1033}
1034
aa9ef2e6
JS
1035void block_job_enter(BlockJob *job)
1036{
1037 block_job_enter_cond(job, NULL);
1038}
1039
88691b37
PB
1040bool block_job_is_cancelled(BlockJob *job)
1041{
1042 return job->cancelled;
1043}
1044
5bf1d5a7 1045void block_job_sleep_ns(BlockJob *job, int64_t ns)
88691b37
PB
1046{
1047 assert(job->busy);
1048
1049 /* Check cancellation *before* setting busy = false, too! */
1050 if (block_job_is_cancelled(job)) {
1051 return;
1052 }
1053
88691b37 1054 if (!block_job_should_pause(job)) {
fc24908e 1055 block_job_do_yield(job, qemu_clock_get_ns(QEMU_CLOCK_REALTIME) + ns);
88691b37 1056 }
88691b37
PB
1057
1058 block_job_pause_point(job);
1059}
1060
1061void block_job_yield(BlockJob *job)
1062{
1063 assert(job->busy);
1064
1065 /* Check cancellation *before* setting busy = false, too! */
1066 if (block_job_is_cancelled(job)) {
1067 return;
1068 }
1069
88691b37 1070 if (!block_job_should_pause(job)) {
fc24908e 1071 block_job_do_yield(job, -1);
88691b37 1072 }
88691b37
PB
1073
1074 block_job_pause_point(job);
1075}
1076
2caf63a9
PB
1077void block_job_iostatus_reset(BlockJob *job)
1078{
4c241cf5
PB
1079 if (job->iostatus == BLOCK_DEVICE_IO_STATUS_OK) {
1080 return;
1081 }
1082 assert(job->user_paused && job->pause_count > 0);
2caf63a9
PB
1083 job->iostatus = BLOCK_DEVICE_IO_STATUS_OK;
1084}
1085
bcada37b 1086void block_job_event_ready(BlockJob *job)
a66a2a36 1087{
c9de4050 1088 block_job_state_transition(job, BLOCK_JOB_STATUS_READY);
ef6dbf1e
HR
1089 job->ready = true;
1090
559b935f
JS
1091 if (block_job_is_internal(job)) {
1092 return;
1093 }
1094
518848a2 1095 qapi_event_send_block_job_ready(job->driver->job_type,
8ccb9569 1096 job->id,
518848a2
MA
1097 job->len,
1098 job->offset,
1099 job->speed, &error_abort);
a66a2a36
PB
1100}
1101
81e254dc 1102BlockErrorAction block_job_error_action(BlockJob *job, BlockdevOnError on_err,
32c81a4a
PB
1103 int is_read, int error)
1104{
1105 BlockErrorAction action;
1106
1107 switch (on_err) {
1108 case BLOCKDEV_ON_ERROR_ENOSPC:
8c398252 1109 case BLOCKDEV_ON_ERROR_AUTO:
a589569f
WX
1110 action = (error == ENOSPC) ?
1111 BLOCK_ERROR_ACTION_STOP : BLOCK_ERROR_ACTION_REPORT;
32c81a4a
PB
1112 break;
1113 case BLOCKDEV_ON_ERROR_STOP:
a589569f 1114 action = BLOCK_ERROR_ACTION_STOP;
32c81a4a
PB
1115 break;
1116 case BLOCKDEV_ON_ERROR_REPORT:
a589569f 1117 action = BLOCK_ERROR_ACTION_REPORT;
32c81a4a
PB
1118 break;
1119 case BLOCKDEV_ON_ERROR_IGNORE:
a589569f 1120 action = BLOCK_ERROR_ACTION_IGNORE;
32c81a4a
PB
1121 break;
1122 default:
1123 abort();
1124 }
559b935f
JS
1125 if (!block_job_is_internal(job)) {
1126 qapi_event_send_block_job_error(job->id,
1127 is_read ? IO_OPERATION_TYPE_READ :
1128 IO_OPERATION_TYPE_WRITE,
1129 action, &error_abort);
1130 }
a589569f 1131 if (action == BLOCK_ERROR_ACTION_STOP) {
0ec4dfb8 1132 block_job_pause(job);
751ebd76 1133 /* make the pause user visible, which will be resumed from QMP. */
0ec4dfb8 1134 job->user_paused = true;
32c81a4a 1135 block_job_iostatus_set_err(job, error);
32c81a4a
PB
1136 }
1137 return action;
1138}
dec7d421
SH
1139
1140typedef struct {
1141 BlockJob *job;
dec7d421
SH
1142 AioContext *aio_context;
1143 BlockJobDeferToMainLoopFn *fn;
1144 void *opaque;
1145} BlockJobDeferToMainLoopData;
1146
1147static void block_job_defer_to_main_loop_bh(void *opaque)
1148{
1149 BlockJobDeferToMainLoopData *data = opaque;
1150 AioContext *aio_context;
1151
dec7d421
SH
1152 /* Prevent race with block_job_defer_to_main_loop() */
1153 aio_context_acquire(data->aio_context);
1154
1155 /* Fetch BDS AioContext again, in case it has changed */
b6d2e599 1156 aio_context = blk_get_aio_context(data->job->blk);
d79df2a2
PB
1157 if (aio_context != data->aio_context) {
1158 aio_context_acquire(aio_context);
1159 }
dec7d421
SH
1160
1161 data->fn(data->job, data->opaque);
1162
d79df2a2
PB
1163 if (aio_context != data->aio_context) {
1164 aio_context_release(aio_context);
1165 }
dec7d421
SH
1166
1167 aio_context_release(data->aio_context);
1168
1169 g_free(data);
1170}
1171
1172void block_job_defer_to_main_loop(BlockJob *job,
1173 BlockJobDeferToMainLoopFn *fn,
1174 void *opaque)
1175{
1176 BlockJobDeferToMainLoopData *data = g_malloc(sizeof(*data));
1177 data->job = job;
b6d2e599 1178 data->aio_context = blk_get_aio_context(job->blk);
dec7d421
SH
1179 data->fn = fn;
1180 data->opaque = opaque;
794f0141 1181 job->deferred_to_main_loop = true;
dec7d421 1182
fffb6e12
PB
1183 aio_bh_schedule_oneshot(qemu_get_aio_context(),
1184 block_job_defer_to_main_loop_bh, data);
dec7d421 1185}