]> git.proxmox.com Git - mirror_qemu.git/blame - block/qcow2-snapshot.c
meson: convert hw/smbios
[mirror_qemu.git] / block / qcow2-snapshot.c
CommitLineData
c142442b
KW
1/*
2 * Block driver for the QCOW version 2 format
3 *
4 * Copyright (c) 2004-2006 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24
80c71a24 25#include "qemu/osdep.h"
7fa140ab 26#include "sysemu/block-backend.h"
da34e65c 27#include "qapi/error.h"
0d8c41da 28#include "qcow2.h"
58369e22 29#include "qemu/bswap.h"
d49b6836 30#include "qemu/error-report.h"
f348b6d1 31#include "qemu/cutils.h"
c142442b 32
099febf3
HR
33static void qcow2_free_single_snapshot(BlockDriverState *bs, int i)
34{
35 BDRVQcow2State *s = bs->opaque;
36
37 assert(i >= 0 && i < s->nb_snapshots);
38 g_free(s->snapshots[i].name);
39 g_free(s->snapshots[i].id_str);
40 g_free(s->snapshots[i].unknown_extra_data);
41 memset(&s->snapshots[i], 0, sizeof(s->snapshots[i]));
42}
43
ed6ccf0f 44void qcow2_free_snapshots(BlockDriverState *bs)
c142442b 45{
ff99129a 46 BDRVQcow2State *s = bs->opaque;
c142442b
KW
47 int i;
48
49 for(i = 0; i < s->nb_snapshots; i++) {
099febf3 50 qcow2_free_single_snapshot(bs, i);
c142442b 51 }
7267c094 52 g_free(s->snapshots);
c142442b
KW
53 s->snapshots = NULL;
54 s->nb_snapshots = 0;
55}
56
f91f1f15
HR
57/*
58 * If @repair is true, try to repair a broken snapshot table instead
59 * of just returning an error:
60 *
099febf3
HR
61 * - If the snapshot table was too long, set *nb_clusters_reduced to
62 * the number of snapshots removed off the end.
63 * The caller will update the on-disk nb_snapshots accordingly;
64 * this leaks clusters, but is safe.
65 * (The on-disk information must be updated before
66 * qcow2_check_refcounts(), because that function relies on
67 * s->nb_snapshots to reflect the on-disk value.)
68 *
f91f1f15
HR
69 * - If there were snapshots with too much extra metadata, increment
70 * *extra_data_dropped for each.
71 * This requires the caller to eventually rewrite the whole snapshot
72 * table, which requires cluster allocation. Therefore, this should
73 * be done only after qcow2_check_refcounts() made sure the refcount
74 * structures are valid.
75 * (In the meantime, the image is still valid because
76 * qcow2_check_refcounts() does not do anything with snapshots'
77 * extra data.)
78 */
79static int qcow2_do_read_snapshots(BlockDriverState *bs, bool repair,
099febf3 80 int *nb_clusters_reduced,
f91f1f15
HR
81 int *extra_data_dropped,
82 Error **errp)
c142442b 83{
ff99129a 84 BDRVQcow2State *s = bs->opaque;
c142442b 85 QCowSnapshotHeader h;
c2c9a466 86 QCowSnapshotExtraData extra;
c142442b
KW
87 QCowSnapshot *sn;
88 int i, id_str_size, name_size;
099febf3 89 int64_t offset, pre_sn_offset;
62414335 90 uint64_t table_length = 0;
42deb29f 91 int ret;
c142442b
KW
92
93 if (!s->nb_snapshots) {
94 s->snapshots = NULL;
95 s->snapshots_size = 0;
96 return 0;
97 }
98
99 offset = s->snapshots_offset;
5839e53b 100 s->snapshots = g_new0(QCowSnapshot, s->nb_snapshots);
42deb29f 101
c142442b 102 for(i = 0; i < s->nb_snapshots; i++) {
f91f1f15
HR
103 bool truncate_unknown_extra_data = false;
104
099febf3 105 pre_sn_offset = offset;
62414335
HR
106 table_length = ROUND_UP(table_length, 8);
107
42deb29f 108 /* Read statically sized part of the snapshot header */
9e029689 109 offset = ROUND_UP(offset, 8);
cf2ab8fc 110 ret = bdrv_pread(bs->file, offset, &h, sizeof(h));
42deb29f 111 if (ret < 0) {
ecf6c7c0 112 error_setg_errno(errp, -ret, "Failed to read snapshot table");
c142442b 113 goto fail;
42deb29f
KW
114 }
115
c142442b
KW
116 offset += sizeof(h);
117 sn = s->snapshots + i;
118 sn->l1_table_offset = be64_to_cpu(h.l1_table_offset);
119 sn->l1_size = be32_to_cpu(h.l1_size);
120 sn->vm_state_size = be32_to_cpu(h.vm_state_size);
121 sn->date_sec = be32_to_cpu(h.date_sec);
122 sn->date_nsec = be32_to_cpu(h.date_nsec);
123 sn->vm_clock_nsec = be64_to_cpu(h.vm_clock_nsec);
fcf9a6b7 124 sn->extra_data_size = be32_to_cpu(h.extra_data_size);
c142442b
KW
125
126 id_str_size = be16_to_cpu(h.id_str_size);
127 name_size = be16_to_cpu(h.name_size);
128
fcf9a6b7 129 if (sn->extra_data_size > QCOW_MAX_SNAPSHOT_EXTRA_DATA) {
f91f1f15
HR
130 if (!repair) {
131 ret = -EFBIG;
132 error_setg(errp, "Too much extra metadata in snapshot table "
133 "entry %i", i);
134 error_append_hint(errp, "You can force-remove this extra "
135 "metadata with qemu-img check -r all\n");
136 goto fail;
137 }
138
139 fprintf(stderr, "Discarding too much extra metadata in snapshot "
140 "table entry %i (%" PRIu32 " > %u)\n",
141 i, sn->extra_data_size, QCOW_MAX_SNAPSHOT_EXTRA_DATA);
142
143 (*extra_data_dropped)++;
144 truncate_unknown_extra_data = true;
fcf9a6b7
HR
145 }
146
147 /* Read known extra data */
cf2ab8fc 148 ret = bdrv_pread(bs->file, offset, &extra,
fcf9a6b7 149 MIN(sizeof(extra), sn->extra_data_size));
c2c9a466 150 if (ret < 0) {
ecf6c7c0 151 error_setg_errno(errp, -ret, "Failed to read snapshot table");
c2c9a466
KW
152 goto fail;
153 }
fcf9a6b7 154 offset += MIN(sizeof(extra), sn->extra_data_size);
c142442b 155
fcf9a6b7
HR
156 if (sn->extra_data_size >= endof(QCowSnapshotExtraData,
157 vm_state_size_large)) {
c2c9a466
KW
158 sn->vm_state_size = be64_to_cpu(extra.vm_state_size_large);
159 }
160
fcf9a6b7 161 if (sn->extra_data_size >= endof(QCowSnapshotExtraData, disk_size)) {
90b27759
KW
162 sn->disk_size = be64_to_cpu(extra.disk_size);
163 } else {
164 sn->disk_size = bs->total_sectors * BDRV_SECTOR_SIZE;
165 }
166
fcf9a6b7 167 if (sn->extra_data_size > sizeof(extra)) {
f91f1f15
HR
168 uint64_t extra_data_end;
169 size_t unknown_extra_data_size;
170
171 extra_data_end = offset + sn->extra_data_size - sizeof(extra);
fcf9a6b7 172
f91f1f15
HR
173 if (truncate_unknown_extra_data) {
174 sn->extra_data_size = QCOW_MAX_SNAPSHOT_EXTRA_DATA;
175 }
176
177 /* Store unknown extra data */
178 unknown_extra_data_size = sn->extra_data_size - sizeof(extra);
fcf9a6b7
HR
179 sn->unknown_extra_data = g_malloc(unknown_extra_data_size);
180 ret = bdrv_pread(bs->file, offset, sn->unknown_extra_data,
181 unknown_extra_data_size);
182 if (ret < 0) {
f91f1f15
HR
183 error_setg_errno(errp, -ret,
184 "Failed to read snapshot table");
fcf9a6b7
HR
185 goto fail;
186 }
f91f1f15 187 offset = extra_data_end;
fcf9a6b7
HR
188 }
189
42deb29f 190 /* Read snapshot ID */
7267c094 191 sn->id_str = g_malloc(id_str_size + 1);
cf2ab8fc 192 ret = bdrv_pread(bs->file, offset, sn->id_str, id_str_size);
42deb29f 193 if (ret < 0) {
ecf6c7c0 194 error_setg_errno(errp, -ret, "Failed to read snapshot table");
c142442b 195 goto fail;
42deb29f 196 }
c142442b
KW
197 offset += id_str_size;
198 sn->id_str[id_str_size] = '\0';
199
42deb29f 200 /* Read snapshot name */
7267c094 201 sn->name = g_malloc(name_size + 1);
cf2ab8fc 202 ret = bdrv_pread(bs->file, offset, sn->name, name_size);
42deb29f 203 if (ret < 0) {
ecf6c7c0 204 error_setg_errno(errp, -ret, "Failed to read snapshot table");
c142442b 205 goto fail;
42deb29f 206 }
c142442b
KW
207 offset += name_size;
208 sn->name[name_size] = '\0';
5dae6e30 209
62414335
HR
210 /* Note that the extra data may have been truncated */
211 table_length += sizeof(h) + sn->extra_data_size + id_str_size +
212 name_size;
213 if (!repair) {
214 assert(table_length == offset - s->snapshots_offset);
215 }
216
217 if (table_length > QCOW_MAX_SNAPSHOTS_SIZE ||
218 offset - s->snapshots_offset > INT_MAX)
219 {
099febf3
HR
220 if (!repair) {
221 ret = -EFBIG;
222 error_setg(errp, "Snapshot table is too big");
223 error_append_hint(errp, "You can force-remove all %u "
224 "overhanging snapshots with qemu-img check "
225 "-r all\n", s->nb_snapshots - i);
226 goto fail;
227 }
228
229 fprintf(stderr, "Discarding %u overhanging snapshots (snapshot "
230 "table is too big)\n", s->nb_snapshots - i);
231
232 *nb_clusters_reduced += (s->nb_snapshots - i);
233
234 /* Discard current snapshot also */
235 qcow2_free_single_snapshot(bs, i);
236
237 /*
238 * This leaks all the rest of the snapshot table and the
239 * snapshots' clusters, but we run in check -r all mode,
240 * so qcow2_check_refcounts() will take care of it.
241 */
242 s->nb_snapshots = i;
243 offset = pre_sn_offset;
244 break;
5dae6e30 245 }
c142442b 246 }
42deb29f 247
5dae6e30 248 assert(offset - s->snapshots_offset <= INT_MAX);
c142442b
KW
249 s->snapshots_size = offset - s->snapshots_offset;
250 return 0;
42deb29f
KW
251
252fail:
ed6ccf0f 253 qcow2_free_snapshots(bs);
42deb29f 254 return ret;
c142442b
KW
255}
256
f91f1f15
HR
257int qcow2_read_snapshots(BlockDriverState *bs, Error **errp)
258{
099febf3 259 return qcow2_do_read_snapshots(bs, false, NULL, NULL, errp);
f91f1f15
HR
260}
261
c142442b 262/* add at the end of the file a new list of snapshots */
e0314b56 263int qcow2_write_snapshots(BlockDriverState *bs)
c142442b 264{
ff99129a 265 BDRVQcow2State *s = bs->opaque;
c142442b
KW
266 QCowSnapshot *sn;
267 QCowSnapshotHeader h;
c2c9a466 268 QCowSnapshotExtraData extra;
c142442b 269 int i, name_size, id_str_size, snapshots_size;
d69969c4
KW
270 struct {
271 uint32_t nb_snapshots;
272 uint64_t snapshots_offset;
273 } QEMU_PACKED header_data;
5dae6e30 274 int64_t offset, snapshots_offset = 0;
07fd8779 275 int ret;
c142442b
KW
276
277 /* compute the size of the snapshots */
278 offset = 0;
279 for(i = 0; i < s->nb_snapshots; i++) {
280 sn = s->snapshots + i;
9e029689 281 offset = ROUND_UP(offset, 8);
c142442b 282 offset += sizeof(h);
fcf9a6b7 283 offset += MAX(sizeof(extra), sn->extra_data_size);
c142442b
KW
284 offset += strlen(sn->id_str);
285 offset += strlen(sn->name);
5dae6e30
KW
286
287 if (offset > QCOW_MAX_SNAPSHOTS_SIZE) {
288 ret = -EFBIG;
289 goto fail;
290 }
c142442b 291 }
5dae6e30
KW
292
293 assert(offset <= INT_MAX);
c142442b
KW
294 snapshots_size = offset;
295
07fd8779 296 /* Allocate space for the new snapshot list */
ed6ccf0f 297 snapshots_offset = qcow2_alloc_clusters(bs, snapshots_size);
c142442b 298 offset = snapshots_offset;
5d757b56 299 if (offset < 0) {
37d41f0a
HR
300 ret = offset;
301 goto fail;
5d757b56 302 }
f6977f15
SH
303 ret = bdrv_flush(bs);
304 if (ret < 0) {
37d41f0a 305 goto fail;
f6977f15 306 }
c142442b 307
cf93980e
HR
308 /* The snapshot list position has not yet been updated, so these clusters
309 * must indeed be completely free */
966b000f 310 ret = qcow2_pre_write_overlap_check(bs, 0, offset, snapshots_size, false);
cf93980e 311 if (ret < 0) {
37d41f0a 312 goto fail;
cf93980e
HR
313 }
314
315
07fd8779 316 /* Write all snapshots to the new list */
c142442b
KW
317 for(i = 0; i < s->nb_snapshots; i++) {
318 sn = s->snapshots + i;
319 memset(&h, 0, sizeof(h));
320 h.l1_table_offset = cpu_to_be64(sn->l1_table_offset);
321 h.l1_size = cpu_to_be32(sn->l1_size);
c2c9a466
KW
322 /* If it doesn't fit in 32 bit, older implementations should treat it
323 * as a disk-only snapshot rather than truncate the VM state */
324 if (sn->vm_state_size <= 0xffffffff) {
325 h.vm_state_size = cpu_to_be32(sn->vm_state_size);
326 }
c142442b
KW
327 h.date_sec = cpu_to_be32(sn->date_sec);
328 h.date_nsec = cpu_to_be32(sn->date_nsec);
329 h.vm_clock_nsec = cpu_to_be64(sn->vm_clock_nsec);
fcf9a6b7
HR
330 h.extra_data_size = cpu_to_be32(MAX(sizeof(extra),
331 sn->extra_data_size));
c2c9a466
KW
332
333 memset(&extra, 0, sizeof(extra));
334 extra.vm_state_size_large = cpu_to_be64(sn->vm_state_size);
90b27759 335 extra.disk_size = cpu_to_be64(sn->disk_size);
c142442b
KW
336
337 id_str_size = strlen(sn->id_str);
338 name_size = strlen(sn->name);
88fb1535 339 assert(id_str_size <= UINT16_MAX && name_size <= UINT16_MAX);
c142442b
KW
340 h.id_str_size = cpu_to_be16(id_str_size);
341 h.name_size = cpu_to_be16(name_size);
9e029689 342 offset = ROUND_UP(offset, 8);
07fd8779 343
d9ca2ea2 344 ret = bdrv_pwrite(bs->file, offset, &h, sizeof(h));
07fd8779 345 if (ret < 0) {
c142442b 346 goto fail;
07fd8779 347 }
c142442b 348 offset += sizeof(h);
07fd8779 349
d9ca2ea2 350 ret = bdrv_pwrite(bs->file, offset, &extra, sizeof(extra));
c2c9a466
KW
351 if (ret < 0) {
352 goto fail;
353 }
354 offset += sizeof(extra);
355
fcf9a6b7
HR
356 if (sn->extra_data_size > sizeof(extra)) {
357 size_t unknown_extra_data_size =
358 sn->extra_data_size - sizeof(extra);
359
360 /* qcow2_read_snapshots() ensures no unbounded allocation */
361 assert(unknown_extra_data_size <= BDRV_REQUEST_MAX_BYTES);
362 assert(sn->unknown_extra_data);
363
364 ret = bdrv_pwrite(bs->file, offset, sn->unknown_extra_data,
365 unknown_extra_data_size);
366 if (ret < 0) {
367 goto fail;
368 }
369 offset += unknown_extra_data_size;
370 }
371
d9ca2ea2 372 ret = bdrv_pwrite(bs->file, offset, sn->id_str, id_str_size);
07fd8779 373 if (ret < 0) {
c142442b 374 goto fail;
07fd8779 375 }
c142442b 376 offset += id_str_size;
07fd8779 377
d9ca2ea2 378 ret = bdrv_pwrite(bs->file, offset, sn->name, name_size);
07fd8779 379 if (ret < 0) {
c142442b 380 goto fail;
07fd8779 381 }
c142442b
KW
382 offset += name_size;
383 }
384
07fd8779
KW
385 /*
386 * Update the header to point to the new snapshot table. This requires the
387 * new table and its refcounts to be stable on disk.
07fd8779
KW
388 */
389 ret = bdrv_flush(bs);
390 if (ret < 0) {
391 goto fail;
392 }
393
d69969c4 394 QEMU_BUILD_BUG_ON(offsetof(QCowHeader, snapshots_offset) !=
d8fa8442 395 endof(QCowHeader, nb_snapshots));
d69969c4
KW
396
397 header_data.nb_snapshots = cpu_to_be32(s->nb_snapshots);
398 header_data.snapshots_offset = cpu_to_be64(snapshots_offset);
07fd8779 399
d9ca2ea2 400 ret = bdrv_pwrite_sync(bs->file, offsetof(QCowHeader, nb_snapshots),
d69969c4 401 &header_data, sizeof(header_data));
07fd8779 402 if (ret < 0) {
c142442b 403 goto fail;
07fd8779 404 }
c142442b
KW
405
406 /* free the old snapshot table */
6cfcb9b8
KW
407 qcow2_free_clusters(bs, s->snapshots_offset, s->snapshots_size,
408 QCOW2_DISCARD_SNAPSHOT);
c142442b
KW
409 s->snapshots_offset = snapshots_offset;
410 s->snapshots_size = snapshots_size;
411 return 0;
07fd8779
KW
412
413fail:
9186ad96
HR
414 if (snapshots_offset > 0) {
415 qcow2_free_clusters(bs, snapshots_offset, snapshots_size,
416 QCOW2_DISCARD_ALWAYS);
417 }
07fd8779 418 return ret;
c142442b
KW
419}
420
8bc584fe
HR
421int coroutine_fn qcow2_check_read_snapshot_table(BlockDriverState *bs,
422 BdrvCheckResult *result,
423 BdrvCheckMode fix)
424{
425 BDRVQcow2State *s = bs->opaque;
426 Error *local_err = NULL;
099febf3 427 int nb_clusters_reduced = 0;
f91f1f15 428 int extra_data_dropped = 0;
8bc584fe
HR
429 int ret;
430 struct {
431 uint32_t nb_snapshots;
432 uint64_t snapshots_offset;
433 } QEMU_PACKED snapshot_table_pointer;
434
435 /* qcow2_do_open() discards this information in check mode */
436 ret = bdrv_pread(bs->file, offsetof(QCowHeader, nb_snapshots),
437 &snapshot_table_pointer, sizeof(snapshot_table_pointer));
438 if (ret < 0) {
439 result->check_errors++;
440 fprintf(stderr, "ERROR failed to read the snapshot table pointer from "
441 "the image header: %s\n", strerror(-ret));
442 return ret;
443 }
444
445 s->snapshots_offset = be64_to_cpu(snapshot_table_pointer.snapshots_offset);
446 s->nb_snapshots = be32_to_cpu(snapshot_table_pointer.nb_snapshots);
447
d2b1d1ec
HR
448 if (s->nb_snapshots > QCOW_MAX_SNAPSHOTS && (fix & BDRV_FIX_ERRORS)) {
449 fprintf(stderr, "Discarding %u overhanging snapshots\n",
450 s->nb_snapshots - QCOW_MAX_SNAPSHOTS);
451
452 nb_clusters_reduced += s->nb_snapshots - QCOW_MAX_SNAPSHOTS;
453 s->nb_snapshots = QCOW_MAX_SNAPSHOTS;
454 }
455
8bc584fe
HR
456 ret = qcow2_validate_table(bs, s->snapshots_offset, s->nb_snapshots,
457 sizeof(QCowSnapshotHeader),
458 sizeof(QCowSnapshotHeader) * QCOW_MAX_SNAPSHOTS,
459 "snapshot table", &local_err);
460 if (ret < 0) {
461 result->check_errors++;
462 error_reportf_err(local_err, "ERROR ");
463
d2b1d1ec
HR
464 if (s->nb_snapshots > QCOW_MAX_SNAPSHOTS) {
465 fprintf(stderr, "You can force-remove all %u overhanging snapshots "
466 "with qemu-img check -r all\n",
467 s->nb_snapshots - QCOW_MAX_SNAPSHOTS);
468 }
469
8bc584fe
HR
470 /* We did not read the snapshot table, so invalidate this information */
471 s->snapshots_offset = 0;
472 s->nb_snapshots = 0;
473
474 return ret;
475 }
476
477 qemu_co_mutex_unlock(&s->lock);
f91f1f15 478 ret = qcow2_do_read_snapshots(bs, fix & BDRV_FIX_ERRORS,
099febf3
HR
479 &nb_clusters_reduced, &extra_data_dropped,
480 &local_err);
8bc584fe
HR
481 qemu_co_mutex_lock(&s->lock);
482 if (ret < 0) {
483 result->check_errors++;
484 error_reportf_err(local_err,
485 "ERROR failed to read the snapshot table: ");
486
487 /* We did not read the snapshot table, so invalidate this information */
488 s->snapshots_offset = 0;
489 s->nb_snapshots = 0;
490
491 return ret;
492 }
099febf3
HR
493 result->corruptions += nb_clusters_reduced + extra_data_dropped;
494
495 if (nb_clusters_reduced) {
496 /*
497 * Update image header now, because:
498 * (1) qcow2_check_refcounts() relies on s->nb_snapshots to be
499 * the same as what the image header says,
500 * (2) this leaks clusters, but qcow2_check_refcounts() will
501 * fix that.
502 */
503 assert(fix & BDRV_FIX_ERRORS);
504
505 snapshot_table_pointer.nb_snapshots = cpu_to_be32(s->nb_snapshots);
506 ret = bdrv_pwrite_sync(bs->file, offsetof(QCowHeader, nb_snapshots),
507 &snapshot_table_pointer.nb_snapshots,
508 sizeof(snapshot_table_pointer.nb_snapshots));
509 if (ret < 0) {
510 result->check_errors++;
511 fprintf(stderr, "ERROR failed to update the snapshot count in the "
512 "image header: %s\n", strerror(-ret));
513 return ret;
514 }
515
516 result->corruptions_fixed += nb_clusters_reduced;
517 result->corruptions -= nb_clusters_reduced;
518 }
8bc584fe 519
e40e6e88
HR
520 /*
521 * All of v3 images' snapshot table entries need to have at least
522 * 16 bytes of extra data.
523 */
524 if (s->qcow_version >= 3) {
525 int i;
526 for (i = 0; i < s->nb_snapshots; i++) {
527 if (s->snapshots[i].extra_data_size <
528 sizeof_field(QCowSnapshotExtraData, vm_state_size_large) +
529 sizeof_field(QCowSnapshotExtraData, disk_size))
530 {
531 result->corruptions++;
532 fprintf(stderr, "%s snapshot table entry %i is incomplete\n",
533 fix & BDRV_FIX_ERRORS ? "Repairing" : "ERROR", i);
534 }
535 }
536 }
537
8bc584fe
HR
538 return 0;
539}
540
fe446b5d
HR
541int coroutine_fn qcow2_check_fix_snapshot_table(BlockDriverState *bs,
542 BdrvCheckResult *result,
543 BdrvCheckMode fix)
544{
545 BDRVQcow2State *s = bs->opaque;
546 int ret;
547
548 if (result->corruptions && (fix & BDRV_FIX_ERRORS)) {
549 qemu_co_mutex_unlock(&s->lock);
550 ret = qcow2_write_snapshots(bs);
551 qemu_co_mutex_lock(&s->lock);
552 if (ret < 0) {
553 result->check_errors++;
554 fprintf(stderr, "ERROR failed to update snapshot table: %s\n",
555 strerror(-ret));
556 return ret;
557 }
558
559 result->corruptions_fixed += result->corruptions;
560 result->corruptions = 0;
561 }
562
563 return 0;
564}
565
c142442b
KW
566static void find_new_snapshot_id(BlockDriverState *bs,
567 char *id_str, int id_str_size)
568{
ff99129a 569 BDRVQcow2State *s = bs->opaque;
c142442b 570 QCowSnapshot *sn;
00c49b21
HR
571 int i;
572 unsigned long id, id_max = 0;
c142442b
KW
573
574 for(i = 0; i < s->nb_snapshots; i++) {
575 sn = s->snapshots + i;
576 id = strtoul(sn->id_str, NULL, 10);
577 if (id > id_max)
578 id_max = id;
579 }
00c49b21 580 snprintf(id_str, id_str_size, "%lu", id_max + 1);
c142442b
KW
581}
582
a89d89d3
WX
583static int find_snapshot_by_id_and_name(BlockDriverState *bs,
584 const char *id,
585 const char *name)
c142442b 586{
ff99129a 587 BDRVQcow2State *s = bs->opaque;
c142442b
KW
588 int i;
589
a89d89d3
WX
590 if (id && name) {
591 for (i = 0; i < s->nb_snapshots; i++) {
592 if (!strcmp(s->snapshots[i].id_str, id) &&
593 !strcmp(s->snapshots[i].name, name)) {
594 return i;
595 }
596 }
597 } else if (id) {
598 for (i = 0; i < s->nb_snapshots; i++) {
599 if (!strcmp(s->snapshots[i].id_str, id)) {
600 return i;
601 }
602 }
603 } else if (name) {
604 for (i = 0; i < s->nb_snapshots; i++) {
605 if (!strcmp(s->snapshots[i].name, name)) {
606 return i;
607 }
608 }
c142442b 609 }
a89d89d3 610
c142442b
KW
611 return -1;
612}
613
a89d89d3
WX
614static int find_snapshot_by_id_or_name(BlockDriverState *bs,
615 const char *id_or_name)
c142442b 616{
a89d89d3 617 int ret;
c142442b 618
a89d89d3
WX
619 ret = find_snapshot_by_id_and_name(bs, id_or_name, NULL);
620 if (ret >= 0) {
c142442b 621 return ret;
c142442b 622 }
a89d89d3 623 return find_snapshot_by_id_and_name(bs, NULL, id_or_name);
c142442b
KW
624}
625
626/* if no id is provided, a new one is constructed */
ed6ccf0f 627int qcow2_snapshot_create(BlockDriverState *bs, QEMUSnapshotInfo *sn_info)
c142442b 628{
ff99129a 629 BDRVQcow2State *s = bs->opaque;
d1ea98d5
KW
630 QCowSnapshot *new_snapshot_list = NULL;
631 QCowSnapshot *old_snapshot_list = NULL;
632 QCowSnapshot sn1, *sn = &sn1;
c142442b
KW
633 int i, ret;
634 uint64_t *l1_table = NULL;
5d757b56 635 int64_t l1_table_offset;
c142442b 636
ce48f2f4
KW
637 if (s->nb_snapshots >= QCOW_MAX_SNAPSHOTS) {
638 return -EFBIG;
639 }
640
aa8b34c1
KW
641 if (has_data_file(bs)) {
642 return -ENOTSUP;
643 }
644
c142442b
KW
645 memset(sn, 0, sizeof(*sn));
646
407bc150
YW
647 /* Generate an ID */
648 find_new_snapshot_id(bs, sn_info->id_str, sizeof(sn_info->id_str));
c142442b 649
03343166 650 /* Populate sn with passed data */
7267c094 651 sn->id_str = g_strdup(sn_info->id_str);
7267c094 652 sn->name = g_strdup(sn_info->name);
03343166 653
90b27759 654 sn->disk_size = bs->total_sectors * BDRV_SECTOR_SIZE;
c142442b
KW
655 sn->vm_state_size = sn_info->vm_state_size;
656 sn->date_sec = sn_info->date_sec;
657 sn->date_nsec = sn_info->date_nsec;
658 sn->vm_clock_nsec = sn_info->vm_clock_nsec;
fcf9a6b7 659 sn->extra_data_size = sizeof(QCowSnapshotExtraData);
c142442b 660
03343166 661 /* Allocate the L1 table of the snapshot and copy the current one there. */
5d757b56
KW
662 l1_table_offset = qcow2_alloc_clusters(bs, s->l1_size * sizeof(uint64_t));
663 if (l1_table_offset < 0) {
d1ea98d5 664 ret = l1_table_offset;
5d757b56
KW
665 goto fail;
666 }
667
668 sn->l1_table_offset = l1_table_offset;
c142442b
KW
669 sn->l1_size = s->l1_size;
670
5839e53b 671 l1_table = g_try_new(uint64_t, s->l1_size);
de82815d
KW
672 if (s->l1_size && l1_table == NULL) {
673 ret = -ENOMEM;
674 goto fail;
675 }
676
c142442b
KW
677 for(i = 0; i < s->l1_size; i++) {
678 l1_table[i] = cpu_to_be64(s->l1_table[i]);
679 }
d1ea98d5 680
231bb267 681 ret = qcow2_pre_write_overlap_check(bs, 0, sn->l1_table_offset,
966b000f 682 s->l1_size * sizeof(uint64_t), false);
cf93980e
HR
683 if (ret < 0) {
684 goto fail;
685 }
686
d9ca2ea2 687 ret = bdrv_pwrite(bs->file, sn->l1_table_offset, l1_table,
d1ea98d5
KW
688 s->l1_size * sizeof(uint64_t));
689 if (ret < 0) {
c142442b 690 goto fail;
d1ea98d5
KW
691 }
692
7267c094 693 g_free(l1_table);
c142442b
KW
694 l1_table = NULL;
695
d1ea98d5
KW
696 /*
697 * Increase the refcounts of all clusters and make sure everything is
698 * stable on disk before updating the snapshot table to contain a pointer
699 * to the new L1 table.
700 */
701 ret = qcow2_update_snapshot_refcount(bs, s->l1_table_offset, s->l1_size, 1);
702 if (ret < 0) {
703 goto fail;
704 }
705
d1ea98d5 706 /* Append the new snapshot to the snapshot list */
5839e53b 707 new_snapshot_list = g_new(QCowSnapshot, s->nb_snapshots + 1);
c142442b 708 if (s->snapshots) {
d1ea98d5
KW
709 memcpy(new_snapshot_list, s->snapshots,
710 s->nb_snapshots * sizeof(QCowSnapshot));
711 old_snapshot_list = s->snapshots;
c142442b 712 }
d1ea98d5 713 s->snapshots = new_snapshot_list;
c142442b
KW
714 s->snapshots[s->nb_snapshots++] = *sn;
715
d1ea98d5
KW
716 ret = qcow2_write_snapshots(bs);
717 if (ret < 0) {
718 g_free(s->snapshots);
719 s->snapshots = old_snapshot_list;
84757f7e 720 s->nb_snapshots--;
c142442b 721 goto fail;
d1ea98d5
KW
722 }
723
724 g_free(old_snapshot_list);
725
1ebf561c
KW
726 /* The VM state isn't needed any more in the active L1 table; in fact, it
727 * hurts by causing expensive COW for the next snapshot. */
d2cb36af 728 qcow2_cluster_discard(bs, qcow2_vm_state_offset(s),
9e029689 729 ROUND_UP(sn->vm_state_size, s->cluster_size),
d2cb36af 730 QCOW2_DISCARD_NEVER, false);
1ebf561c 731
c142442b 732#ifdef DEBUG_ALLOC
6cbc3031
PH
733 {
734 BdrvCheckResult result = {0};
b35278f7 735 qcow2_check_refcounts(bs, &result, 0);
6cbc3031 736 }
c142442b
KW
737#endif
738 return 0;
03343166
KW
739
740fail:
741 g_free(sn->id_str);
7267c094
AL
742 g_free(sn->name);
743 g_free(l1_table);
d1ea98d5
KW
744
745 return ret;
c142442b
KW
746}
747
748/* copy the snapshot 'snapshot_name' into the current disk image */
ed6ccf0f 749int qcow2_snapshot_goto(BlockDriverState *bs, const char *snapshot_id)
c142442b 750{
ff99129a 751 BDRVQcow2State *s = bs->opaque;
c142442b 752 QCowSnapshot *sn;
a8475d75 753 Error *local_err = NULL;
35d7ace7
KW
754 int i, snapshot_index;
755 int cur_l1_bytes, sn_l1_bytes;
589f284b 756 int ret;
43a0cac4 757 uint64_t *sn_l1_table = NULL;
c142442b 758
aa8b34c1
KW
759 if (has_data_file(bs)) {
760 return -ENOTSUP;
761 }
762
589f284b 763 /* Search the snapshot */
c142442b 764 snapshot_index = find_snapshot_by_id_or_name(bs, snapshot_id);
589f284b 765 if (snapshot_index < 0) {
c142442b 766 return -ENOENT;
589f284b 767 }
c142442b
KW
768 sn = &s->snapshots[snapshot_index];
769
a8475d75
AG
770 ret = qcow2_validate_table(bs, sn->l1_table_offset, sn->l1_size,
771 sizeof(uint64_t), QCOW_MAX_L1_SIZE,
772 "Snapshot L1 table", &local_err);
773 if (ret < 0) {
774 error_report_err(local_err);
775 goto fail;
776 }
777
90b27759 778 if (sn->disk_size != bs->total_sectors * BDRV_SECTOR_SIZE) {
7fa140ab
EB
779 BlockBackend *blk = blk_new_with_bs(bs, BLK_PERM_RESIZE, BLK_PERM_ALL,
780 &local_err);
781 if (!blk) {
782 error_report_err(local_err);
783 ret = -ENOTSUP;
784 goto fail;
785 }
786
787 ret = blk_truncate(blk, sn->disk_size, true, PREALLOC_MODE_OFF, 0,
788 &local_err);
789 blk_unref(blk);
790 if (ret < 0) {
791 error_report_err(local_err);
792 goto fail;
793 }
90b27759
KW
794 }
795
589f284b
KW
796 /*
797 * Make sure that the current L1 table is big enough to contain the whole
798 * L1 table of the snapshot. If the snapshot L1 table is smaller, the
799 * current one must be padded with zeros.
800 */
801 ret = qcow2_grow_l1_table(bs, sn->l1_size, true);
802 if (ret < 0) {
c142442b 803 goto fail;
589f284b 804 }
c142442b 805
35d7ace7
KW
806 cur_l1_bytes = s->l1_size * sizeof(uint64_t);
807 sn_l1_bytes = sn->l1_size * sizeof(uint64_t);
808
589f284b
KW
809 /*
810 * Copy the snapshot L1 table to the current L1 table.
811 *
812 * Before overwriting the old current L1 table on disk, make sure to
813 * increase all refcounts for the clusters referenced by the new one.
43a0cac4
KW
814 * Decrease the refcount referenced by the old one only when the L1
815 * table is overwritten.
589f284b 816 */
de82815d
KW
817 sn_l1_table = g_try_malloc0(cur_l1_bytes);
818 if (cur_l1_bytes && sn_l1_table == NULL) {
819 ret = -ENOMEM;
820 goto fail;
821 }
43a0cac4 822
cf2ab8fc 823 ret = bdrv_pread(bs->file, sn->l1_table_offset,
9a4f4c31 824 sn_l1_table, sn_l1_bytes);
43a0cac4
KW
825 if (ret < 0) {
826 goto fail;
827 }
828
829 ret = qcow2_update_snapshot_refcount(bs, sn->l1_table_offset,
830 sn->l1_size, 1);
589f284b 831 if (ret < 0) {
c142442b 832 goto fail;
589f284b
KW
833 }
834
231bb267 835 ret = qcow2_pre_write_overlap_check(bs, QCOW2_OL_ACTIVE_L1,
966b000f
KW
836 s->l1_table_offset, cur_l1_bytes,
837 false);
cf93980e
HR
838 if (ret < 0) {
839 goto fail;
840 }
841
d9ca2ea2 842 ret = bdrv_pwrite_sync(bs->file, s->l1_table_offset, sn_l1_table,
589f284b
KW
843 cur_l1_bytes);
844 if (ret < 0) {
c142442b 845 goto fail;
589f284b
KW
846 }
847
43a0cac4
KW
848 /*
849 * Decrease refcount of clusters of current L1 table.
850 *
851 * At this point, the in-memory s->l1_table points to the old L1 table,
852 * whereas on disk we already have the new one.
853 *
854 * qcow2_update_snapshot_refcount special cases the current L1 table to use
855 * the in-memory data instead of really using the offset to load a new one,
856 * which is why this works.
857 */
858 ret = qcow2_update_snapshot_refcount(bs, s->l1_table_offset,
859 s->l1_size, -1);
860
861 /*
862 * Now update the in-memory L1 table to be in sync with the on-disk one. We
863 * need to do this even if updating refcounts failed.
864 */
c142442b 865 for(i = 0;i < s->l1_size; i++) {
43a0cac4 866 s->l1_table[i] = be64_to_cpu(sn_l1_table[i]);
c142442b
KW
867 }
868
43a0cac4
KW
869 if (ret < 0) {
870 goto fail;
871 }
872
873 g_free(sn_l1_table);
874 sn_l1_table = NULL;
875
876 /*
877 * Update QCOW_OFLAG_COPIED in the active L1 table (it may have changed
878 * when we decreased the refcount of the old snapshot.
879 */
880 ret = qcow2_update_snapshot_refcount(bs, s->l1_table_offset, s->l1_size, 0);
589f284b 881 if (ret < 0) {
c142442b 882 goto fail;
589f284b 883 }
c142442b
KW
884
885#ifdef DEBUG_ALLOC
6cbc3031
PH
886 {
887 BdrvCheckResult result = {0};
b35278f7 888 qcow2_check_refcounts(bs, &result, 0);
6cbc3031 889 }
c142442b
KW
890#endif
891 return 0;
589f284b
KW
892
893fail:
43a0cac4 894 g_free(sn_l1_table);
589f284b 895 return ret;
c142442b
KW
896}
897
a89d89d3
WX
898int qcow2_snapshot_delete(BlockDriverState *bs,
899 const char *snapshot_id,
900 const char *name,
901 Error **errp)
c142442b 902{
ff99129a 903 BDRVQcow2State *s = bs->opaque;
9a476780 904 QCowSnapshot sn;
c142442b
KW
905 int snapshot_index, ret;
906
aa8b34c1
KW
907 if (has_data_file(bs)) {
908 return -ENOTSUP;
909 }
910
9a476780 911 /* Search the snapshot */
a89d89d3 912 snapshot_index = find_snapshot_by_id_and_name(bs, snapshot_id, name);
9a476780 913 if (snapshot_index < 0) {
a89d89d3 914 error_setg(errp, "Can't find the snapshot");
c142442b 915 return -ENOENT;
9a476780
KW
916 }
917 sn = s->snapshots[snapshot_index];
c142442b 918
db5794f1
AG
919 ret = qcow2_validate_table(bs, sn.l1_table_offset, sn.l1_size,
920 sizeof(uint64_t), QCOW_MAX_L1_SIZE,
921 "Snapshot L1 table", errp);
922 if (ret < 0) {
923 return ret;
924 }
925
9a476780
KW
926 /* Remove it from the snapshot list */
927 memmove(s->snapshots + snapshot_index,
928 s->snapshots + snapshot_index + 1,
929 (s->nb_snapshots - snapshot_index - 1) * sizeof(sn));
930 s->nb_snapshots--;
931 ret = qcow2_write_snapshots(bs);
932 if (ret < 0) {
39a611a3
JC
933 error_setg_errno(errp, -ret,
934 "Failed to remove snapshot from snapshot list");
c142442b 935 return ret;
9a476780
KW
936 }
937
938 /*
939 * The snapshot is now unused, clean up. If we fail after this point, we
940 * won't recover but just leak clusters.
941 */
fcf9a6b7 942 g_free(sn.unknown_extra_data);
9a476780
KW
943 g_free(sn.id_str);
944 g_free(sn.name);
945
946 /*
947 * Now decrease the refcounts of clusters referenced by the snapshot and
948 * free the L1 table.
949 */
950 ret = qcow2_update_snapshot_refcount(bs, sn.l1_table_offset,
951 sn.l1_size, -1);
952 if (ret < 0) {
39a611a3 953 error_setg_errno(errp, -ret, "Failed to free the cluster and L1 table");
c142442b 954 return ret;
9a476780 955 }
6cfcb9b8
KW
956 qcow2_free_clusters(bs, sn.l1_table_offset, sn.l1_size * sizeof(uint64_t),
957 QCOW2_DISCARD_SNAPSHOT);
c142442b 958
9a476780
KW
959 /* must update the copied flag on the current cluster offsets */
960 ret = qcow2_update_snapshot_refcount(bs, s->l1_table_offset, s->l1_size, 0);
c142442b 961 if (ret < 0) {
39a611a3
JC
962 error_setg_errno(errp, -ret,
963 "Failed to update snapshot status in disk");
c142442b
KW
964 return ret;
965 }
9a476780 966
c142442b 967#ifdef DEBUG_ALLOC
6cbc3031
PH
968 {
969 BdrvCheckResult result = {0};
b35278f7 970 qcow2_check_refcounts(bs, &result, 0);
6cbc3031 971 }
c142442b
KW
972#endif
973 return 0;
974}
975
ed6ccf0f 976int qcow2_snapshot_list(BlockDriverState *bs, QEMUSnapshotInfo **psn_tab)
c142442b 977{
ff99129a 978 BDRVQcow2State *s = bs->opaque;
c142442b
KW
979 QEMUSnapshotInfo *sn_tab, *sn_info;
980 QCowSnapshot *sn;
981 int i;
982
aa8b34c1
KW
983 if (has_data_file(bs)) {
984 return -ENOTSUP;
985 }
c142442b
KW
986 if (!s->nb_snapshots) {
987 *psn_tab = NULL;
988 return s->nb_snapshots;
989 }
990
5839e53b 991 sn_tab = g_new0(QEMUSnapshotInfo, s->nb_snapshots);
c142442b
KW
992 for(i = 0; i < s->nb_snapshots; i++) {
993 sn_info = sn_tab + i;
994 sn = s->snapshots + i;
995 pstrcpy(sn_info->id_str, sizeof(sn_info->id_str),
996 sn->id_str);
997 pstrcpy(sn_info->name, sizeof(sn_info->name),
998 sn->name);
999 sn_info->vm_state_size = sn->vm_state_size;
1000 sn_info->date_sec = sn->date_sec;
1001 sn_info->date_nsec = sn->date_nsec;
1002 sn_info->vm_clock_nsec = sn->vm_clock_nsec;
1003 }
1004 *psn_tab = sn_tab;
1005 return s->nb_snapshots;
1006}
1007
7b4c4781
WX
1008int qcow2_snapshot_load_tmp(BlockDriverState *bs,
1009 const char *snapshot_id,
1010 const char *name,
1011 Error **errp)
51ef6727 1012{
e3f652b3 1013 int i, snapshot_index;
ff99129a 1014 BDRVQcow2State *s = bs->opaque;
51ef6727 1015 QCowSnapshot *sn;
e3f652b3
KW
1016 uint64_t *new_l1_table;
1017 int new_l1_bytes;
1018 int ret;
51ef6727 1019
e3f652b3
KW
1020 assert(bs->read_only);
1021
1022 /* Search the snapshot */
7b4c4781 1023 snapshot_index = find_snapshot_by_id_and_name(bs, snapshot_id, name);
51ef6727 1024 if (snapshot_index < 0) {
7b4c4781
WX
1025 error_setg(errp,
1026 "Can't find snapshot");
51ef6727 1027 return -ENOENT;
1028 }
51ef6727 1029 sn = &s->snapshots[snapshot_index];
51ef6727 1030
e3f652b3 1031 /* Allocate and read in the snapshot's L1 table */
314e8d39
AG
1032 ret = qcow2_validate_table(bs, sn->l1_table_offset, sn->l1_size,
1033 sizeof(uint64_t), QCOW_MAX_L1_SIZE,
1034 "Snapshot L1 table", errp);
1035 if (ret < 0) {
1036 return ret;
6a83f8b5 1037 }
c05e4667 1038 new_l1_bytes = sn->l1_size * sizeof(uint64_t);
ef97d608 1039 new_l1_table = qemu_try_blockalign(bs->file->bs, new_l1_bytes);
de82815d
KW
1040 if (new_l1_table == NULL) {
1041 return -ENOMEM;
1042 }
51ef6727 1043
cf2ab8fc 1044 ret = bdrv_pread(bs->file, sn->l1_table_offset,
9a4f4c31 1045 new_l1_table, new_l1_bytes);
e3f652b3 1046 if (ret < 0) {
7b4c4781 1047 error_setg(errp, "Failed to read l1 table for snapshot");
de82815d 1048 qemu_vfree(new_l1_table);
e3f652b3 1049 return ret;
51ef6727 1050 }
1051
e3f652b3 1052 /* Switch the L1 table */
de82815d 1053 qemu_vfree(s->l1_table);
e3f652b3
KW
1054
1055 s->l1_size = sn->l1_size;
1056 s->l1_table_offset = sn->l1_table_offset;
1057 s->l1_table = new_l1_table;
1058
51ef6727 1059 for(i = 0;i < s->l1_size; i++) {
1060 be64_to_cpus(&s->l1_table[i]);
1061 }
e3f652b3 1062
51ef6727 1063 return 0;
1064}