]> git.proxmox.com Git - qemu.git/blame - block/cow.c
block: expect errors from bdrv_co_is_allocated
[qemu.git] / block / cow.c
CommitLineData
ea2384d3
FB
1/*
2 * Block driver for the COW format
5fafdf24 3 *
ea2384d3 4 * Copyright (c) 2004 Fabrice Bellard
5fafdf24 5 *
ea2384d3
FB
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
faf07963 24#include "qemu-common.h"
737e150e 25#include "block/block_int.h"
1de7afc9 26#include "qemu/module.h"
ea2384d3
FB
27
28/**************************************************************/
29/* COW block driver using file system holes */
30
31/* user mode linux compatible COW file */
/* Magic number of a COW image; compared against the header after be32_to_cpu(). */
#define COW_MAGIC 0x4f4f4f4d /* MOOO */
/* The only header version this driver accepts. */
#define COW_VERSION 2

/*
 * Header located at offset 0 of a COW image file.
 *
 * The integer fields are kept big-endian in the file: the driver converts
 * them with be32_to_cpu()/be64_to_cpu() when opening an image and with
 * cpu_to_be32()/cpu_to_be64() when creating one.
 */
struct cow_header_v2 {
    uint32_t magic;          /* COW_MAGIC */
    uint32_t version;        /* COW_VERSION */
    char backing_file[1024]; /* name of the backing image, all zeroes if none */
    int32_t mtime;           /* mtime of the backing file, 0 if unknown */
    uint64_t size;           /* virtual disk size in bytes */
    uint32_t sectorsize;     /* cow_create() always writes 512 */
};
43
44typedef struct BDRVCowState {
848c66e8 45 CoMutex lock;
ea2384d3
FB
46 int64_t cow_sectors_offset;
47} BDRVCowState;
48
49static int cow_probe(const uint8_t *buf, int buf_size, const char *filename)
50{
51 const struct cow_header_v2 *cow_header = (const void *)buf;
52
712e7874
FB
53 if (buf_size >= sizeof(struct cow_header_v2) &&
54 be32_to_cpu(cow_header->magic) == COW_MAGIC &&
5fafdf24 55 be32_to_cpu(cow_header->version) == COW_VERSION)
ea2384d3
FB
56 return 100;
57 else
58 return 0;
59}
60
1a86938f 61static int cow_open(BlockDriverState *bs, QDict *options, int flags)
ea2384d3
FB
62{
63 BDRVCowState *s = bs->opaque;
ea2384d3 64 struct cow_header_v2 cow_header;
893a9cb4 65 int bitmap_size;
ea2384d3 66 int64_t size;
16d2fc00 67 int ret;
ea2384d3 68
ea2384d3 69 /* see if it is a cow image */
16d2fc00
LZH
70 ret = bdrv_pread(bs->file, 0, &cow_header, sizeof(cow_header));
71 if (ret < 0) {
72 goto fail;
73 }
74
75 if (be32_to_cpu(cow_header.magic) != COW_MAGIC) {
15bac0d5 76 ret = -EMEDIUMTYPE;
ea2384d3
FB
77 goto fail;
78 }
79
16d2fc00
LZH
80 if (be32_to_cpu(cow_header.version) != COW_VERSION) {
81 char version[64];
82 snprintf(version, sizeof(version),
83 "COW version %d", cow_header.version);
84 qerror_report(QERR_UNKNOWN_BLOCK_FORMAT_FEATURE,
85 bs->device_name, "cow", version);
86 ret = -ENOTSUP;
ea2384d3
FB
87 goto fail;
88 }
3b46e624 89
ea2384d3
FB
90 /* cow image found */
91 size = be64_to_cpu(cow_header.size);
92 bs->total_sectors = size / 512;
93
5fafdf24 94 pstrcpy(bs->backing_file, sizeof(bs->backing_file),
ea2384d3 95 cow_header.backing_file);
3b46e624 96
893a9cb4
CH
97 bitmap_size = ((bs->total_sectors + 7) >> 3) + sizeof(cow_header);
98 s->cow_sectors_offset = (bitmap_size + 511) & ~511;
848c66e8 99 qemu_co_mutex_init(&s->lock);
ea2384d3
FB
100 return 0;
101 fail:
16d2fc00 102 return ret;
ea2384d3
FB
103}
104
/*
 * XXX(hch): right now these functions are extremely inefficient.
 * We should just read the whole bitmap we'll need in one go instead.
 */
26ae9804 109static inline int cow_set_bit(BlockDriverState *bs, int64_t bitnum, bool *first)
ea2384d3 110{
893a9cb4
CH
111 uint64_t offset = sizeof(struct cow_header_v2) + bitnum / 8;
112 uint8_t bitmap;
b0ad5a45 113 int ret;
893a9cb4 114
b0ad5a45
KW
115 ret = bdrv_pread(bs->file, offset, &bitmap, sizeof(bitmap));
116 if (ret < 0) {
117 return ret;
893a9cb4
CH
118 }
119
26ae9804
PB
120 if (bitmap & (1 << (bitnum % 8))) {
121 return 0;
122 }
123
124 if (*first) {
125 ret = bdrv_flush(bs->file);
126 if (ret < 0) {
127 return ret;
128 }
129 *first = false;
130 }
131
893a9cb4
CH
132 bitmap |= (1 << (bitnum % 8));
133
26ae9804 134 ret = bdrv_pwrite(bs->file, offset, &bitmap, sizeof(bitmap));
b0ad5a45
KW
135 if (ret < 0) {
136 return ret;
893a9cb4
CH
137 }
138 return 0;
ea2384d3
FB
139}
140
276cbc7f
PB
/* Number of allocation bits contained in one 512-byte piece of the bitmap. */
#define BITS_PER_BITMAP_SECTOR (512 * 8)

/*
 * Return 1 if bit bitnum of bitmap is set, 0 otherwise.  Bit 0 is the least
 * significant bit of bitmap[0].
 *
 * Cannot use bitmap.c on big-endian machines.
 */
static int cow_test_bit(int64_t bitnum, const uint8_t *bitmap)
{
    return (bitmap[bitnum / 8] & (1 << (bitnum & 7))) != 0;
}

/*
 * Count the consecutive bits in bitmap, beginning at bit start, whose state
 * equals value (0 or 1).
 *
 * bitmap is one BITS_PER_BITMAP_SECTOR-bit piece of the allocation bitmap
 * and start is expected to lie inside it.  The scan stops at the first bit
 * with a different state, after nb_sectors bits, or at the end of the
 * piece, whichever comes first.  Returns the number of matching bits.
 */
static int cow_find_streak(const uint8_t *bitmap, int value, int start, int nb_sectors)
{
    int streak_value = value ? 0xFF : 0;
    int bitnum = start;
    int last;

    /*
     * Clamp the end of the scan to the piece without ever evaluating
     * start + nb_sectors for a large nb_sectors: that addition overflows
     * (undefined behaviour) when the caller asks for close to INT_MAX
     * sectors.
     */
    if (nb_sectors < BITS_PER_BITMAP_SECTOR - start) {
        last = start + nb_sectors;
    } else {
        last = BITS_PER_BITMAP_SECTOR;
    }

    while (bitnum < last) {
        /* Fast path: a whole byte in the wanted state, skip 8 bits at once. */
        if ((bitnum & 7) == 0 && bitmap[bitnum / 8] == streak_value) {
            bitnum += 8;
            continue;
        }
        if (cow_test_bit(bitnum, bitmap) == value) {
            bitnum++;
            continue;
        }
        break;
    }

    /* The byte-wise fast path may have stepped past last. */
    return (bitnum < last ? bitnum : last) - start;
}
ea2384d3
FB
167
168/* Return true if first block has been changed (ie. current version is
169 * in COW file). Set the number of continuous blocks for which that
170 * is true. */
81145834
SH
171static int coroutine_fn cow_co_is_allocated(BlockDriverState *bs,
172 int64_t sector_num, int nb_sectors, int *num_same)
ea2384d3 173{
276cbc7f
PB
174 int64_t bitnum = sector_num + sizeof(struct cow_header_v2) * 8;
175 uint64_t offset = (bitnum / 8) & -BDRV_SECTOR_SIZE;
176 uint8_t bitmap[BDRV_SECTOR_SIZE];
177 int ret;
ea2384d3
FB
178 int changed;
179
276cbc7f
PB
180 ret = bdrv_pread(bs->file, offset, &bitmap, sizeof(bitmap));
181 if (ret < 0) {
182 return ret;
ea2384d3
FB
183 }
184
276cbc7f
PB
185 bitnum &= BITS_PER_BITMAP_SECTOR - 1;
186 changed = cow_test_bit(bitnum, bitmap);
187 *num_same = cow_find_streak(bitmap, changed, bitnum, nb_sectors);
ea2384d3
FB
188 return changed;
189}
190
893a9cb4
CH
191static int cow_update_bitmap(BlockDriverState *bs, int64_t sector_num,
192 int nb_sectors)
ea2384d3 193{
893a9cb4
CH
194 int error = 0;
195 int i;
26ae9804 196 bool first = true;
893a9cb4
CH
197
198 for (i = 0; i < nb_sectors; i++) {
26ae9804 199 error = cow_set_bit(bs, sector_num + i, &first);
893a9cb4
CH
200 if (error) {
201 break;
202 }
203 }
204
205 return error;
ea2384d3
FB
206}
207
e94d1387
SH
208static int coroutine_fn cow_read(BlockDriverState *bs, int64_t sector_num,
209 uint8_t *buf, int nb_sectors)
ea2384d3
FB
210{
211 BDRVCowState *s = bs->opaque;
212 int ret, n;
3b46e624 213
ea2384d3 214 while (nb_sectors > 0) {
d663640c
PB
215 ret = cow_co_is_allocated(bs, sector_num, nb_sectors, &n);
216 if (ret < 0) {
217 return ret;
218 }
219 if (ret) {
2063392a
CH
220 ret = bdrv_pread(bs->file,
221 s->cow_sectors_offset + sector_num * 512,
222 buf, n * 512);
16d2fc00
LZH
223 if (ret < 0) {
224 return ret;
225 }
ea2384d3 226 } else {
83f64091
FB
227 if (bs->backing_hd) {
228 /* read from the base image */
229 ret = bdrv_read(bs->backing_hd, sector_num, buf, n);
16d2fc00
LZH
230 if (ret < 0) {
231 return ret;
232 }
83f64091 233 } else {
16d2fc00
LZH
234 memset(buf, 0, n * 512);
235 }
83f64091 236 }
ea2384d3
FB
237 nb_sectors -= n;
238 sector_num += n;
239 buf += n * 512;
240 }
241 return 0;
242}
243
2914caa0
PB
244static coroutine_fn int cow_co_read(BlockDriverState *bs, int64_t sector_num,
245 uint8_t *buf, int nb_sectors)
246{
247 int ret;
248 BDRVCowState *s = bs->opaque;
249 qemu_co_mutex_lock(&s->lock);
250 ret = cow_read(bs, sector_num, buf, nb_sectors);
251 qemu_co_mutex_unlock(&s->lock);
252 return ret;
253}
254
5fafdf24 255static int cow_write(BlockDriverState *bs, int64_t sector_num,
ea2384d3
FB
256 const uint8_t *buf, int nb_sectors)
257{
258 BDRVCowState *s = bs->opaque;
893a9cb4 259 int ret;
3b46e624 260
2063392a
CH
261 ret = bdrv_pwrite(bs->file, s->cow_sectors_offset + sector_num * 512,
262 buf, nb_sectors * 512);
16d2fc00
LZH
263 if (ret < 0) {
264 return ret;
265 }
893a9cb4
CH
266
267 return cow_update_bitmap(bs, sector_num, nb_sectors);
ea2384d3
FB
268}
269
e183ef75
PB
270static coroutine_fn int cow_co_write(BlockDriverState *bs, int64_t sector_num,
271 const uint8_t *buf, int nb_sectors)
272{
273 int ret;
274 BDRVCowState *s = bs->opaque;
275 qemu_co_mutex_lock(&s->lock);
276 ret = cow_write(bs, sector_num, buf, nb_sectors);
277 qemu_co_mutex_unlock(&s->lock);
278 return ret;
279}
280
e2731add 281static void cow_close(BlockDriverState *bs)
ea2384d3 282{
ea2384d3
FB
283}
284
0e7e1989 285static int cow_create(const char *filename, QEMUOptionParameter *options)
ea2384d3 286{
ea2384d3
FB
287 struct cow_header_v2 cow_header;
288 struct stat st;
0e7e1989
KW
289 int64_t image_sectors = 0;
290 const char *image_filename = NULL;
31f38120 291 int ret;
3535a9c6 292 BlockDriverState *cow_bs;
0e7e1989
KW
293
294 /* Read out options */
295 while (options && options->name) {
296 if (!strcmp(options->name, BLOCK_OPT_SIZE)) {
297 image_sectors = options->value.n / 512;
298 } else if (!strcmp(options->name, BLOCK_OPT_BACKING_FILE)) {
299 image_filename = options->value.s;
300 }
301 options++;
302 }
ea2384d3 303
3535a9c6
LZH
304 ret = bdrv_create_file(filename, options);
305 if (ret < 0) {
306 return ret;
307 }
308
787e4a85 309 ret = bdrv_file_open(&cow_bs, filename, NULL, BDRV_O_RDWR);
3535a9c6
LZH
310 if (ret < 0) {
311 return ret;
312 }
313
ea2384d3
FB
314 memset(&cow_header, 0, sizeof(cow_header));
315 cow_header.magic = cpu_to_be32(COW_MAGIC);
316 cow_header.version = cpu_to_be32(COW_VERSION);
317 if (image_filename) {
83f64091
FB
318 /* Note: if no file, we put a dummy mtime */
319 cow_header.mtime = cpu_to_be32(0);
320
3535a9c6 321 if (stat(image_filename, &st) != 0) {
83f64091 322 goto mtime_fail;
ea2384d3 323 }
ea2384d3 324 cow_header.mtime = cpu_to_be32(st.st_mtime);
83f64091
FB
325 mtime_fail:
326 pstrcpy(cow_header.backing_file, sizeof(cow_header.backing_file),
327 image_filename);
ea2384d3
FB
328 }
329 cow_header.sectorsize = cpu_to_be32(512);
330 cow_header.size = cpu_to_be64(image_sectors * 512);
3535a9c6 331 ret = bdrv_pwrite(cow_bs, 0, &cow_header, sizeof(cow_header));
16d2fc00 332 if (ret < 0) {
31f38120
KS
333 goto exit;
334 }
335
ea2384d3 336 /* resize to include at least all the bitmap */
3535a9c6
LZH
337 ret = bdrv_truncate(cow_bs,
338 sizeof(cow_header) + ((image_sectors + 7) >> 3));
16d2fc00 339 if (ret < 0) {
31f38120
KS
340 goto exit;
341 }
342
31f38120 343exit:
4f6fd349 344 bdrv_unref(cow_bs);
31f38120 345 return ret;
ea2384d3
FB
346}
347
0e7e1989 348static QEMUOptionParameter cow_create_options[] = {
db08adf5
KW
349 {
350 .name = BLOCK_OPT_SIZE,
351 .type = OPT_SIZE,
352 .help = "Virtual disk size"
353 },
354 {
355 .name = BLOCK_OPT_BACKING_FILE,
356 .type = OPT_STRING,
357 .help = "File name of a base image"
358 },
0e7e1989
KW
359 { NULL }
360};
361
5efa9d5a 362static BlockDriver bdrv_cow = {
c68b89ac
KW
363 .format_name = "cow",
364 .instance_size = sizeof(BDRVCowState),
365
366 .bdrv_probe = cow_probe,
367 .bdrv_open = cow_open,
368 .bdrv_close = cow_close,
369 .bdrv_create = cow_create,
3ac21627 370 .bdrv_has_zero_init = bdrv_has_zero_init_1,
c68b89ac
KW
371
372 .bdrv_read = cow_co_read,
373 .bdrv_write = cow_co_write,
81145834 374 .bdrv_co_is_allocated = cow_co_is_allocated,
0e7e1989
KW
375
376 .create_options = cow_create_options,
ea2384d3 377};
5efa9d5a
AL
378
379static void bdrv_cow_init(void)
380{
381 bdrv_register(&bdrv_cow);
382}
383
384block_init(bdrv_cow_init);