]> git.proxmox.com Git - qemu.git/blame - arch_init.c
migration: do not overwrite zero pages
[qemu.git] / arch_init.c
CommitLineData
ad96090a
BS
1/*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24#include <stdint.h>
25#include <stdarg.h>
b2e0a138 26#include <stdlib.h>
ad96090a 27#ifndef _WIN32
1c47cb16 28#include <sys/types.h>
ad96090a
BS
29#include <sys/mman.h>
30#endif
31#include "config.h"
83c9089e 32#include "monitor/monitor.h"
9c17d615 33#include "sysemu/sysemu.h"
1de7afc9
PB
34#include "qemu/bitops.h"
35#include "qemu/bitmap.h"
9c17d615 36#include "sysemu/arch_init.h"
ad96090a 37#include "audio/audio.h"
0d09e41a 38#include "hw/i386/pc.h"
a2cb15b0 39#include "hw/pci/pci.h"
0d09e41a 40#include "hw/audio/audio.h"
9c17d615 41#include "sysemu/kvm.h"
caf71f86 42#include "migration/migration.h"
0d09e41a 43#include "hw/i386/smbios.h"
022c62cb 44#include "exec/address-spaces.h"
0d09e41a 45#include "hw/audio/pcspk.h"
caf71f86 46#include "migration/page_cache.h"
1de7afc9 47#include "qemu/config-file.h"
99afc91d 48#include "qmp-commands.h"
3c12193d 49#include "trace.h"
0d6d3c87 50#include "exec/cpu-all.h"
0445259b 51#include "hw/acpi/acpi.h"
ad96090a 52
3a697f69
OW
53#ifdef DEBUG_ARCH_INIT
54#define DPRINTF(fmt, ...) \
55 do { fprintf(stdout, "arch_init: " fmt, ## __VA_ARGS__); } while (0)
56#else
57#define DPRINTF(fmt, ...) \
58 do { } while (0)
59#endif
60
ad96090a
BS
61#ifdef TARGET_SPARC
62int graphic_width = 1024;
63int graphic_height = 768;
64int graphic_depth = 8;
65#else
66int graphic_width = 800;
67int graphic_height = 600;
68int graphic_depth = 15;
69#endif
70
ad96090a
BS
71
72#if defined(TARGET_ALPHA)
73#define QEMU_ARCH QEMU_ARCH_ALPHA
74#elif defined(TARGET_ARM)
75#define QEMU_ARCH QEMU_ARCH_ARM
76#elif defined(TARGET_CRIS)
77#define QEMU_ARCH QEMU_ARCH_CRIS
78#elif defined(TARGET_I386)
79#define QEMU_ARCH QEMU_ARCH_I386
80#elif defined(TARGET_M68K)
81#define QEMU_ARCH QEMU_ARCH_M68K
81ea0e13
MW
82#elif defined(TARGET_LM32)
83#define QEMU_ARCH QEMU_ARCH_LM32
ad96090a
BS
84#elif defined(TARGET_MICROBLAZE)
85#define QEMU_ARCH QEMU_ARCH_MICROBLAZE
86#elif defined(TARGET_MIPS)
87#define QEMU_ARCH QEMU_ARCH_MIPS
d15a9c23
AG
88#elif defined(TARGET_MOXIE)
89#define QEMU_ARCH QEMU_ARCH_MOXIE
e67db06e
JL
90#elif defined(TARGET_OPENRISC)
91#define QEMU_ARCH QEMU_ARCH_OPENRISC
ad96090a
BS
92#elif defined(TARGET_PPC)
93#define QEMU_ARCH QEMU_ARCH_PPC
94#elif defined(TARGET_S390X)
95#define QEMU_ARCH QEMU_ARCH_S390X
96#elif defined(TARGET_SH4)
97#define QEMU_ARCH QEMU_ARCH_SH4
98#elif defined(TARGET_SPARC)
99#define QEMU_ARCH QEMU_ARCH_SPARC
2328826b
MF
100#elif defined(TARGET_XTENSA)
101#define QEMU_ARCH QEMU_ARCH_XTENSA
4f23a1e6
GX
102#elif defined(TARGET_UNICORE32)
103#define QEMU_ARCH QEMU_ARCH_UNICORE32
ad96090a
BS
104#endif
105
106const uint32_t arch_type = QEMU_ARCH;
107
108/***********************************************************/
109/* ram save/restore */
110
d20878d2
YT
111#define RAM_SAVE_FLAG_FULL 0x01 /* Obsolete, not used anymore */
112#define RAM_SAVE_FLAG_COMPRESS 0x02
113#define RAM_SAVE_FLAG_MEM_SIZE 0x04
114#define RAM_SAVE_FLAG_PAGE 0x08
115#define RAM_SAVE_FLAG_EOS 0x10
116#define RAM_SAVE_FLAG_CONTINUE 0x20
17ad9b35 117#define RAM_SAVE_FLAG_XBZRLE 0x40
ad96090a 118
b5a8fe5e 119
756557de
EH
120static struct defconfig_file {
121 const char *filename;
f29a5614
EH
122 /* Indicates it is an user config file (disabled by -no-user-config) */
123 bool userconfig;
756557de 124} default_config_files[] = {
f29a5614 125 { CONFIG_QEMU_CONFDIR "/qemu.conf", true },
2e59915d 126 { CONFIG_QEMU_CONFDIR "/target-" TARGET_NAME ".conf", true },
756557de
EH
127 { NULL }, /* end of list */
128};
129
130
f29a5614 131int qemu_read_default_config_files(bool userconfig)
b5a8fe5e
EH
132{
133 int ret;
756557de 134 struct defconfig_file *f;
b5a8fe5e 135
756557de 136 for (f = default_config_files; f->filename; f++) {
f29a5614
EH
137 if (!userconfig && f->userconfig) {
138 continue;
139 }
756557de
EH
140 ret = qemu_read_config_file(f->filename);
141 if (ret < 0 && ret != -ENOENT) {
142 return ret;
143 }
b5a8fe5e 144 }
4d8b3c63 145
b5a8fe5e
EH
146 return 0;
147}
148
3edcd7e6 149static inline bool is_zero_page(uint8_t *p)
ad96090a 150{
3edcd7e6
PL
151 return buffer_find_nonzero_offset(p, TARGET_PAGE_SIZE) ==
152 TARGET_PAGE_SIZE;
ad96090a
BS
153}
154
17ad9b35
OW
155/* struct contains XBZRLE cache and a static page
156 used by the compression */
157static struct {
158 /* buffer used for XBZRLE encoding */
159 uint8_t *encoded_buf;
160 /* buffer for storing page content */
161 uint8_t *current_buf;
162 /* buffer used for XBZRLE decoding */
163 uint8_t *decoded_buf;
164 /* Cache for XBZRLE */
165 PageCache *cache;
166} XBZRLE = {
167 .encoded_buf = NULL,
168 .current_buf = NULL,
169 .decoded_buf = NULL,
170 .cache = NULL,
171};
172
9e1ba4cc
OW
173
174int64_t xbzrle_cache_resize(int64_t new_size)
175{
176 if (XBZRLE.cache != NULL) {
177 return cache_resize(XBZRLE.cache, new_size / TARGET_PAGE_SIZE) *
178 TARGET_PAGE_SIZE;
179 }
180 return pow2floor(new_size);
181}
182
004d4c10
OW
/* Counters backing the migration statistics accessors below */
typedef struct AccountingInfo AccountingInfo;

struct AccountingInfo {
    uint64_t dup_pages;         /* bumped for each zero page sent */
    uint64_t skipped_pages;
    uint64_t norm_pages;        /* bumped for each page sent in full */
    uint64_t iterations;        /* bumped per page sent by ram_save_iterate */
    uint64_t xbzrle_bytes;      /* bytes written for XBZRLE-encoded pages */
    uint64_t xbzrle_pages;      /* pages sent XBZRLE-encoded */
    uint64_t xbzrle_cache_miss; /* pages not found in the XBZRLE cache */
    uint64_t xbzrle_overflows;  /* pages whose encoding overflowed */
};

static AccountingInfo acct_info;
196
197static void acct_clear(void)
198{
199 memset(&acct_info, 0, sizeof(acct_info));
200}
201
202uint64_t dup_mig_bytes_transferred(void)
203{
204 return acct_info.dup_pages * TARGET_PAGE_SIZE;
205}
206
207uint64_t dup_mig_pages_transferred(void)
208{
209 return acct_info.dup_pages;
210}
211
f1c72795
PL
212uint64_t skipped_mig_bytes_transferred(void)
213{
214 return acct_info.skipped_pages * TARGET_PAGE_SIZE;
215}
216
217uint64_t skipped_mig_pages_transferred(void)
218{
219 return acct_info.skipped_pages;
220}
221
004d4c10
OW
222uint64_t norm_mig_bytes_transferred(void)
223{
224 return acct_info.norm_pages * TARGET_PAGE_SIZE;
225}
226
227uint64_t norm_mig_pages_transferred(void)
228{
229 return acct_info.norm_pages;
230}
231
f36d55af
OW
232uint64_t xbzrle_mig_bytes_transferred(void)
233{
234 return acct_info.xbzrle_bytes;
235}
236
237uint64_t xbzrle_mig_pages_transferred(void)
238{
239 return acct_info.xbzrle_pages;
240}
241
242uint64_t xbzrle_mig_pages_cache_miss(void)
243{
244 return acct_info.xbzrle_cache_miss;
245}
246
247uint64_t xbzrle_mig_pages_overflow(void)
248{
249 return acct_info.xbzrle_overflows;
250}
251
3f7d7b09
JQ
252static size_t save_block_hdr(QEMUFile *f, RAMBlock *block, ram_addr_t offset,
253 int cont, int flag)
0c51f43d 254{
3f7d7b09
JQ
255 size_t size;
256
257 qemu_put_be64(f, offset | cont | flag);
258 size = 8;
0c51f43d 259
3f7d7b09
JQ
260 if (!cont) {
261 qemu_put_byte(f, strlen(block->idstr));
262 qemu_put_buffer(f, (uint8_t *)block->idstr,
263 strlen(block->idstr));
264 size += 1 + strlen(block->idstr);
265 }
266 return size;
0c51f43d
OW
267}
268
17ad9b35
OW
269#define ENCODING_FLAG_XBZRLE 0x1
270
271static int save_xbzrle_page(QEMUFile *f, uint8_t *current_data,
272 ram_addr_t current_addr, RAMBlock *block,
dd051c72 273 ram_addr_t offset, int cont, bool last_stage)
17ad9b35
OW
274{
275 int encoded_len = 0, bytes_sent = -1;
276 uint8_t *prev_cached_page;
277
278 if (!cache_is_cached(XBZRLE.cache, current_addr)) {
dd051c72 279 if (!last_stage) {
ee0b44aa 280 cache_insert(XBZRLE.cache, current_addr, current_data);
dd051c72 281 }
f36d55af 282 acct_info.xbzrle_cache_miss++;
17ad9b35
OW
283 return -1;
284 }
285
286 prev_cached_page = get_cached_data(XBZRLE.cache, current_addr);
287
288 /* save current buffer into memory */
289 memcpy(XBZRLE.current_buf, current_data, TARGET_PAGE_SIZE);
290
291 /* XBZRLE encoding (if there is no overflow) */
292 encoded_len = xbzrle_encode_buffer(prev_cached_page, XBZRLE.current_buf,
293 TARGET_PAGE_SIZE, XBZRLE.encoded_buf,
294 TARGET_PAGE_SIZE);
295 if (encoded_len == 0) {
296 DPRINTF("Skipping unmodified page\n");
297 return 0;
298 } else if (encoded_len == -1) {
299 DPRINTF("Overflow\n");
f36d55af 300 acct_info.xbzrle_overflows++;
17ad9b35
OW
301 /* update data in the cache */
302 memcpy(prev_cached_page, current_data, TARGET_PAGE_SIZE);
303 return -1;
304 }
305
306 /* we need to update the data in the cache, in order to get the same data */
dd051c72
JQ
307 if (!last_stage) {
308 memcpy(prev_cached_page, XBZRLE.current_buf, TARGET_PAGE_SIZE);
309 }
17ad9b35
OW
310
311 /* Send XBZRLE based compressed page */
3f7d7b09 312 bytes_sent = save_block_hdr(f, block, offset, cont, RAM_SAVE_FLAG_XBZRLE);
17ad9b35
OW
313 qemu_put_byte(f, ENCODING_FLAG_XBZRLE);
314 qemu_put_be16(f, encoded_len);
315 qemu_put_buffer(f, XBZRLE.encoded_buf, encoded_len);
3f7d7b09 316 bytes_sent += encoded_len + 1 + 2;
f36d55af
OW
317 acct_info.xbzrle_pages++;
318 acct_info.xbzrle_bytes += bytes_sent;
17ad9b35
OW
319
320 return bytes_sent;
321}
322
b23a9a5c
JQ
323
/* This is the last block that we have visited searching for dirty pages
 */
326static RAMBlock *last_seen_block;
5f718a15
JQ
327/* This is the last block from where we have sent data */
328static RAMBlock *last_sent_block;
760e77ea 329static ram_addr_t last_offset;
c6bf8e0e
JQ
330static unsigned long *migration_bitmap;
331static uint64_t migration_dirty_pages;
f798b07f 332static uint32_t last_version;
78d07ae7 333static bool ram_bulk_stage;
760e77ea 334
4c8ae0f6
JQ
335static inline
336ram_addr_t migration_bitmap_find_and_reset_dirty(MemoryRegion *mr,
337 ram_addr_t start)
69268cde 338{
4c8ae0f6
JQ
339 unsigned long base = mr->ram_addr >> TARGET_PAGE_BITS;
340 unsigned long nr = base + (start >> TARGET_PAGE_BITS);
341 unsigned long size = base + (int128_get64(mr->size) >> TARGET_PAGE_BITS);
c6bf8e0e 342
70c8652b
PL
343 unsigned long next;
344
345 if (ram_bulk_stage && nr > base) {
346 next = nr + 1;
347 } else {
348 next = find_next_bit(migration_bitmap, size, nr);
349 }
69268cde 350
4c8ae0f6
JQ
351 if (next < size) {
352 clear_bit(next, migration_bitmap);
c6bf8e0e 353 migration_dirty_pages--;
69268cde 354 }
4c8ae0f6 355 return (next - base) << TARGET_PAGE_BITS;
69268cde
JQ
356}
357
c6bf8e0e
JQ
358static inline bool migration_bitmap_set_dirty(MemoryRegion *mr,
359 ram_addr_t offset)
e44d26c8 360{
c6bf8e0e
JQ
361 bool ret;
362 int nr = (mr->ram_addr + offset) >> TARGET_PAGE_BITS;
e44d26c8 363
c6bf8e0e
JQ
364 ret = test_and_set_bit(nr, migration_bitmap);
365
366 if (!ret) {
367 migration_dirty_pages++;
e44d26c8 368 }
c6bf8e0e 369 return ret;
e44d26c8
JQ
370}
371
32c835ba
PB
372/* Needs iothread lock! */
373
dd2df737
JQ
374static void migration_bitmap_sync(void)
375{
c6bf8e0e
JQ
376 RAMBlock *block;
377 ram_addr_t addr;
378 uint64_t num_dirty_pages_init = migration_dirty_pages;
8d017193
JQ
379 MigrationState *s = migrate_get_current();
380 static int64_t start_time;
381 static int64_t num_dirty_pages_period;
382 int64_t end_time;
383
384 if (!start_time) {
385 start_time = qemu_get_clock_ms(rt_clock);
386 }
3c12193d
JQ
387
388 trace_migration_bitmap_sync_start();
1d671369 389 address_space_sync_dirty_bitmap(&address_space_memory);
c6bf8e0e 390
a3161038 391 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
c6bf8e0e 392 for (addr = 0; addr < block->length; addr += TARGET_PAGE_SIZE) {
ece79318
JQ
393 if (memory_region_test_and_clear_dirty(block->mr,
394 addr, TARGET_PAGE_SIZE,
395 DIRTY_MEMORY_MIGRATION)) {
c6bf8e0e
JQ
396 migration_bitmap_set_dirty(block->mr, addr);
397 }
398 }
c6bf8e0e
JQ
399 }
400 trace_migration_bitmap_sync_end(migration_dirty_pages
3c12193d 401 - num_dirty_pages_init);
8d017193
JQ
402 num_dirty_pages_period += migration_dirty_pages - num_dirty_pages_init;
403 end_time = qemu_get_clock_ms(rt_clock);
404
405 /* more than 1 second = 1000 millisecons */
406 if (end_time > start_time + 1000) {
407 s->dirty_pages_rate = num_dirty_pages_period * 1000
408 / (end_time - start_time);
90f8ae72 409 s->dirty_bytes_rate = s->dirty_pages_rate * TARGET_PAGE_SIZE;
8d017193
JQ
410 start_time = end_time;
411 num_dirty_pages_period = 0;
412 }
dd2df737
JQ
413}
414
6c779f22
OW
415/*
416 * ram_save_block: Writes a page of memory to the stream f
417 *
b823ceaa
JQ
418 * Returns: The number of bytes written.
419 * 0 means no dirty pages
6c779f22
OW
420 */
421
dd051c72 422static int ram_save_block(QEMUFile *f, bool last_stage)
ad96090a 423{
b23a9a5c 424 RAMBlock *block = last_seen_block;
e44359c3 425 ram_addr_t offset = last_offset;
4c8ae0f6 426 bool complete_round = false;
b823ceaa 427 int bytes_sent = 0;
71c510e2 428 MemoryRegion *mr;
17ad9b35 429 ram_addr_t current_addr;
ad96090a 430
e44359c3 431 if (!block)
a3161038 432 block = QTAILQ_FIRST(&ram_list.blocks);
e44359c3 433
4c8ae0f6 434 while (true) {
71c510e2 435 mr = block->mr;
4c8ae0f6
JQ
436 offset = migration_bitmap_find_and_reset_dirty(mr, offset);
437 if (complete_round && block == last_seen_block &&
438 offset >= last_offset) {
439 break;
440 }
441 if (offset >= block->length) {
442 offset = 0;
443 block = QTAILQ_NEXT(block, next);
444 if (!block) {
445 block = QTAILQ_FIRST(&ram_list.blocks);
446 complete_round = true;
78d07ae7 447 ram_bulk_stage = false;
4c8ae0f6
JQ
448 }
449 } else {
ad96090a 450 uint8_t *p;
5f718a15 451 int cont = (block == last_sent_block) ?
b23a9a5c 452 RAM_SAVE_FLAG_CONTINUE : 0;
ad96090a 453
71c510e2 454 p = memory_region_get_ram_ptr(mr) + offset;
ad96090a 455
b823ceaa
JQ
456 /* In doubt sent page as normal */
457 bytes_sent = -1;
3edcd7e6 458 if (is_zero_page(p)) {
004d4c10 459 acct_info.dup_pages++;
9ef051e5
PL
460 bytes_sent = save_block_hdr(f, block, offset, cont,
461 RAM_SAVE_FLAG_COMPRESS);
462 qemu_put_byte(f, 0);
463 bytes_sent++;
5cc11c46 464 } else if (!ram_bulk_stage && migrate_use_xbzrle()) {
17ad9b35
OW
465 current_addr = block->offset + offset;
466 bytes_sent = save_xbzrle_page(f, p, current_addr, block,
dd051c72
JQ
467 offset, cont, last_stage);
468 if (!last_stage) {
469 p = get_cached_data(XBZRLE.cache, current_addr);
470 }
17ad9b35
OW
471 }
472
b823ceaa 473 /* XBZRLE overflow or normal page */
17ad9b35 474 if (bytes_sent == -1) {
3f7d7b09 475 bytes_sent = save_block_hdr(f, block, offset, cont, RAM_SAVE_FLAG_PAGE);
500f0061 476 qemu_put_buffer_async(f, p, TARGET_PAGE_SIZE);
3f7d7b09 477 bytes_sent += TARGET_PAGE_SIZE;
004d4c10 478 acct_info.norm_pages++;
ad96090a
BS
479 }
480
17ad9b35 481 /* if page is unmodified, continue to the next */
b823ceaa 482 if (bytes_sent > 0) {
5f718a15 483 last_sent_block = block;
17ad9b35
OW
484 break;
485 }
ad96090a 486 }
4c8ae0f6 487 }
b23a9a5c 488 last_seen_block = block;
e44359c3 489 last_offset = offset;
ad96090a 490
3fc250b4 491 return bytes_sent;
ad96090a
BS
492}
493
494static uint64_t bytes_transferred;
495
496static ram_addr_t ram_save_remaining(void)
497{
c6bf8e0e 498 return migration_dirty_pages;
ad96090a
BS
499}
500
501uint64_t ram_bytes_remaining(void)
502{
503 return ram_save_remaining() * TARGET_PAGE_SIZE;
504}
505
506uint64_t ram_bytes_transferred(void)
507{
508 return bytes_transferred;
509}
510
511uint64_t ram_bytes_total(void)
512{
d17b5288
AW
513 RAMBlock *block;
514 uint64_t total = 0;
515
a3161038 516 QTAILQ_FOREACH(block, &ram_list.blocks, next)
d17b5288
AW
517 total += block->length;
518
519 return total;
ad96090a
BS
520}
521
8e21cd32
OW
522static void migration_end(void)
523{
244eaa75
PB
524 if (migration_bitmap) {
525 memory_global_dirty_log_stop();
526 g_free(migration_bitmap);
527 migration_bitmap = NULL;
528 }
17ad9b35 529
244eaa75 530 if (XBZRLE.cache) {
17ad9b35
OW
531 cache_fini(XBZRLE.cache);
532 g_free(XBZRLE.cache);
533 g_free(XBZRLE.encoded_buf);
534 g_free(XBZRLE.current_buf);
535 g_free(XBZRLE.decoded_buf);
536 XBZRLE.cache = NULL;
537 }
8e21cd32
OW
538}
539
9b5bfab0
JQ
/* .cancel handler: releases the migration state; @opaque is not used. */
static void ram_migration_cancel(void *opaque)
{
    (void)opaque;
    migration_end();
}
544
5a170775
JQ
545static void reset_ram_globals(void)
546{
b23a9a5c 547 last_seen_block = NULL;
5f718a15 548 last_sent_block = NULL;
5a170775 549 last_offset = 0;
f798b07f 550 last_version = ram_list.version;
78d07ae7 551 ram_bulk_stage = true;
5a170775
JQ
552}
553
4508bd9e
JQ
554#define MAX_WAIT 50 /* ms, half buffered_file limit */
555
d1315aac 556static int ram_save_setup(QEMUFile *f, void *opaque)
ad96090a 557{
d1315aac 558 RAMBlock *block;
c6bf8e0e
JQ
559 int64_t ram_pages = last_ram_offset() >> TARGET_PAGE_BITS;
560
561 migration_bitmap = bitmap_new(ram_pages);
7ec81e56 562 bitmap_set(migration_bitmap, 0, ram_pages);
c6bf8e0e 563 migration_dirty_pages = ram_pages;
ad96090a 564
17ad9b35
OW
565 if (migrate_use_xbzrle()) {
566 XBZRLE.cache = cache_init(migrate_xbzrle_cache_size() /
567 TARGET_PAGE_SIZE,
568 TARGET_PAGE_SIZE);
569 if (!XBZRLE.cache) {
570 DPRINTF("Error creating cache\n");
571 return -1;
572 }
573 XBZRLE.encoded_buf = g_malloc0(TARGET_PAGE_SIZE);
574 XBZRLE.current_buf = g_malloc(TARGET_PAGE_SIZE);
004d4c10 575 acct_clear();
17ad9b35
OW
576 }
577
9b095037
PB
578 qemu_mutex_lock_iothread();
579 qemu_mutex_lock_ramlist();
580 bytes_transferred = 0;
581 reset_ram_globals();
582
d1315aac 583 memory_global_dirty_log_start();
c6bf8e0e 584 migration_bitmap_sync();
9b095037 585 qemu_mutex_unlock_iothread();
ad96090a 586
d1315aac 587 qemu_put_be64(f, ram_bytes_total() | RAM_SAVE_FLAG_MEM_SIZE);
97ab12d4 588
a3161038 589 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
d1315aac
JQ
590 qemu_put_byte(f, strlen(block->idstr));
591 qemu_put_buffer(f, (uint8_t *)block->idstr, strlen(block->idstr));
592 qemu_put_be64(f, block->length);
ad96090a
BS
593 }
594
b2a8658e 595 qemu_mutex_unlock_ramlist();
d1315aac
JQ
596 qemu_put_be64(f, RAM_SAVE_FLAG_EOS);
597
598 return 0;
599}
600
16310a3c 601static int ram_save_iterate(QEMUFile *f, void *opaque)
d1315aac 602{
d1315aac
JQ
603 int ret;
604 int i;
e4ed1541 605 int64_t t0;
b823ceaa 606 int total_sent = 0;
d1315aac 607
b2a8658e
UD
608 qemu_mutex_lock_ramlist();
609
f798b07f
UD
610 if (ram_list.version != last_version) {
611 reset_ram_globals();
612 }
613
e4ed1541 614 t0 = qemu_get_clock_ns(rt_clock);
4508bd9e 615 i = 0;
2975725f 616 while ((ret = qemu_file_rate_limit(f)) == 0) {
3fc250b4 617 int bytes_sent;
ad96090a 618
dd051c72 619 bytes_sent = ram_save_block(f, false);
6c779f22 620 /* no more blocks to sent */
b823ceaa 621 if (bytes_sent == 0) {
ad96090a
BS
622 break;
623 }
b823ceaa 624 total_sent += bytes_sent;
004d4c10 625 acct_info.iterations++;
4508bd9e
JQ
626 /* we want to check in the 1st loop, just in case it was the 1st time
627 and we had to sync the dirty bitmap.
628 qemu_get_clock_ns() is a bit expensive, so we only check each some
629 iterations
630 */
631 if ((i & 63) == 0) {
e4ed1541 632 uint64_t t1 = (qemu_get_clock_ns(rt_clock) - t0) / 1000000;
4508bd9e 633 if (t1 > MAX_WAIT) {
ef37a699 634 DPRINTF("big wait: %" PRIu64 " milliseconds, %d iterations\n",
4508bd9e
JQ
635 t1, i);
636 break;
637 }
638 }
639 i++;
ad96090a
BS
640 }
641
fb3409de
PB
642 qemu_mutex_unlock_ramlist();
643
2975725f 644 if (ret < 0) {
b823ceaa 645 bytes_transferred += total_sent;
2975725f
JQ
646 return ret;
647 }
648
16310a3c 649 qemu_put_be64(f, RAM_SAVE_FLAG_EOS);
b823ceaa
JQ
650 total_sent += 8;
651 bytes_transferred += total_sent;
16310a3c 652
b823ceaa 653 return total_sent;
16310a3c
JQ
654}
655
656static int ram_save_complete(QEMUFile *f, void *opaque)
657{
b2a8658e 658 qemu_mutex_lock_ramlist();
9c339485 659 migration_bitmap_sync();
b2a8658e 660
ad96090a 661 /* try transferring iterative blocks of memory */
3a697f69 662
16310a3c 663 /* flush all remaining blocks regardless of rate limiting */
6c779f22 664 while (true) {
3fc250b4
PR
665 int bytes_sent;
666
dd051c72 667 bytes_sent = ram_save_block(f, true);
6c779f22 668 /* no more blocks to sent */
b823ceaa 669 if (bytes_sent == 0) {
6c779f22 670 break;
ad96090a 671 }
16310a3c 672 bytes_transferred += bytes_sent;
ad96090a 673 }
244eaa75 674 migration_end();
ad96090a 675
b2a8658e 676 qemu_mutex_unlock_ramlist();
ad96090a
BS
677 qemu_put_be64(f, RAM_SAVE_FLAG_EOS);
678
5b3c9638 679 return 0;
ad96090a
BS
680}
681
e4ed1541
JQ
682static uint64_t ram_save_pending(QEMUFile *f, void *opaque, uint64_t max_size)
683{
684 uint64_t remaining_size;
685
686 remaining_size = ram_save_remaining() * TARGET_PAGE_SIZE;
687
688 if (remaining_size < max_size) {
32c835ba 689 qemu_mutex_lock_iothread();
e4ed1541 690 migration_bitmap_sync();
32c835ba 691 qemu_mutex_unlock_iothread();
e4ed1541
JQ
692 remaining_size = ram_save_remaining() * TARGET_PAGE_SIZE;
693 }
694 return remaining_size;
695}
696
17ad9b35
OW
697static int load_xbzrle(QEMUFile *f, ram_addr_t addr, void *host)
698{
699 int ret, rc = 0;
700 unsigned int xh_len;
701 int xh_flags;
702
703 if (!XBZRLE.decoded_buf) {
704 XBZRLE.decoded_buf = g_malloc(TARGET_PAGE_SIZE);
705 }
706
707 /* extract RLE header */
708 xh_flags = qemu_get_byte(f);
709 xh_len = qemu_get_be16(f);
710
711 if (xh_flags != ENCODING_FLAG_XBZRLE) {
712 fprintf(stderr, "Failed to load XBZRLE page - wrong compression!\n");
713 return -1;
714 }
715
716 if (xh_len > TARGET_PAGE_SIZE) {
717 fprintf(stderr, "Failed to load XBZRLE page - len overflow!\n");
718 return -1;
719 }
720 /* load data and decode */
721 qemu_get_buffer(f, XBZRLE.decoded_buf, xh_len);
722
723 /* decode RLE */
724 ret = xbzrle_decode_buffer(XBZRLE.decoded_buf, xh_len, host,
725 TARGET_PAGE_SIZE);
726 if (ret == -1) {
727 fprintf(stderr, "Failed to load XBZRLE page - decode error!\n");
728 rc = -1;
729 } else if (ret > TARGET_PAGE_SIZE) {
730 fprintf(stderr, "Failed to load XBZRLE page - size %d exceeds %d!\n",
731 ret, TARGET_PAGE_SIZE);
732 abort();
733 }
734
735 return rc;
736}
737
a55bbe31
AW
738static inline void *host_from_stream_offset(QEMUFile *f,
739 ram_addr_t offset,
740 int flags)
741{
742 static RAMBlock *block = NULL;
743 char id[256];
744 uint8_t len;
745
746 if (flags & RAM_SAVE_FLAG_CONTINUE) {
747 if (!block) {
748 fprintf(stderr, "Ack, bad migration stream!\n");
749 return NULL;
750 }
751
dc94a7ed 752 return memory_region_get_ram_ptr(block->mr) + offset;
a55bbe31
AW
753 }
754
755 len = qemu_get_byte(f);
756 qemu_get_buffer(f, (uint8_t *)id, len);
757 id[len] = 0;
758
a3161038 759 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
a55bbe31 760 if (!strncmp(id, block->idstr, sizeof(id)))
dc94a7ed 761 return memory_region_get_ram_ptr(block->mr) + offset;
a55bbe31
AW
762 }
763
764 fprintf(stderr, "Can't find block %s!\n", id);
765 return NULL;
766}
767
7908c78d 768static int ram_load(QEMUFile *f, void *opaque, int version_id)
ad96090a
BS
769{
770 ram_addr_t addr;
3a697f69 771 int flags, ret = 0;
42802d47 772 int error;
3a697f69
OW
773 static uint64_t seq_iter;
774
775 seq_iter++;
ad96090a 776
f09f2189 777 if (version_id < 4 || version_id > 4) {
ad96090a
BS
778 return -EINVAL;
779 }
780
781 do {
782 addr = qemu_get_be64(f);
783
784 flags = addr & ~TARGET_PAGE_MASK;
785 addr &= TARGET_PAGE_MASK;
786
787 if (flags & RAM_SAVE_FLAG_MEM_SIZE) {
f09f2189 788 if (version_id == 4) {
97ab12d4
AW
789 /* Synchronize RAM block list */
790 char id[256];
791 ram_addr_t length;
792 ram_addr_t total_ram_bytes = addr;
793
794 while (total_ram_bytes) {
795 RAMBlock *block;
796 uint8_t len;
797
798 len = qemu_get_byte(f);
799 qemu_get_buffer(f, (uint8_t *)id, len);
800 id[len] = 0;
801 length = qemu_get_be64(f);
802
a3161038 803 QTAILQ_FOREACH(block, &ram_list.blocks, next) {
97ab12d4 804 if (!strncmp(id, block->idstr, sizeof(id))) {
3a697f69 805 if (block->length != length) {
87d2f825
AL
806 fprintf(stderr, "Length mismatch: %s: %ld "
807 "in != " RAM_ADDR_FMT "\n", id, length,
808 block->length);
3a697f69
OW
809 ret = -EINVAL;
810 goto done;
811 }
97ab12d4
AW
812 break;
813 }
814 }
815
816 if (!block) {
fb787f81
AW
817 fprintf(stderr, "Unknown ramblock \"%s\", cannot "
818 "accept migration\n", id);
3a697f69
OW
819 ret = -EINVAL;
820 goto done;
97ab12d4
AW
821 }
822
823 total_ram_bytes -= length;
824 }
ad96090a
BS
825 }
826 }
827
828 if (flags & RAM_SAVE_FLAG_COMPRESS) {
97ab12d4
AW
829 void *host;
830 uint8_t ch;
831
f09f2189 832 host = host_from_stream_offset(f, addr, flags);
492fb99c
MT
833 if (!host) {
834 return -EINVAL;
835 }
97ab12d4 836
97ab12d4 837 ch = qemu_get_byte(f);
211ea740
PL
838 if (ch != 0 || !is_zero_page(host)) {
839 memset(host, ch, TARGET_PAGE_SIZE);
ad96090a 840#ifndef _WIN32
211ea740
PL
841 if (ch == 0 &&
842 (!kvm_enabled() || kvm_has_sync_mmu()) &&
843 getpagesize() <= TARGET_PAGE_SIZE) {
844 qemu_madvise(host, TARGET_PAGE_SIZE, QEMU_MADV_DONTNEED);
845 }
ad96090a 846#endif
211ea740 847 }
ad96090a 848 } else if (flags & RAM_SAVE_FLAG_PAGE) {
97ab12d4
AW
849 void *host;
850
f09f2189 851 host = host_from_stream_offset(f, addr, flags);
0ff1f9f5
OW
852 if (!host) {
853 return -EINVAL;
854 }
97ab12d4 855
97ab12d4 856 qemu_get_buffer(f, host, TARGET_PAGE_SIZE);
17ad9b35 857 } else if (flags & RAM_SAVE_FLAG_XBZRLE) {
17ad9b35
OW
858 void *host = host_from_stream_offset(f, addr, flags);
859 if (!host) {
860 return -EINVAL;
861 }
862
863 if (load_xbzrle(f, addr, host) < 0) {
864 ret = -EINVAL;
865 goto done;
866 }
ad96090a 867 }
42802d47
JQ
868 error = qemu_file_get_error(f);
869 if (error) {
3a697f69
OW
870 ret = error;
871 goto done;
ad96090a
BS
872 }
873 } while (!(flags & RAM_SAVE_FLAG_EOS));
874
3a697f69 875done:
ef37a699
IM
876 DPRINTF("Completed load of VM with exit code %d seq iteration "
877 "%" PRIu64 "\n", ret, seq_iter);
3a697f69 878 return ret;
ad96090a
BS
879}
880
7908c78d 881SaveVMHandlers savevm_ram_handlers = {
d1315aac 882 .save_live_setup = ram_save_setup,
16310a3c
JQ
883 .save_live_iterate = ram_save_iterate,
884 .save_live_complete = ram_save_complete,
e4ed1541 885 .save_live_pending = ram_save_pending,
7908c78d 886 .load_state = ram_load,
9b5bfab0 887 .cancel = ram_migration_cancel,
7908c78d
JQ
888};
889
0dfa5ef9
IY
890struct soundhw {
891 const char *name;
892 const char *descr;
893 int enabled;
894 int isa;
895 union {
4a0f031d 896 int (*init_isa) (ISABus *bus);
0dfa5ef9
IY
897 int (*init_pci) (PCIBus *bus);
898 } init;
899};
900
36cd6f6f
PB
901static struct soundhw soundhw[9];
902static int soundhw_count;
ad96090a 903
36cd6f6f
PB
904void isa_register_soundhw(const char *name, const char *descr,
905 int (*init_isa)(ISABus *bus))
906{
907 assert(soundhw_count < ARRAY_SIZE(soundhw) - 1);
908 soundhw[soundhw_count].name = name;
909 soundhw[soundhw_count].descr = descr;
910 soundhw[soundhw_count].isa = 1;
911 soundhw[soundhw_count].init.init_isa = init_isa;
912 soundhw_count++;
913}
ad96090a 914
36cd6f6f
PB
915void pci_register_soundhw(const char *name, const char *descr,
916 int (*init_pci)(PCIBus *bus))
917{
918 assert(soundhw_count < ARRAY_SIZE(soundhw) - 1);
919 soundhw[soundhw_count].name = name;
920 soundhw[soundhw_count].descr = descr;
921 soundhw[soundhw_count].isa = 0;
922 soundhw[soundhw_count].init.init_pci = init_pci;
923 soundhw_count++;
924}
ad96090a
BS
925
926void select_soundhw(const char *optarg)
927{
928 struct soundhw *c;
929
c8057f95 930 if (is_help_option(optarg)) {
ad96090a
BS
931 show_valid_cards:
932
36cd6f6f
PB
933 if (soundhw_count) {
934 printf("Valid sound card names (comma separated):\n");
935 for (c = soundhw; c->name; ++c) {
936 printf ("%-11s %s\n", c->name, c->descr);
937 }
938 printf("\n-soundhw all will enable all of the above\n");
939 } else {
940 printf("Machine has no user-selectable audio hardware "
941 "(it may or may not have always-present audio hardware).\n");
ad96090a 942 }
c8057f95 943 exit(!is_help_option(optarg));
ad96090a
BS
944 }
945 else {
946 size_t l;
947 const char *p;
948 char *e;
949 int bad_card = 0;
950
951 if (!strcmp(optarg, "all")) {
952 for (c = soundhw; c->name; ++c) {
953 c->enabled = 1;
954 }
955 return;
956 }
957
958 p = optarg;
959 while (*p) {
960 e = strchr(p, ',');
961 l = !e ? strlen(p) : (size_t) (e - p);
962
963 for (c = soundhw; c->name; ++c) {
964 if (!strncmp(c->name, p, l) && !c->name[l]) {
965 c->enabled = 1;
966 break;
967 }
968 }
969
970 if (!c->name) {
971 if (l > 80) {
972 fprintf(stderr,
973 "Unknown sound card name (too big to show)\n");
974 }
975 else {
976 fprintf(stderr, "Unknown sound card name `%.*s'\n",
977 (int) l, p);
978 }
979 bad_card = 1;
980 }
981 p += l + (e != NULL);
982 }
983
984 if (bad_card) {
985 goto show_valid_cards;
986 }
987 }
988}
0dfa5ef9 989
f81222bc 990void audio_init(void)
0dfa5ef9
IY
991{
992 struct soundhw *c;
f81222bc
PB
993 ISABus *isa_bus = (ISABus *) object_resolve_path_type("", TYPE_ISA_BUS, NULL);
994 PCIBus *pci_bus = (PCIBus *) object_resolve_path_type("", TYPE_PCI_BUS, NULL);
0dfa5ef9
IY
995
996 for (c = soundhw; c->name; ++c) {
997 if (c->enabled) {
998 if (c->isa) {
f81222bc
PB
999 if (!isa_bus) {
1000 fprintf(stderr, "ISA bus not available for %s\n", c->name);
1001 exit(1);
0dfa5ef9 1002 }
f81222bc 1003 c->init.init_isa(isa_bus);
0dfa5ef9 1004 } else {
f81222bc
PB
1005 if (!pci_bus) {
1006 fprintf(stderr, "PCI bus not available for %s\n", c->name);
1007 exit(1);
0dfa5ef9 1008 }
f81222bc 1009 c->init.init_pci(pci_bus);
0dfa5ef9
IY
1010 }
1011 }
1012 }
1013}
ad96090a
BS
1014
1015int qemu_uuid_parse(const char *str, uint8_t *uuid)
1016{
1017 int ret;
1018
1019 if (strlen(str) != 36) {
1020 return -1;
1021 }
1022
1023 ret = sscanf(str, UUID_FMT, &uuid[0], &uuid[1], &uuid[2], &uuid[3],
1024 &uuid[4], &uuid[5], &uuid[6], &uuid[7], &uuid[8], &uuid[9],
1025 &uuid[10], &uuid[11], &uuid[12], &uuid[13], &uuid[14],
1026 &uuid[15]);
1027
1028 if (ret != 16) {
1029 return -1;
1030 }
1031#ifdef TARGET_I386
ebc85e3f 1032 smbios_add_field(1, offsetof(struct smbios_type_1, uuid), uuid, 16);
ad96090a
BS
1033#endif
1034 return 0;
1035}
1036
0c764a9d 1037void do_acpitable_option(const QemuOpts *opts)
ad96090a
BS
1038{
1039#ifdef TARGET_I386
23084327
LE
1040 Error *err = NULL;
1041
1042 acpi_table_add(opts, &err);
1043 if (err) {
1044 fprintf(stderr, "Wrong acpi table provided: %s\n",
1045 error_get_pretty(err));
1046 error_free(err);
ad96090a
BS
1047 exit(1);
1048 }
1049#endif
1050}
1051
/*
 * Pass @optarg to smbios_entry_add() on TARGET_I386 and exit with status 1
 * if it returns a negative value.  Does nothing on other targets.
 */
void do_smbios_option(const char *optarg)
{
#ifdef TARGET_I386
    int rc = smbios_entry_add(optarg);

    if (rc < 0) {
        exit(1);
    }
#endif
}
1060
/* Run cpudef_setup() when the target defines it as a macro; else a no-op. */
void cpudef_init(void)
{
#ifdef cpudef_setup
    cpudef_setup(); /* parse cpu definitions in target config file */
#endif
}
1067
303d4e86
AP
/* TCG is always reported as available. */
int tcg_available(void)
{
    const int available = 1;

    return available;
}
1072
ad96090a
BS
/* Return 1 when built with CONFIG_KVM defined, 0 otherwise. */
int kvm_available(void)
{
    int available = 0;

#ifdef CONFIG_KVM
    available = 1;
#endif
    return available;
}
1081
/* Return 1 when built with CONFIG_XEN defined, 0 otherwise. */
int xen_available(void)
{
    int available = 0;

#ifdef CONFIG_XEN
    available = 1;
#endif
    return available;
}
99afc91d
DB
1090
1091
1092TargetInfo *qmp_query_target(Error **errp)
1093{
1094 TargetInfo *info = g_malloc0(sizeof(*info));
1095
c02a9552 1096 info->arch = g_strdup(TARGET_NAME);
99afc91d
DB
1097
1098 return info;
1099}