]>
Commit | Line | Data |
---|---|---|
5bb7910a AL |
1 | /* |
2 | * QEMU live migration | |
3 | * | |
4 | * Copyright IBM, Corp. 2008 | |
5 | * | |
6 | * Authors: | |
7 | * Anthony Liguori <aliguori@us.ibm.com> | |
8 | * | |
9 | * This work is licensed under the terms of the GNU GPL, version 2. See | |
10 | * the COPYING file in the top-level directory. | |
11 | * | |
6b620ca3 PB |
12 | * Contributions after 2012-01-13 are licensed under the terms of the |
13 | * GNU GPL, version 2 or (at your option) any later version. | |
5bb7910a AL |
14 | */ |
15 | ||
16 | #include "qemu-common.h" | |
caf71f86 | 17 | #include "migration/migration.h" |
83c9089e | 18 | #include "monitor/monitor.h" |
0d82d0e8 | 19 | #include "migration/qemu-file.h" |
9c17d615 | 20 | #include "sysemu/sysemu.h" |
737e150e | 21 | #include "block/block.h" |
1de7afc9 | 22 | #include "qemu/sockets.h" |
caf71f86 | 23 | #include "migration/block.h" |
766bd176 | 24 | #include "qemu/thread.h" |
791e7c82 | 25 | #include "qmp-commands.h" |
065e2813 AL |
26 | |
27 | //#define DEBUG_MIGRATION | |
28 | ||
29 | #ifdef DEBUG_MIGRATION | |
d0f2c4c6 | 30 | #define DPRINTF(fmt, ...) \ |
065e2813 AL |
31 | do { printf("migration: " fmt, ## __VA_ARGS__); } while (0) |
32 | #else | |
d0f2c4c6 | 33 | #define DPRINTF(fmt, ...) \ |
065e2813 AL |
34 | do { } while (0) |
35 | #endif | |
5bb7910a | 36 | |
7dc688ed JQ |
37 | enum { |
38 | MIG_STATE_ERROR, | |
39 | MIG_STATE_SETUP, | |
40 | MIG_STATE_CANCELLED, | |
41 | MIG_STATE_ACTIVE, | |
42 | MIG_STATE_COMPLETED, | |
43 | }; | |
5bb7910a | 44 | |
d0ae46c1 | 45 | #define MAX_THROTTLE (32 << 20) /* Migration speed throttling */ |
5bb7910a | 46 | |
5b4e1eb7 JQ |
47 | /* Amount of time to allocate to each "chunk" of bandwidth-throttled |
48 | * data. */ | |
49 | #define BUFFER_DELAY 100 | |
50 | #define XFER_LIMIT_RATIO (1000 / BUFFER_DELAY) | |
51 | ||
17ad9b35 OW |
52 | /* Migration XBZRLE default cache size */ |
53 | #define DEFAULT_MIGRATE_CACHE_SIZE (64 * 1024 * 1024) | |
54 | ||
99a0db9b GH |
55 | static NotifierList migration_state_notifiers = |
56 | NOTIFIER_LIST_INITIALIZER(migration_state_notifiers); | |
57 | ||
17549e84 JQ |
58 | /* When we add fault tolerance, we could have several |
59 | migrations at once. For now we don't need to add | |
60 | dynamic creation of migration */ | |
61 | ||
859bc756 | 62 | MigrationState *migrate_get_current(void) |
17549e84 JQ |
63 | { |
64 | static MigrationState current_migration = { | |
65 | .state = MIG_STATE_SETUP, | |
d0ae46c1 | 66 | .bandwidth_limit = MAX_THROTTLE, |
17ad9b35 | 67 | .xbzrle_cache_size = DEFAULT_MIGRATE_CACHE_SIZE, |
17549e84 JQ |
68 | }; |
69 | ||
70 | return ¤t_migration; | |
71 | } | |
72 | ||
43eaae28 | 73 | void qemu_start_incoming_migration(const char *uri, Error **errp) |
5bb7910a | 74 | { |
34c9dd8e AL |
75 | const char *p; |
76 | ||
77 | if (strstart(uri, "tcp:", &p)) | |
43eaae28 | 78 | tcp_start_incoming_migration(p, errp); |
065e2813 AL |
79 | #if !defined(WIN32) |
80 | else if (strstart(uri, "exec:", &p)) | |
43eaae28 | 81 | exec_start_incoming_migration(p, errp); |
4951f65b | 82 | else if (strstart(uri, "unix:", &p)) |
43eaae28 | 83 | unix_start_incoming_migration(p, errp); |
5ac1fad3 | 84 | else if (strstart(uri, "fd:", &p)) |
43eaae28 | 85 | fd_start_incoming_migration(p, errp); |
065e2813 | 86 | #endif |
8ca5e801 | 87 | else { |
43eaae28 | 88 | error_setg(errp, "unknown migration protocol: %s\n", uri); |
8ca5e801 | 89 | } |
5bb7910a AL |
90 | } |
91 | ||
82a4da79 | 92 | static void process_incoming_migration_co(void *opaque) |
511c0231 | 93 | { |
82a4da79 | 94 | QEMUFile *f = opaque; |
1c12e1f5 PB |
95 | int ret; |
96 | ||
97 | ret = qemu_loadvm_state(f); | |
82a4da79 | 98 | qemu_set_fd_handler(qemu_get_fd(f), NULL, NULL, NULL); |
1c12e1f5 PB |
99 | qemu_fclose(f); |
100 | if (ret < 0) { | |
511c0231 JQ |
101 | fprintf(stderr, "load of migration failed\n"); |
102 | exit(0); | |
103 | } | |
104 | qemu_announce_self(); | |
105 | DPRINTF("successfully loaded vm state\n"); | |
106 | ||
901862cb | 107 | bdrv_clear_incoming_migration_all(); |
0f15423c AL |
108 | /* Make sure all file formats flush their mutable metadata */ |
109 | bdrv_invalidate_cache_all(); | |
110 | ||
f5bbfba1 | 111 | if (autostart) { |
511c0231 | 112 | vm_start(); |
f5bbfba1 | 113 | } else { |
29ed72f1 | 114 | runstate_set(RUN_STATE_PAUSED); |
f5bbfba1 | 115 | } |
511c0231 JQ |
116 | } |
117 | ||
82a4da79 PB |
118 | static void enter_migration_coroutine(void *opaque) |
119 | { | |
120 | Coroutine *co = opaque; | |
121 | qemu_coroutine_enter(co, NULL); | |
122 | } | |
123 | ||
124 | void process_incoming_migration(QEMUFile *f) | |
125 | { | |
126 | Coroutine *co = qemu_coroutine_create(process_incoming_migration_co); | |
127 | int fd = qemu_get_fd(f); | |
128 | ||
129 | assert(fd != -1); | |
130 | socket_set_nonblock(fd); | |
131 | qemu_set_fd_handler(fd, enter_migration_coroutine, NULL, co); | |
132 | qemu_coroutine_enter(co, f); | |
133 | } | |
134 | ||
a0a3fd60 GC |
135 | /* amount of nanoseconds we are willing to wait for migration to be down. |
136 | * the choice of nanoseconds is because it is the maximum resolution that | |
137 | * get_clock() can achieve. It is an internal measure. All user-visible | |
138 | * units must be in seconds */ | |
139 | static uint64_t max_downtime = 30000000; | |
140 | ||
141 | uint64_t migrate_max_downtime(void) | |
142 | { | |
143 | return max_downtime; | |
144 | } | |
145 | ||
bbf6da32 OW |
146 | MigrationCapabilityStatusList *qmp_query_migrate_capabilities(Error **errp) |
147 | { | |
148 | MigrationCapabilityStatusList *head = NULL; | |
149 | MigrationCapabilityStatusList *caps; | |
150 | MigrationState *s = migrate_get_current(); | |
151 | int i; | |
152 | ||
153 | for (i = 0; i < MIGRATION_CAPABILITY_MAX; i++) { | |
154 | if (head == NULL) { | |
155 | head = g_malloc0(sizeof(*caps)); | |
156 | caps = head; | |
157 | } else { | |
158 | caps->next = g_malloc0(sizeof(*caps)); | |
159 | caps = caps->next; | |
160 | } | |
161 | caps->value = | |
162 | g_malloc(sizeof(*caps->value)); | |
163 | caps->value->capability = i; | |
164 | caps->value->state = s->enabled_capabilities[i]; | |
165 | } | |
166 | ||
167 | return head; | |
168 | } | |
169 | ||
f36d55af OW |
170 | static void get_xbzrle_cache_stats(MigrationInfo *info) |
171 | { | |
172 | if (migrate_use_xbzrle()) { | |
173 | info->has_xbzrle_cache = true; | |
174 | info->xbzrle_cache = g_malloc0(sizeof(*info->xbzrle_cache)); | |
175 | info->xbzrle_cache->cache_size = migrate_xbzrle_cache_size(); | |
176 | info->xbzrle_cache->bytes = xbzrle_mig_bytes_transferred(); | |
177 | info->xbzrle_cache->pages = xbzrle_mig_pages_transferred(); | |
178 | info->xbzrle_cache->cache_miss = xbzrle_mig_pages_cache_miss(); | |
179 | info->xbzrle_cache->overflow = xbzrle_mig_pages_overflow(); | |
180 | } | |
181 | } | |
182 | ||
791e7c82 | 183 | MigrationInfo *qmp_query_migrate(Error **errp) |
5bb7910a | 184 | { |
791e7c82 | 185 | MigrationInfo *info = g_malloc0(sizeof(*info)); |
17549e84 JQ |
186 | MigrationState *s = migrate_get_current(); |
187 | ||
188 | switch (s->state) { | |
189 | case MIG_STATE_SETUP: | |
190 | /* no migration has happened ever */ | |
191 | break; | |
192 | case MIG_STATE_ACTIVE: | |
791e7c82 LC |
193 | info->has_status = true; |
194 | info->status = g_strdup("active"); | |
7aa939af JQ |
195 | info->has_total_time = true; |
196 | info->total_time = qemu_get_clock_ms(rt_clock) | |
197 | - s->total_time; | |
2c52ddf1 JQ |
198 | info->has_expected_downtime = true; |
199 | info->expected_downtime = s->expected_downtime; | |
17549e84 | 200 | |
791e7c82 LC |
201 | info->has_ram = true; |
202 | info->ram = g_malloc0(sizeof(*info->ram)); | |
203 | info->ram->transferred = ram_bytes_transferred(); | |
204 | info->ram->remaining = ram_bytes_remaining(); | |
205 | info->ram->total = ram_bytes_total(); | |
004d4c10 OW |
206 | info->ram->duplicate = dup_mig_pages_transferred(); |
207 | info->ram->normal = norm_mig_pages_transferred(); | |
208 | info->ram->normal_bytes = norm_mig_bytes_transferred(); | |
8d017193 JQ |
209 | info->ram->dirty_pages_rate = s->dirty_pages_rate; |
210 | ||
17549e84 JQ |
211 | |
212 | if (blk_mig_active()) { | |
791e7c82 LC |
213 | info->has_disk = true; |
214 | info->disk = g_malloc0(sizeof(*info->disk)); | |
215 | info->disk->transferred = blk_mig_bytes_transferred(); | |
216 | info->disk->remaining = blk_mig_bytes_remaining(); | |
217 | info->disk->total = blk_mig_bytes_total(); | |
ff8d81d8 | 218 | } |
f36d55af OW |
219 | |
220 | get_xbzrle_cache_stats(info); | |
17549e84 JQ |
221 | break; |
222 | case MIG_STATE_COMPLETED: | |
f36d55af OW |
223 | get_xbzrle_cache_stats(info); |
224 | ||
791e7c82 LC |
225 | info->has_status = true; |
226 | info->status = g_strdup("completed"); | |
7aa939af | 227 | info->total_time = s->total_time; |
9c5a9fcf JQ |
228 | info->has_downtime = true; |
229 | info->downtime = s->downtime; | |
d5f8a570 JQ |
230 | |
231 | info->has_ram = true; | |
232 | info->ram = g_malloc0(sizeof(*info->ram)); | |
233 | info->ram->transferred = ram_bytes_transferred(); | |
234 | info->ram->remaining = 0; | |
235 | info->ram->total = ram_bytes_total(); | |
004d4c10 OW |
236 | info->ram->duplicate = dup_mig_pages_transferred(); |
237 | info->ram->normal = norm_mig_pages_transferred(); | |
238 | info->ram->normal_bytes = norm_mig_bytes_transferred(); | |
17549e84 JQ |
239 | break; |
240 | case MIG_STATE_ERROR: | |
791e7c82 LC |
241 | info->has_status = true; |
242 | info->status = g_strdup("failed"); | |
17549e84 JQ |
243 | break; |
244 | case MIG_STATE_CANCELLED: | |
791e7c82 LC |
245 | info->has_status = true; |
246 | info->status = g_strdup("cancelled"); | |
17549e84 | 247 | break; |
5bb7910a | 248 | } |
791e7c82 LC |
249 | |
250 | return info; | |
5bb7910a AL |
251 | } |
252 | ||
00458433 OW |
253 | void qmp_migrate_set_capabilities(MigrationCapabilityStatusList *params, |
254 | Error **errp) | |
255 | { | |
256 | MigrationState *s = migrate_get_current(); | |
257 | MigrationCapabilityStatusList *cap; | |
258 | ||
259 | if (s->state == MIG_STATE_ACTIVE) { | |
260 | error_set(errp, QERR_MIGRATION_ACTIVE); | |
261 | return; | |
262 | } | |
263 | ||
264 | for (cap = params; cap; cap = cap->next) { | |
265 | s->enabled_capabilities[cap->value->capability] = cap->value->state; | |
266 | } | |
267 | } | |
268 | ||
065e2813 AL |
269 | /* shared migration helpers */ |
270 | ||
8b6b99b3 | 271 | static int migrate_fd_cleanup(MigrationState *s) |
065e2813 | 272 | { |
41ef56e6 AL |
273 | int ret = 0; |
274 | ||
065e2813 | 275 | if (s->file) { |
d0f2c4c6 | 276 | DPRINTF("closing file\n"); |
a6d34a94 | 277 | ret = qemu_fclose(s->file); |
5d39c799 | 278 | s->file = NULL; |
065e2813 AL |
279 | } |
280 | ||
24ea1e4b | 281 | assert(s->fd == -1); |
41ef56e6 | 282 | return ret; |
065e2813 AL |
283 | } |
284 | ||
8b6b99b3 | 285 | void migrate_fd_error(MigrationState *s) |
065e2813 | 286 | { |
8b6b99b3 JQ |
287 | DPRINTF("setting error state\n"); |
288 | s->state = MIG_STATE_ERROR; | |
e0eb7390 | 289 | notifier_list_notify(&migration_state_notifiers, s); |
8b6b99b3 JQ |
290 | migrate_fd_cleanup(s); |
291 | } | |
292 | ||
458cf28e JQ |
293 | static void migrate_fd_completed(MigrationState *s) |
294 | { | |
295 | DPRINTF("setting completed state\n"); | |
296 | if (migrate_fd_cleanup(s) < 0) { | |
297 | s->state = MIG_STATE_ERROR; | |
298 | } else { | |
299 | s->state = MIG_STATE_COMPLETED; | |
300 | runstate_set(RUN_STATE_POSTMIGRATE); | |
301 | } | |
e0eb7390 | 302 | notifier_list_notify(&migration_state_notifiers, s); |
458cf28e JQ |
303 | } |
304 | ||
c87b015b JQ |
305 | ssize_t migrate_fd_put_buffer(MigrationState *s, const void *data, |
306 | size_t size) | |
065e2813 | 307 | { |
065e2813 AL |
308 | ssize_t ret; |
309 | ||
fdbecb5d JQ |
310 | if (s->state != MIG_STATE_ACTIVE) { |
311 | return -EIO; | |
312 | } | |
313 | ||
065e2813 AL |
314 | do { |
315 | ret = s->write(s, data, size); | |
95b134ea | 316 | } while (ret == -1 && ((s->get_error(s)) == EINTR)); |
065e2813 AL |
317 | |
318 | if (ret == -1) | |
319 | ret = -(s->get_error(s)); | |
320 | ||
065e2813 AL |
321 | return ret; |
322 | } | |
323 | ||
0edda1c4 | 324 | static void migrate_fd_cancel(MigrationState *s) |
065e2813 | 325 | { |
065e2813 AL |
326 | if (s->state != MIG_STATE_ACTIVE) |
327 | return; | |
328 | ||
d0f2c4c6 | 329 | DPRINTF("cancelling migration\n"); |
065e2813 AL |
330 | |
331 | s->state = MIG_STATE_CANCELLED; | |
e0eb7390 | 332 | notifier_list_notify(&migration_state_notifiers, s); |
539de124 | 333 | qemu_savevm_state_cancel(s->file); |
065e2813 AL |
334 | |
335 | migrate_fd_cleanup(s); | |
336 | } | |
337 | ||
11c76741 | 338 | int migrate_fd_close(MigrationState *s) |
065e2813 | 339 | { |
8dc592e6 PB |
340 | int rc = 0; |
341 | if (s->fd != -1) { | |
8dc592e6 PB |
342 | rc = s->close(s); |
343 | s->fd = -1; | |
344 | } | |
345 | return rc; | |
065e2813 | 346 | } |
99a0db9b GH |
347 | |
348 | void add_migration_state_change_notifier(Notifier *notify) | |
349 | { | |
350 | notifier_list_add(&migration_state_notifiers, notify); | |
351 | } | |
352 | ||
353 | void remove_migration_state_change_notifier(Notifier *notify) | |
354 | { | |
31552529 | 355 | notifier_remove(notify); |
99a0db9b GH |
356 | } |
357 | ||
afe2df69 GH |
358 | bool migration_is_active(MigrationState *s) |
359 | { | |
360 | return s->state == MIG_STATE_ACTIVE; | |
361 | } | |
362 | ||
7073693b | 363 | bool migration_has_finished(MigrationState *s) |
99a0db9b | 364 | { |
7073693b | 365 | return s->state == MIG_STATE_COMPLETED; |
99a0db9b | 366 | } |
0edda1c4 | 367 | |
afe2df69 GH |
368 | bool migration_has_failed(MigrationState *s) |
369 | { | |
370 | return (s->state == MIG_STATE_CANCELLED || | |
371 | s->state == MIG_STATE_ERROR); | |
372 | } | |
373 | ||
6607ae23 | 374 | static MigrationState *migrate_init(const MigrationParams *params) |
0edda1c4 | 375 | { |
17549e84 | 376 | MigrationState *s = migrate_get_current(); |
d0ae46c1 | 377 | int64_t bandwidth_limit = s->bandwidth_limit; |
bbf6da32 | 378 | bool enabled_capabilities[MIGRATION_CAPABILITY_MAX]; |
17ad9b35 | 379 | int64_t xbzrle_cache_size = s->xbzrle_cache_size; |
bbf6da32 OW |
380 | |
381 | memcpy(enabled_capabilities, s->enabled_capabilities, | |
382 | sizeof(enabled_capabilities)); | |
0edda1c4 | 383 | |
17549e84 | 384 | memset(s, 0, sizeof(*s)); |
d0ae46c1 | 385 | s->bandwidth_limit = bandwidth_limit; |
6607ae23 | 386 | s->params = *params; |
bbf6da32 OW |
387 | memcpy(s->enabled_capabilities, enabled_capabilities, |
388 | sizeof(enabled_capabilities)); | |
17ad9b35 | 389 | s->xbzrle_cache_size = xbzrle_cache_size; |
1299c631 | 390 | |
0edda1c4 | 391 | s->bandwidth_limit = bandwidth_limit; |
d5934dde | 392 | s->state = MIG_STATE_SETUP; |
d5f8a570 | 393 | s->total_time = qemu_get_clock_ms(rt_clock); |
0edda1c4 | 394 | |
0edda1c4 JQ |
395 | return s; |
396 | } | |
cab30143 | 397 | |
fa2756b7 AL |
398 | static GSList *migration_blockers; |
399 | ||
400 | void migrate_add_blocker(Error *reason) | |
401 | { | |
402 | migration_blockers = g_slist_prepend(migration_blockers, reason); | |
403 | } | |
404 | ||
405 | void migrate_del_blocker(Error *reason) | |
406 | { | |
407 | migration_blockers = g_slist_remove(migration_blockers, reason); | |
408 | } | |
409 | ||
e1c37d0e LC |
410 | void qmp_migrate(const char *uri, bool has_blk, bool blk, |
411 | bool has_inc, bool inc, bool has_detach, bool detach, | |
412 | Error **errp) | |
cab30143 | 413 | { |
be7059cd | 414 | Error *local_err = NULL; |
17549e84 | 415 | MigrationState *s = migrate_get_current(); |
6607ae23 | 416 | MigrationParams params; |
cab30143 | 417 | const char *p; |
cab30143 | 418 | |
6607ae23 IY |
419 | params.blk = blk; |
420 | params.shared = inc; | |
421 | ||
17549e84 | 422 | if (s->state == MIG_STATE_ACTIVE) { |
e1c37d0e LC |
423 | error_set(errp, QERR_MIGRATION_ACTIVE); |
424 | return; | |
cab30143 JQ |
425 | } |
426 | ||
e1c37d0e LC |
427 | if (qemu_savevm_state_blocked(errp)) { |
428 | return; | |
cab30143 JQ |
429 | } |
430 | ||
fa2756b7 | 431 | if (migration_blockers) { |
e1c37d0e LC |
432 | *errp = error_copy(migration_blockers->data); |
433 | return; | |
fa2756b7 AL |
434 | } |
435 | ||
6607ae23 | 436 | s = migrate_init(¶ms); |
cab30143 JQ |
437 | |
438 | if (strstart(uri, "tcp:", &p)) { | |
f37afb5a | 439 | tcp_start_outgoing_migration(s, p, &local_err); |
cab30143 JQ |
440 | #if !defined(WIN32) |
441 | } else if (strstart(uri, "exec:", &p)) { | |
f37afb5a | 442 | exec_start_outgoing_migration(s, p, &local_err); |
cab30143 | 443 | } else if (strstart(uri, "unix:", &p)) { |
f37afb5a | 444 | unix_start_outgoing_migration(s, p, &local_err); |
cab30143 | 445 | } else if (strstart(uri, "fd:", &p)) { |
f37afb5a | 446 | fd_start_outgoing_migration(s, p, &local_err); |
cab30143 | 447 | #endif |
99a0db9b | 448 | } else { |
e1c37d0e LC |
449 | error_set(errp, QERR_INVALID_PARAMETER_VALUE, "uri", "a valid migration protocol"); |
450 | return; | |
cab30143 JQ |
451 | } |
452 | ||
f37afb5a | 453 | if (local_err) { |
342ab8d1 | 454 | migrate_fd_error(s); |
f37afb5a | 455 | error_propagate(errp, local_err); |
e1c37d0e | 456 | return; |
1299c631 JQ |
457 | } |
458 | ||
e0eb7390 | 459 | notifier_list_notify(&migration_state_notifiers, s); |
cab30143 JQ |
460 | } |
461 | ||
6cdedb07 | 462 | void qmp_migrate_cancel(Error **errp) |
cab30143 | 463 | { |
17549e84 | 464 | migrate_fd_cancel(migrate_get_current()); |
cab30143 JQ |
465 | } |
466 | ||
9e1ba4cc OW |
467 | void qmp_migrate_set_cache_size(int64_t value, Error **errp) |
468 | { | |
469 | MigrationState *s = migrate_get_current(); | |
470 | ||
471 | /* Check for truncation */ | |
472 | if (value != (size_t)value) { | |
473 | error_set(errp, QERR_INVALID_PARAMETER_VALUE, "cache size", | |
474 | "exceeding address space"); | |
475 | return; | |
476 | } | |
477 | ||
478 | s->xbzrle_cache_size = xbzrle_cache_resize(value); | |
479 | } | |
480 | ||
481 | int64_t qmp_query_migrate_cache_size(Error **errp) | |
482 | { | |
483 | return migrate_xbzrle_cache_size(); | |
484 | } | |
485 | ||
3dc85383 | 486 | void qmp_migrate_set_speed(int64_t value, Error **errp) |
cab30143 | 487 | { |
cab30143 JQ |
488 | MigrationState *s; |
489 | ||
3dc85383 LC |
490 | if (value < 0) { |
491 | value = 0; | |
99a0db9b | 492 | } |
cab30143 | 493 | |
17549e84 | 494 | s = migrate_get_current(); |
3dc85383 | 495 | s->bandwidth_limit = value; |
d0ae46c1 | 496 | qemu_file_set_rate_limit(s->file, s->bandwidth_limit); |
cab30143 JQ |
497 | } |
498 | ||
4f0a993b | 499 | void qmp_migrate_set_downtime(double value, Error **errp) |
cab30143 | 500 | { |
4f0a993b LC |
501 | value *= 1e9; |
502 | value = MAX(0, MIN(UINT64_MAX, value)); | |
503 | max_downtime = (uint64_t)value; | |
99a0db9b | 504 | } |
17ad9b35 OW |
505 | |
506 | int migrate_use_xbzrle(void) | |
507 | { | |
508 | MigrationState *s; | |
509 | ||
510 | s = migrate_get_current(); | |
511 | ||
512 | return s->enabled_capabilities[MIGRATION_CAPABILITY_XBZRLE]; | |
513 | } | |
514 | ||
515 | int64_t migrate_xbzrle_cache_size(void) | |
516 | { | |
517 | MigrationState *s; | |
518 | ||
519 | s = migrate_get_current(); | |
520 | ||
521 | return s->xbzrle_cache_size; | |
522 | } | |
0d82d0e8 JQ |
523 | |
524 | /* migration thread support */ | |
525 | ||
526 | typedef struct QEMUFileBuffered { | |
527 | MigrationState *migration_state; | |
528 | QEMUFile *file; | |
529 | size_t bytes_xfer; | |
530 | size_t xfer_limit; | |
531 | uint8_t *buffer; | |
532 | size_t buffer_size; | |
533 | size_t buffer_capacity; | |
534 | QemuThread thread; | |
535 | } QEMUFileBuffered; | |
536 | ||
537 | static ssize_t buffered_flush(QEMUFileBuffered *s) | |
538 | { | |
539 | size_t offset = 0; | |
540 | ssize_t ret = 0; | |
541 | ||
542 | DPRINTF("flushing %zu byte(s) of data\n", s->buffer_size); | |
543 | ||
544 | while (s->bytes_xfer < s->xfer_limit && offset < s->buffer_size) { | |
545 | size_t to_send = MIN(s->buffer_size - offset, s->xfer_limit - s->bytes_xfer); | |
546 | ret = migrate_fd_put_buffer(s->migration_state, s->buffer + offset, | |
547 | to_send); | |
548 | if (ret <= 0) { | |
549 | DPRINTF("error flushing data, %zd\n", ret); | |
550 | break; | |
551 | } else { | |
552 | DPRINTF("flushed %zd byte(s)\n", ret); | |
553 | offset += ret; | |
554 | s->bytes_xfer += ret; | |
555 | } | |
556 | } | |
557 | ||
558 | DPRINTF("flushed %zu of %zu byte(s)\n", offset, s->buffer_size); | |
559 | memmove(s->buffer, s->buffer + offset, s->buffer_size - offset); | |
560 | s->buffer_size -= offset; | |
561 | ||
562 | if (ret < 0) { | |
563 | return ret; | |
564 | } | |
565 | return offset; | |
566 | } | |
567 | ||
568 | static int buffered_put_buffer(void *opaque, const uint8_t *buf, | |
569 | int64_t pos, int size) | |
570 | { | |
571 | QEMUFileBuffered *s = opaque; | |
572 | ssize_t error; | |
573 | ||
574 | DPRINTF("putting %d bytes at %" PRId64 "\n", size, pos); | |
575 | ||
576 | error = qemu_file_get_error(s->file); | |
577 | if (error) { | |
578 | DPRINTF("flush when error, bailing: %s\n", strerror(-error)); | |
579 | return error; | |
580 | } | |
581 | ||
582 | if (size <= 0) { | |
583 | return size; | |
584 | } | |
585 | ||
586 | if (size > (s->buffer_capacity - s->buffer_size)) { | |
587 | DPRINTF("increasing buffer capacity from %zu by %zu\n", | |
588 | s->buffer_capacity, size + 1024); | |
589 | ||
590 | s->buffer_capacity += size + 1024; | |
591 | ||
592 | s->buffer = g_realloc(s->buffer, s->buffer_capacity); | |
593 | } | |
594 | ||
595 | memcpy(s->buffer + s->buffer_size, buf, size); | |
596 | s->buffer_size += size; | |
597 | ||
598 | return size; | |
599 | } | |
600 | ||
601 | static int buffered_close(void *opaque) | |
602 | { | |
603 | QEMUFileBuffered *s = opaque; | |
604 | ssize_t ret = 0; | |
605 | int ret2; | |
606 | ||
607 | DPRINTF("closing\n"); | |
608 | ||
609 | s->xfer_limit = INT_MAX; | |
610 | while (!qemu_file_get_error(s->file) && s->buffer_size) { | |
611 | ret = buffered_flush(s); | |
612 | if (ret < 0) { | |
613 | break; | |
614 | } | |
615 | } | |
616 | ||
617 | ret2 = migrate_fd_close(s->migration_state); | |
618 | if (ret >= 0) { | |
619 | ret = ret2; | |
620 | } | |
621 | ret = migrate_fd_close(s->migration_state); | |
622 | s->migration_state->complete = true; | |
623 | return ret; | |
624 | } | |
625 | ||
626 | static int buffered_get_fd(void *opaque) | |
627 | { | |
628 | QEMUFileBuffered *s = opaque; | |
629 | ||
630 | return qemu_get_fd(s->file); | |
631 | } | |
632 | ||
633 | /* | |
634 | * The meaning of the return values is: | |
635 | * 0: We can continue sending | |
636 | * 1: Time to stop | |
637 | * negative: There has been an error | |
638 | */ | |
639 | static int buffered_rate_limit(void *opaque) | |
640 | { | |
641 | QEMUFileBuffered *s = opaque; | |
642 | int ret; | |
643 | ||
644 | ret = qemu_file_get_error(s->file); | |
645 | if (ret) { | |
646 | return ret; | |
647 | } | |
648 | ||
649 | if (s->bytes_xfer > s->xfer_limit) { | |
650 | return 1; | |
651 | } | |
652 | ||
653 | return 0; | |
654 | } | |
655 | ||
656 | static int64_t buffered_set_rate_limit(void *opaque, int64_t new_rate) | |
657 | { | |
658 | QEMUFileBuffered *s = opaque; | |
659 | if (qemu_file_get_error(s->file)) { | |
660 | goto out; | |
661 | } | |
662 | if (new_rate > SIZE_MAX) { | |
663 | new_rate = SIZE_MAX; | |
664 | } | |
665 | ||
666 | s->xfer_limit = new_rate / 10; | |
667 | ||
668 | out: | |
669 | return s->xfer_limit; | |
670 | } | |
671 | ||
672 | static int64_t buffered_get_rate_limit(void *opaque) | |
673 | { | |
674 | QEMUFileBuffered *s = opaque; | |
675 | ||
676 | return s->xfer_limit; | |
677 | } | |
678 | ||
0e288fa3 JQ |
679 | static bool migrate_fd_put_ready(MigrationState *s, uint64_t max_size) |
680 | { | |
681 | int ret; | |
682 | uint64_t pending_size; | |
683 | bool last_round = false; | |
684 | ||
685 | qemu_mutex_lock_iothread(); | |
686 | if (s->state != MIG_STATE_ACTIVE) { | |
687 | DPRINTF("put_ready returning because of non-active state\n"); | |
688 | qemu_mutex_unlock_iothread(); | |
689 | return false; | |
690 | } | |
691 | if (s->first_time) { | |
692 | s->first_time = false; | |
693 | DPRINTF("beginning savevm\n"); | |
694 | ret = qemu_savevm_state_begin(s->file, &s->params); | |
695 | if (ret < 0) { | |
696 | DPRINTF("failed, %d\n", ret); | |
697 | migrate_fd_error(s); | |
698 | qemu_mutex_unlock_iothread(); | |
699 | return false; | |
700 | } | |
701 | } | |
702 | ||
703 | DPRINTF("iterate\n"); | |
704 | pending_size = qemu_savevm_state_pending(s->file, max_size); | |
705 | DPRINTF("pending size %lu max %lu\n", pending_size, max_size); | |
706 | if (pending_size >= max_size) { | |
707 | ret = qemu_savevm_state_iterate(s->file); | |
708 | if (ret < 0) { | |
709 | migrate_fd_error(s); | |
710 | } | |
711 | } else { | |
712 | int old_vm_running = runstate_is_running(); | |
713 | int64_t start_time, end_time; | |
714 | ||
715 | DPRINTF("done iterating\n"); | |
716 | start_time = qemu_get_clock_ms(rt_clock); | |
717 | qemu_system_wakeup_request(QEMU_WAKEUP_REASON_OTHER); | |
718 | if (old_vm_running) { | |
719 | vm_stop(RUN_STATE_FINISH_MIGRATE); | |
720 | } else { | |
721 | vm_stop_force_state(RUN_STATE_FINISH_MIGRATE); | |
722 | } | |
723 | ||
724 | if (qemu_savevm_state_complete(s->file) < 0) { | |
725 | migrate_fd_error(s); | |
726 | } else { | |
727 | migrate_fd_completed(s); | |
728 | } | |
729 | end_time = qemu_get_clock_ms(rt_clock); | |
730 | s->total_time = end_time - s->total_time; | |
731 | s->downtime = end_time - start_time; | |
732 | if (s->state != MIG_STATE_COMPLETED) { | |
733 | if (old_vm_running) { | |
734 | vm_start(); | |
735 | } | |
736 | } | |
737 | last_round = true; | |
738 | } | |
739 | qemu_mutex_unlock_iothread(); | |
740 | ||
741 | return last_round; | |
742 | } | |
743 | ||
0d82d0e8 JQ |
744 | static void *buffered_file_thread(void *opaque) |
745 | { | |
746 | QEMUFileBuffered *s = opaque; | |
747 | int64_t initial_time = qemu_get_clock_ms(rt_clock); | |
748 | int64_t max_size = 0; | |
749 | bool last_round = false; | |
750 | ||
751 | while (true) { | |
752 | int64_t current_time = qemu_get_clock_ms(rt_clock); | |
753 | ||
754 | if (s->migration_state->complete) { | |
755 | break; | |
756 | } | |
757 | if (current_time >= initial_time + BUFFER_DELAY) { | |
758 | uint64_t transferred_bytes = s->bytes_xfer; | |
759 | uint64_t time_spent = current_time - initial_time; | |
760 | double bandwidth = transferred_bytes / time_spent; | |
761 | max_size = bandwidth * migrate_max_downtime() / 1000000; | |
762 | ||
763 | DPRINTF("transferred %" PRIu64 " time_spent %" PRIu64 | |
764 | " bandwidth %g max_size %" PRId64 "\n", | |
765 | transferred_bytes, time_spent, bandwidth, max_size); | |
766 | ||
767 | s->bytes_xfer = 0; | |
768 | initial_time = current_time; | |
769 | } | |
770 | if (!last_round && (s->bytes_xfer >= s->xfer_limit)) { | |
771 | /* usleep expects microseconds */ | |
772 | g_usleep((initial_time + BUFFER_DELAY - current_time)*1000); | |
773 | } | |
774 | if (buffered_flush(s) < 0) { | |
775 | break; | |
776 | } | |
777 | ||
778 | DPRINTF("file is ready\n"); | |
779 | if (s->bytes_xfer < s->xfer_limit) { | |
780 | DPRINTF("notifying client\n"); | |
781 | last_round = migrate_fd_put_ready(s->migration_state, max_size); | |
782 | } | |
783 | } | |
784 | ||
785 | g_free(s->buffer); | |
786 | g_free(s); | |
787 | return NULL; | |
788 | } | |
789 | ||
790 | static const QEMUFileOps buffered_file_ops = { | |
791 | .get_fd = buffered_get_fd, | |
792 | .put_buffer = buffered_put_buffer, | |
793 | .close = buffered_close, | |
794 | .rate_limit = buffered_rate_limit, | |
795 | .get_rate_limit = buffered_get_rate_limit, | |
796 | .set_rate_limit = buffered_set_rate_limit, | |
797 | }; | |
798 | ||
2e450865 | 799 | void migrate_fd_connect(MigrationState *migration_state) |
0d82d0e8 JQ |
800 | { |
801 | QEMUFileBuffered *s; | |
802 | ||
2e450865 JQ |
803 | migration_state->state = MIG_STATE_ACTIVE; |
804 | migration_state->first_time = true; | |
0d82d0e8 JQ |
805 | s = g_malloc0(sizeof(*s)); |
806 | ||
807 | s->migration_state = migration_state; | |
5b4e1eb7 | 808 | s->xfer_limit = s->migration_state->bandwidth_limit / XFER_LIMIT_RATIO; |
0d82d0e8 JQ |
809 | s->migration_state->complete = false; |
810 | ||
811 | s->file = qemu_fopen_ops(s, &buffered_file_ops); | |
812 | ||
813 | migration_state->file = s->file; | |
814 | ||
815 | qemu_thread_create(&s->thread, buffered_file_thread, s, | |
816 | QEMU_THREAD_DETACHED); | |
817 | } |