]>
Commit | Line | Data |
---|---|---|
5bb7910a AL |
1 | /* |
2 | * QEMU live migration | |
3 | * | |
4 | * Copyright IBM, Corp. 2008 | |
5 | * | |
6 | * Authors: | |
7 | * Anthony Liguori <[email protected]> | |
8 | * | |
9 | * This work is licensed under the terms of the GNU GPL, version 2. See | |
10 | * the COPYING file in the top-level directory. | |
11 | * | |
12 | */ | |
13 | ||
14 | #include "qemu-common.h" | |
15 | #include "migration.h" | |
376253ec | 16 | #include "monitor.h" |
065e2813 AL |
17 | #include "buffered_file.h" |
18 | #include "sysemu.h" | |
19 | #include "block.h" | |
20 | #include "qemu_socket.h" | |
25f23643 | 21 | #include "block-migration.h" |
c86a6683 | 22 | #include "qemu-objects.h" |
065e2813 AL |
23 | |
24 | //#define DEBUG_MIGRATION | |
25 | ||
/*
 * DPRINTF(fmt, ...): debug trace, printed with a "migration: " prefix when
 * DEBUG_MIGRATION is defined.
 *
 * When tracing is disabled the printf() call is kept behind "if (0)" so the
 * compiler still checks the format string against its arguments (and still
 * sees the arguments as used), while emitting no code and never evaluating
 * the arguments at run time.
 */
#ifdef DEBUG_MIGRATION
#define DPRINTF(fmt, ...) \
    do { printf("migration: " fmt, ## __VA_ARGS__); } while (0)
#else
#define DPRINTF(fmt, ...) \
    do { if (0) { printf("migration: " fmt, ## __VA_ARGS__); } } while (0)
#endif
5bb7910a AL |
33 | |
34 | /* Migration speed throttling */ | |
35 | static uint32_t max_throttle = (32 << 20); | |
36 | ||
37 | static MigrationState *current_migration; | |
38 | ||
/*
 * Start listening for an incoming migration described by @uri.
 *
 * The URI prefix selects the transport: "tcp:" everywhere, plus "exec:",
 * "unix:" and "fd:" when not building for WIN32.  The text after the
 * prefix is handed to the transport-specific start routine.
 *
 * Returns the transport routine's result, or -EPROTONOSUPPORT (after
 * printing a message to stderr) when no prefix matches.
 */
int qemu_start_incoming_migration(const char *uri)
{
    const char *rest;

    if (strstart(uri, "tcp:", &rest)) {
        return tcp_start_incoming_migration(rest);
    }
#if !defined(WIN32)
    if (strstart(uri, "exec:", &rest)) {
        return exec_start_incoming_migration(rest);
    }
    if (strstart(uri, "unix:", &rest)) {
        return unix_start_incoming_migration(rest);
    }
    if (strstart(uri, "fd:", &rest)) {
        return fd_start_incoming_migration(rest);
    }
#endif

    fprintf(stderr, "unknown migration protocol: %s\n", uri);
    return -EPROTONOSUPPORT;
}
60 | ||
511c0231 JQ |
61 | void process_incoming_migration(QEMUFile *f) |
62 | { | |
63 | if (qemu_loadvm_state(f) < 0) { | |
64 | fprintf(stderr, "load of migration failed\n"); | |
65 | exit(0); | |
66 | } | |
67 | qemu_announce_self(); | |
68 | DPRINTF("successfully loaded vm state\n"); | |
69 | ||
70 | if (autostart) | |
71 | vm_start(); | |
72 | } | |
73 | ||
b5d17adb | 74 | int do_migrate(Monitor *mon, const QDict *qdict, QObject **ret_data) |
5bb7910a | 75 | { |
34c9dd8e AL |
76 | MigrationState *s = NULL; |
77 | const char *p; | |
eb159d13 LC |
78 | int detach = qdict_get_try_bool(qdict, "detach", 0); |
79 | int blk = qdict_get_try_bool(qdict, "blk", 0); | |
80 | int inc = qdict_get_try_bool(qdict, "inc", 0); | |
f18c16de | 81 | const char *uri = qdict_get_str(qdict, "uri"); |
1302425d JK |
82 | |
83 | if (current_migration && | |
84 | current_migration->get_status(current_migration) == MIG_STATE_ACTIVE) { | |
85 | monitor_printf(mon, "migration already in progress\n"); | |
b5d17adb | 86 | return -1; |
1302425d JK |
87 | } |
88 | ||
b5d17adb | 89 | if (strstart(uri, "tcp:", &p)) { |
f327aa0c | 90 | s = tcp_start_outgoing_migration(mon, p, max_throttle, detach, |
eb159d13 | 91 | blk, inc); |
065e2813 | 92 | #if !defined(WIN32) |
b5d17adb | 93 | } else if (strstart(uri, "exec:", &p)) { |
f327aa0c | 94 | s = exec_start_outgoing_migration(mon, p, max_throttle, detach, |
eb159d13 | 95 | blk, inc); |
b5d17adb | 96 | } else if (strstart(uri, "unix:", &p)) { |
f327aa0c | 97 | s = unix_start_outgoing_migration(mon, p, max_throttle, detach, |
eb159d13 | 98 | blk, inc); |
b5d17adb | 99 | } else if (strstart(uri, "fd:", &p)) { |
c163b5ca | 100 | s = fd_start_outgoing_migration(mon, p, max_throttle, detach, |
eb159d13 | 101 | blk, inc); |
065e2813 | 102 | #endif |
b5d17adb | 103 | } else { |
376253ec | 104 | monitor_printf(mon, "unknown migration protocol: %s\n", uri); |
b5d17adb LC |
105 | return -1; |
106 | } | |
34c9dd8e | 107 | |
b5d17adb | 108 | if (s == NULL) { |
376253ec | 109 | monitor_printf(mon, "migration failed\n"); |
b5d17adb LC |
110 | return -1; |
111 | } | |
34c9dd8e | 112 | |
b5d17adb LC |
113 | if (current_migration) { |
114 | current_migration->release(current_migration); | |
34c9dd8e | 115 | } |
b5d17adb LC |
116 | |
117 | current_migration = s; | |
118 | return 0; | |
5bb7910a AL |
119 | } |
120 | ||
ef4b7eee | 121 | int do_migrate_cancel(Monitor *mon, const QDict *qdict, QObject **ret_data) |
5bb7910a AL |
122 | { |
123 | MigrationState *s = current_migration; | |
124 | ||
125 | if (s) | |
ff8d81d8 | 126 | s->cancel(s); |
ef4b7eee LC |
127 | |
128 | return 0; | |
5bb7910a AL |
129 | } |
130 | ||
ef4b7eee | 131 | int do_migrate_set_speed(Monitor *mon, const QDict *qdict, QObject **ret_data) |
5bb7910a AL |
132 | { |
133 | double d; | |
daa91de2 | 134 | FdMigrationState *s; |
5bb7910a | 135 | |
5667c493 MA |
136 | d = qdict_get_double(qdict, "value"); |
137 | d = MAX(0, MIN(UINT32_MAX, d)); | |
138 | max_throttle = d; | |
daa91de2 | 139 | |
5d39c799 JK |
140 | s = migrate_to_fms(current_migration); |
141 | if (s && s->file) { | |
daa91de2 GC |
142 | qemu_file_set_rate_limit(s->file, max_throttle); |
143 | } | |
ef4b7eee LC |
144 | |
145 | return 0; | |
5bb7910a AL |
146 | } |
147 | ||
a0a3fd60 GC |
/*
 * Longest downtime we accept for a migration, in nanoseconds.
 *
 * Nanoseconds are used because that is the finest resolution get_clock()
 * can deliver.  This is an internal unit only: anything shown to or taken
 * from the user must be expressed in seconds.
 */
static uint64_t max_downtime = 30 * 1000 * 1000;

/* Return the currently configured maximum downtime, in nanoseconds. */
uint64_t migrate_max_downtime(void)
{
    return max_downtime;
}
158 | ||
ef4b7eee LC |
159 | int do_migrate_set_downtime(Monitor *mon, const QDict *qdict, |
160 | QObject **ret_data) | |
2ea42952 | 161 | { |
2ea42952 | 162 | double d; |
2ea42952 | 163 | |
b0fbf7d3 MA |
164 | d = qdict_get_double(qdict, "value") * 1e9; |
165 | d = MAX(0, MIN(UINT64_MAX, d)); | |
2ea42952 | 166 | max_downtime = (uint64_t)d; |
ef4b7eee LC |
167 | |
168 | return 0; | |
2ea42952 GC |
169 | } |
170 | ||
c86a6683 LC |
171 | static void migrate_print_status(Monitor *mon, const char *name, |
172 | const QDict *status_dict) | |
5bb7910a | 173 | { |
c86a6683 LC |
174 | QDict *qdict; |
175 | ||
176 | qdict = qobject_to_qdict(qdict_get(status_dict, name)); | |
177 | ||
178 | monitor_printf(mon, "transferred %s: %" PRIu64 " kbytes\n", name, | |
179 | qdict_get_int(qdict, "transferred") >> 10); | |
180 | monitor_printf(mon, "remaining %s: %" PRIu64 " kbytes\n", name, | |
181 | qdict_get_int(qdict, "remaining") >> 10); | |
182 | monitor_printf(mon, "total %s: %" PRIu64 " kbytes\n", name, | |
183 | qdict_get_int(qdict, "total") >> 10); | |
184 | } | |
185 | ||
186 | void do_info_migrate_print(Monitor *mon, const QObject *data) | |
187 | { | |
188 | QDict *qdict; | |
189 | ||
190 | qdict = qobject_to_qdict(data); | |
191 | ||
192 | monitor_printf(mon, "Migration status: %s\n", | |
193 | qdict_get_str(qdict, "status")); | |
194 | ||
195 | if (qdict_haskey(qdict, "ram")) { | |
196 | migrate_print_status(mon, "ram", qdict); | |
197 | } | |
198 | ||
199 | if (qdict_haskey(qdict, "disk")) { | |
200 | migrate_print_status(mon, "disk", qdict); | |
201 | } | |
202 | } | |
203 | ||
204 | static void migrate_put_status(QDict *qdict, const char *name, | |
205 | uint64_t trans, uint64_t rem, uint64_t total) | |
206 | { | |
207 | QObject *obj; | |
208 | ||
209 | obj = qobject_from_jsonf("{ 'transferred': %" PRId64 ", " | |
210 | "'remaining': %" PRId64 ", " | |
211 | "'total': %" PRId64 " }", trans, rem, total); | |
c86a6683 LC |
212 | qdict_put_obj(qdict, name, obj); |
213 | } | |
214 | ||
c86a6683 LC |
215 | void do_info_migrate(Monitor *mon, QObject **ret_data) |
216 | { | |
217 | QDict *qdict; | |
5bb7910a | 218 | MigrationState *s = current_migration; |
376253ec | 219 | |
5bb7910a | 220 | if (s) { |
ff8d81d8 AL |
221 | switch (s->get_status(s)) { |
222 | case MIG_STATE_ACTIVE: | |
c86a6683 LC |
223 | qdict = qdict_new(); |
224 | qdict_put(qdict, "status", qstring_from_str("active")); | |
225 | ||
226 | migrate_put_status(qdict, "ram", ram_bytes_transferred(), | |
227 | ram_bytes_remaining(), ram_bytes_total()); | |
228 | ||
25f23643 | 229 | if (blk_mig_active()) { |
c86a6683 LC |
230 | migrate_put_status(qdict, "disk", blk_mig_bytes_transferred(), |
231 | blk_mig_bytes_remaining(), | |
232 | blk_mig_bytes_total()); | |
25f23643 | 233 | } |
c86a6683 LC |
234 | |
235 | *ret_data = QOBJECT(qdict); | |
ff8d81d8 AL |
236 | break; |
237 | case MIG_STATE_COMPLETED: | |
c86a6683 | 238 | *ret_data = qobject_from_jsonf("{ 'status': 'completed' }"); |
ff8d81d8 AL |
239 | break; |
240 | case MIG_STATE_ERROR: | |
c86a6683 | 241 | *ret_data = qobject_from_jsonf("{ 'status': 'failed' }"); |
ff8d81d8 AL |
242 | break; |
243 | case MIG_STATE_CANCELLED: | |
c86a6683 | 244 | *ret_data = qobject_from_jsonf("{ 'status': 'cancelled' }"); |
ff8d81d8 AL |
245 | break; |
246 | } | |
5bb7910a AL |
247 | } |
248 | } | |
249 | ||
065e2813 AL |
250 | /* shared migration helpers */ |
251 | ||
f327aa0c | 252 | void migrate_fd_monitor_suspend(FdMigrationState *s, Monitor *mon) |
731b0364 | 253 | { |
f327aa0c JK |
254 | s->mon = mon; |
255 | if (monitor_suspend(mon) == 0) { | |
d0f2c4c6 | 256 | DPRINTF("suspending monitor\n"); |
f327aa0c JK |
257 | } else { |
258 | monitor_printf(mon, "terminal does not allow synchronous " | |
cde76ee1 | 259 | "migration, continuing detached\n"); |
f327aa0c | 260 | } |
731b0364 AL |
261 | } |
262 | ||
065e2813 AL |
263 | void migrate_fd_error(FdMigrationState *s) |
264 | { | |
d0f2c4c6 | 265 | DPRINTF("setting error state\n"); |
065e2813 AL |
266 | s->state = MIG_STATE_ERROR; |
267 | migrate_fd_cleanup(s); | |
268 | } | |
269 | ||
41ef56e6 | 270 | int migrate_fd_cleanup(FdMigrationState *s) |
065e2813 | 271 | { |
41ef56e6 AL |
272 | int ret = 0; |
273 | ||
065e2813 AL |
274 | qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL); |
275 | ||
276 | if (s->file) { | |
d0f2c4c6 | 277 | DPRINTF("closing file\n"); |
41ef56e6 AL |
278 | if (qemu_fclose(s->file) != 0) { |
279 | ret = -1; | |
280 | } | |
5d39c799 | 281 | s->file = NULL; |
065e2813 AL |
282 | } |
283 | ||
284 | if (s->fd != -1) | |
285 | close(s->fd); | |
286 | ||
287 | /* Don't resume monitor until we've flushed all of the buffers */ | |
f327aa0c JK |
288 | if (s->mon) { |
289 | monitor_resume(s->mon); | |
290 | } | |
065e2813 AL |
291 | |
292 | s->fd = -1; | |
41ef56e6 AL |
293 | |
294 | return ret; | |
065e2813 AL |
295 | } |
296 | ||
297 | void migrate_fd_put_notify(void *opaque) | |
298 | { | |
299 | FdMigrationState *s = opaque; | |
300 | ||
301 | qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL); | |
302 | qemu_file_put_notify(s->file); | |
303 | } | |
304 | ||
305 | ssize_t migrate_fd_put_buffer(void *opaque, const void *data, size_t size) | |
306 | { | |
307 | FdMigrationState *s = opaque; | |
308 | ssize_t ret; | |
309 | ||
310 | do { | |
311 | ret = s->write(s, data, size); | |
95b134ea | 312 | } while (ret == -1 && ((s->get_error(s)) == EINTR)); |
065e2813 AL |
313 | |
314 | if (ret == -1) | |
315 | ret = -(s->get_error(s)); | |
316 | ||
317 | if (ret == -EAGAIN) | |
318 | qemu_set_fd_handler2(s->fd, NULL, NULL, migrate_fd_put_notify, s); | |
319 | ||
320 | return ret; | |
321 | } | |
322 | ||
323 | void migrate_fd_connect(FdMigrationState *s) | |
324 | { | |
325 | int ret; | |
326 | ||
327 | s->file = qemu_fopen_ops_buffered(s, | |
328 | s->bandwidth_limit, | |
329 | migrate_fd_put_buffer, | |
330 | migrate_fd_put_ready, | |
331 | migrate_fd_wait_for_unfreeze, | |
332 | migrate_fd_close); | |
333 | ||
d0f2c4c6 | 334 | DPRINTF("beginning savevm\n"); |
f327aa0c | 335 | ret = qemu_savevm_state_begin(s->mon, s->file, s->mig_state.blk, |
c163b5ca | 336 | s->mig_state.shared); |
065e2813 | 337 | if (ret < 0) { |
d0f2c4c6 | 338 | DPRINTF("failed, %d\n", ret); |
065e2813 AL |
339 | migrate_fd_error(s); |
340 | return; | |
341 | } | |
c163b5ca | 342 | |
065e2813 AL |
343 | migrate_fd_put_ready(s); |
344 | } | |
345 | ||
346 | void migrate_fd_put_ready(void *opaque) | |
347 | { | |
348 | FdMigrationState *s = opaque; | |
349 | ||
350 | if (s->state != MIG_STATE_ACTIVE) { | |
d0f2c4c6 | 351 | DPRINTF("put_ready returning because of non-active state\n"); |
065e2813 AL |
352 | return; |
353 | } | |
354 | ||
d0f2c4c6 | 355 | DPRINTF("iterate\n"); |
f327aa0c | 356 | if (qemu_savevm_state_iterate(s->mon, s->file) == 1) { |
b161d123 | 357 | int state; |
eeb34af9 AL |
358 | int old_vm_running = vm_running; |
359 | ||
d0f2c4c6 | 360 | DPRINTF("done iterating\n"); |
065e2813 AL |
361 | vm_stop(0); |
362 | ||
0884657b | 363 | qemu_aio_flush(); |
065e2813 | 364 | bdrv_flush_all(); |
f327aa0c | 365 | if ((qemu_savevm_state_complete(s->mon, s->file)) < 0) { |
eeb34af9 AL |
366 | if (old_vm_running) { |
367 | vm_start(); | |
368 | } | |
b161d123 AL |
369 | state = MIG_STATE_ERROR; |
370 | } else { | |
371 | state = MIG_STATE_COMPLETED; | |
372 | } | |
41ef56e6 AL |
373 | if (migrate_fd_cleanup(s) < 0) { |
374 | if (old_vm_running) { | |
375 | vm_start(); | |
376 | } | |
377 | state = MIG_STATE_ERROR; | |
378 | } | |
b161d123 | 379 | s->state = state; |
065e2813 AL |
380 | } |
381 | } | |
382 | ||
383 | int migrate_fd_get_status(MigrationState *mig_state) | |
384 | { | |
385 | FdMigrationState *s = migrate_to_fms(mig_state); | |
386 | return s->state; | |
387 | } | |
388 | ||
389 | void migrate_fd_cancel(MigrationState *mig_state) | |
390 | { | |
391 | FdMigrationState *s = migrate_to_fms(mig_state); | |
392 | ||
393 | if (s->state != MIG_STATE_ACTIVE) | |
394 | return; | |
395 | ||
d0f2c4c6 | 396 | DPRINTF("cancelling migration\n"); |
065e2813 AL |
397 | |
398 | s->state = MIG_STATE_CANCELLED; | |
f327aa0c | 399 | qemu_savevm_state_cancel(s->mon, s->file); |
065e2813 AL |
400 | |
401 | migrate_fd_cleanup(s); | |
402 | } | |
403 | ||
404 | void migrate_fd_release(MigrationState *mig_state) | |
405 | { | |
406 | FdMigrationState *s = migrate_to_fms(mig_state); | |
407 | ||
d0f2c4c6 | 408 | DPRINTF("releasing state\n"); |
065e2813 AL |
409 | |
410 | if (s->state == MIG_STATE_ACTIVE) { | |
411 | s->state = MIG_STATE_CANCELLED; | |
412 | migrate_fd_cleanup(s); | |
413 | } | |
faa1f8dd | 414 | qemu_free(s); |
065e2813 AL |
415 | } |
416 | ||
417 | void migrate_fd_wait_for_unfreeze(void *opaque) | |
418 | { | |
419 | FdMigrationState *s = opaque; | |
420 | int ret; | |
421 | ||
d0f2c4c6 | 422 | DPRINTF("wait for unfreeze\n"); |
065e2813 AL |
423 | if (s->state != MIG_STATE_ACTIVE) |
424 | return; | |
425 | ||
426 | do { | |
427 | fd_set wfds; | |
428 | ||
429 | FD_ZERO(&wfds); | |
430 | FD_SET(s->fd, &wfds); | |
431 | ||
432 | ret = select(s->fd + 1, NULL, &wfds, NULL, NULL); | |
433 | } while (ret == -1 && (s->get_error(s)) == EINTR); | |
434 | } | |
435 | ||
436 | int migrate_fd_close(void *opaque) | |
437 | { | |
438 | FdMigrationState *s = opaque; | |
e19252d3 UL |
439 | |
440 | qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL); | |
065e2813 AL |
441 | return s->close(s); |
442 | } |