blob: 85c81e098335f001c46af23b28b3a27225a08c75 [file] [log] [blame]
/*
 * QEMU live migration
 *
 * Copyright IBM, Corp. 2008
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */
13
14#include "qemu-common.h"
15#include "migration.h"
aliguori376253e2009-03-05 23:01:23 +000016#include "monitor.h"
aliguori065e2812008-11-11 16:46:33 +000017#include "buffered_file.h"
18#include "sysemu.h"
19#include "block.h"
20#include "qemu_socket.h"
Jan Kiszka25f23642009-11-30 18:21:21 +010021#include "block-migration.h"
Luiz Capitulinoc86a6682009-12-10 17:16:05 -020022#include "qemu-objects.h"
aliguori065e2812008-11-11 16:46:33 +000023
/* Uncomment the next line to trace migration progress on stdout. */
//#define DEBUG_MIGRATION

#ifndef DEBUG_MIGRATION
/* Tracing disabled: DPRINTF() expands to an empty statement. */
#define DPRINTF(fmt, ...) \
    do { } while (0)
#else
/* Tracing enabled: print the message with a "migration: " prefix. */
#define DPRINTF(fmt, ...) \
    do { printf("migration: " fmt, ## __VA_ARGS__); } while (0)
#endif

/* Migration speed throttling */
static uint32_t max_throttle = 32 << 20;
36
37static MigrationState *current_migration;
38
/*
 * Start accepting an incoming migration described by @uri.
 *
 * The prefix of @uri selects the transport: "tcp:" is always available,
 * while "exec:", "unix:" and "fd:" are only compiled in when WIN32 is not
 * defined.  The text after the prefix is handed to the transport-specific
 * starter.
 *
 * Returns the value of the selected starter, or -EPROTONOSUPPORT (after
 * printing a message on stderr) when no known prefix matches.
 */
int qemu_start_incoming_migration(const char *uri)
{
    const char *rest;

    if (strstart(uri, "tcp:", &rest)) {
        return tcp_start_incoming_migration(rest);
    }
#if !defined(WIN32)
    if (strstart(uri, "exec:", &rest)) {
        return exec_start_incoming_migration(rest);
    }
    if (strstart(uri, "unix:", &rest)) {
        return unix_start_incoming_migration(rest);
    }
    if (strstart(uri, "fd:", &rest)) {
        return fd_start_incoming_migration(rest);
    }
#endif

    fprintf(stderr, "unknown migration protocol: %s\n", uri);
    return -EPROTONOSUPPORT;
}
60
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020061int do_migrate(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +000062{
aliguori34c9dd82008-10-13 03:14:31 +000063 MigrationState *s = NULL;
64 const char *p;
Luiz Capitulinof18c16d2009-08-28 15:27:14 -030065 int detach = qdict_get_int(qdict, "detach");
66 const char *uri = qdict_get_str(qdict, "uri");
Jan Kiszka13024252009-11-30 18:21:19 +010067
68 if (current_migration &&
69 current_migration->get_status(current_migration) == MIG_STATE_ACTIVE) {
70 monitor_printf(mon, "migration already in progress\n");
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020071 return -1;
Jan Kiszka13024252009-11-30 18:21:19 +010072 }
73
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020074 if (strstart(uri, "tcp:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010075 s = tcp_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020076 (int)qdict_get_int(qdict, "blk"),
77 (int)qdict_get_int(qdict, "inc"));
aliguori065e2812008-11-11 16:46:33 +000078#if !defined(WIN32)
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020079 } else if (strstart(uri, "exec:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010080 s = exec_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020081 (int)qdict_get_int(qdict, "blk"),
82 (int)qdict_get_int(qdict, "inc"));
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020083 } else if (strstart(uri, "unix:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010084 s = unix_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020085 (int)qdict_get_int(qdict, "blk"),
86 (int)qdict_get_int(qdict, "inc"));
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020087 } else if (strstart(uri, "fd:", &p)) {
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020088 s = fd_start_outgoing_migration(mon, p, max_throttle, detach,
89 (int)qdict_get_int(qdict, "blk"),
90 (int)qdict_get_int(qdict, "inc"));
aliguori065e2812008-11-11 16:46:33 +000091#endif
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020092 } else {
aliguori376253e2009-03-05 23:01:23 +000093 monitor_printf(mon, "unknown migration protocol: %s\n", uri);
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020094 return -1;
aliguori34c9dd82008-10-13 03:14:31 +000095 }
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020096
97 if (s == NULL) {
98 monitor_printf(mon, "migration failed\n");
99 return -1;
100 }
101
102 if (current_migration) {
103 current_migration->release(current_migration);
104 }
105
106 current_migration = s;
107 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000108}
109
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200110int do_migrate_cancel(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000111{
112 MigrationState *s = current_migration;
113
114 if (s)
aliguoriff8d81d2008-10-24 22:10:31 +0000115 s->cancel(s);
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200116
117 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000118}
119
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200120int do_migrate_set_speed(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000121{
122 double d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400123 FdMigrationState *s;
aliguori5bb79102008-10-13 03:12:02 +0000124
Markus Armbruster5667c492010-01-25 14:23:04 +0100125 d = qdict_get_double(qdict, "value");
126 d = MAX(0, MIN(UINT32_MAX, d));
127 max_throttle = d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400128
Jan Kiszka5d39c792009-11-30 18:21:19 +0100129 s = migrate_to_fms(current_migration);
130 if (s && s->file) {
Glauber Costadaa91de2009-05-20 18:26:58 -0400131 qemu_file_set_rate_limit(s->file, max_throttle);
132 }
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200133
134 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000135}
136
/*
 * Longest time, in nanoseconds, that we are willing to let migration keep
 * things down.  Nanoseconds are used because that is the finest resolution
 * get_clock() can achieve; this is an internal unit only, and every
 * user-visible quantity must be expressed in seconds.
 */
static uint64_t max_downtime = 30 * 1000 * 1000;

/* Return the currently configured maximum downtime, in nanoseconds. */
uint64_t migrate_max_downtime(void)
{
    return max_downtime;
}
147
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200148int do_migrate_set_downtime(Monitor *mon, const QDict *qdict,
149 QObject **ret_data)
Glauber Costa2ea42952009-05-28 15:22:58 -0400150{
Glauber Costa2ea42952009-05-28 15:22:58 -0400151 double d;
152
Markus Armbrusterb0fbf7d2010-01-25 14:23:07 +0100153 d = qdict_get_double(qdict, "value") * 1e9;
154 d = MAX(0, MIN(UINT64_MAX, d));
Glauber Costa2ea42952009-05-28 15:22:58 -0400155 max_downtime = (uint64_t)d;
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200156
157 return 0;
Glauber Costa2ea42952009-05-28 15:22:58 -0400158}
159
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200160static void migrate_print_status(Monitor *mon, const char *name,
161 const QDict *status_dict)
aliguori5bb79102008-10-13 03:12:02 +0000162{
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200163 QDict *qdict;
164
165 qdict = qobject_to_qdict(qdict_get(status_dict, name));
166
167 monitor_printf(mon, "transferred %s: %" PRIu64 " kbytes\n", name,
168 qdict_get_int(qdict, "transferred") >> 10);
169 monitor_printf(mon, "remaining %s: %" PRIu64 " kbytes\n", name,
170 qdict_get_int(qdict, "remaining") >> 10);
171 monitor_printf(mon, "total %s: %" PRIu64 " kbytes\n", name,
172 qdict_get_int(qdict, "total") >> 10);
173}
174
175void do_info_migrate_print(Monitor *mon, const QObject *data)
176{
177 QDict *qdict;
178
179 qdict = qobject_to_qdict(data);
180
181 monitor_printf(mon, "Migration status: %s\n",
182 qdict_get_str(qdict, "status"));
183
184 if (qdict_haskey(qdict, "ram")) {
185 migrate_print_status(mon, "ram", qdict);
186 }
187
188 if (qdict_haskey(qdict, "disk")) {
189 migrate_print_status(mon, "disk", qdict);
190 }
191}
192
193static void migrate_put_status(QDict *qdict, const char *name,
194 uint64_t trans, uint64_t rem, uint64_t total)
195{
196 QObject *obj;
197
198 obj = qobject_from_jsonf("{ 'transferred': %" PRId64 ", "
199 "'remaining': %" PRId64 ", "
200 "'total': %" PRId64 " }", trans, rem, total);
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200201 qdict_put_obj(qdict, name, obj);
202}
203
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200204void do_info_migrate(Monitor *mon, QObject **ret_data)
205{
206 QDict *qdict;
aliguori5bb79102008-10-13 03:12:02 +0000207 MigrationState *s = current_migration;
aliguori376253e2009-03-05 23:01:23 +0000208
aliguori5bb79102008-10-13 03:12:02 +0000209 if (s) {
aliguoriff8d81d2008-10-24 22:10:31 +0000210 switch (s->get_status(s)) {
211 case MIG_STATE_ACTIVE:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200212 qdict = qdict_new();
213 qdict_put(qdict, "status", qstring_from_str("active"));
214
215 migrate_put_status(qdict, "ram", ram_bytes_transferred(),
216 ram_bytes_remaining(), ram_bytes_total());
217
Jan Kiszka25f23642009-11-30 18:21:21 +0100218 if (blk_mig_active()) {
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200219 migrate_put_status(qdict, "disk", blk_mig_bytes_transferred(),
220 blk_mig_bytes_remaining(),
221 blk_mig_bytes_total());
Jan Kiszka25f23642009-11-30 18:21:21 +0100222 }
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200223
224 *ret_data = QOBJECT(qdict);
aliguoriff8d81d2008-10-24 22:10:31 +0000225 break;
226 case MIG_STATE_COMPLETED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200227 *ret_data = qobject_from_jsonf("{ 'status': 'completed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000228 break;
229 case MIG_STATE_ERROR:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200230 *ret_data = qobject_from_jsonf("{ 'status': 'failed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000231 break;
232 case MIG_STATE_CANCELLED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200233 *ret_data = qobject_from_jsonf("{ 'status': 'cancelled' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000234 break;
235 }
aliguori5bb79102008-10-13 03:12:02 +0000236 }
237}
238
/* shared migration helpers */
240
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100241void migrate_fd_monitor_suspend(FdMigrationState *s, Monitor *mon)
aliguori731b0362009-03-05 23:01:42 +0000242{
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100243 s->mon = mon;
244 if (monitor_suspend(mon) == 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300245 DPRINTF("suspending monitor\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100246 } else {
247 monitor_printf(mon, "terminal does not allow synchronous "
aliguoricde76ee2009-03-05 23:01:51 +0000248 "migration, continuing detached\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100249 }
aliguori731b0362009-03-05 23:01:42 +0000250}
251
aliguori065e2812008-11-11 16:46:33 +0000252void migrate_fd_error(FdMigrationState *s)
253{
malcd0f2c4c2010-02-07 02:03:50 +0300254 DPRINTF("setting error state\n");
aliguori065e2812008-11-11 16:46:33 +0000255 s->state = MIG_STATE_ERROR;
256 migrate_fd_cleanup(s);
257}
258
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500259int migrate_fd_cleanup(FdMigrationState *s)
aliguori065e2812008-11-11 16:46:33 +0000260{
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500261 int ret = 0;
262
aliguori065e2812008-11-11 16:46:33 +0000263 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
264
265 if (s->file) {
malcd0f2c4c2010-02-07 02:03:50 +0300266 DPRINTF("closing file\n");
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500267 if (qemu_fclose(s->file) != 0) {
268 ret = -1;
269 }
Jan Kiszka5d39c792009-11-30 18:21:19 +0100270 s->file = NULL;
aliguori065e2812008-11-11 16:46:33 +0000271 }
272
273 if (s->fd != -1)
274 close(s->fd);
275
276 /* Don't resume monitor until we've flushed all of the buffers */
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100277 if (s->mon) {
278 monitor_resume(s->mon);
279 }
aliguori065e2812008-11-11 16:46:33 +0000280
281 s->fd = -1;
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500282
283 return ret;
aliguori065e2812008-11-11 16:46:33 +0000284}
285
286void migrate_fd_put_notify(void *opaque)
287{
288 FdMigrationState *s = opaque;
289
290 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
291 qemu_file_put_notify(s->file);
292}
293
294ssize_t migrate_fd_put_buffer(void *opaque, const void *data, size_t size)
295{
296 FdMigrationState *s = opaque;
297 ssize_t ret;
298
299 do {
300 ret = s->write(s, data, size);
Uri Lublin95b134e2009-05-19 14:08:53 +0300301 } while (ret == -1 && ((s->get_error(s)) == EINTR));
aliguori065e2812008-11-11 16:46:33 +0000302
303 if (ret == -1)
304 ret = -(s->get_error(s));
305
306 if (ret == -EAGAIN)
307 qemu_set_fd_handler2(s->fd, NULL, NULL, migrate_fd_put_notify, s);
308
309 return ret;
310}
311
312void migrate_fd_connect(FdMigrationState *s)
313{
314 int ret;
315
316 s->file = qemu_fopen_ops_buffered(s,
317 s->bandwidth_limit,
318 migrate_fd_put_buffer,
319 migrate_fd_put_ready,
320 migrate_fd_wait_for_unfreeze,
321 migrate_fd_close);
322
malcd0f2c4c2010-02-07 02:03:50 +0300323 DPRINTF("beginning savevm\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100324 ret = qemu_savevm_state_begin(s->mon, s->file, s->mig_state.blk,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200325 s->mig_state.shared);
aliguori065e2812008-11-11 16:46:33 +0000326 if (ret < 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300327 DPRINTF("failed, %d\n", ret);
aliguori065e2812008-11-11 16:46:33 +0000328 migrate_fd_error(s);
329 return;
330 }
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200331
aliguori065e2812008-11-11 16:46:33 +0000332 migrate_fd_put_ready(s);
333}
334
335void migrate_fd_put_ready(void *opaque)
336{
337 FdMigrationState *s = opaque;
338
339 if (s->state != MIG_STATE_ACTIVE) {
malcd0f2c4c2010-02-07 02:03:50 +0300340 DPRINTF("put_ready returning because of non-active state\n");
aliguori065e2812008-11-11 16:46:33 +0000341 return;
342 }
343
malcd0f2c4c2010-02-07 02:03:50 +0300344 DPRINTF("iterate\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100345 if (qemu_savevm_state_iterate(s->mon, s->file) == 1) {
aliguorib161d122009-04-05 19:30:33 +0000346 int state;
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500347 int old_vm_running = vm_running;
348
malcd0f2c4c2010-02-07 02:03:50 +0300349 DPRINTF("done iterating\n");
aliguori065e2812008-11-11 16:46:33 +0000350 vm_stop(0);
351
Glauber Costa08846572009-07-06 09:32:09 -0400352 qemu_aio_flush();
aliguori065e2812008-11-11 16:46:33 +0000353 bdrv_flush_all();
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100354 if ((qemu_savevm_state_complete(s->mon, s->file)) < 0) {
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500355 if (old_vm_running) {
356 vm_start();
357 }
aliguorib161d122009-04-05 19:30:33 +0000358 state = MIG_STATE_ERROR;
359 } else {
360 state = MIG_STATE_COMPLETED;
361 }
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500362 if (migrate_fd_cleanup(s) < 0) {
363 if (old_vm_running) {
364 vm_start();
365 }
366 state = MIG_STATE_ERROR;
367 }
aliguorib161d122009-04-05 19:30:33 +0000368 s->state = state;
aliguori065e2812008-11-11 16:46:33 +0000369 }
370}
371
372int migrate_fd_get_status(MigrationState *mig_state)
373{
374 FdMigrationState *s = migrate_to_fms(mig_state);
375 return s->state;
376}
377
378void migrate_fd_cancel(MigrationState *mig_state)
379{
380 FdMigrationState *s = migrate_to_fms(mig_state);
381
382 if (s->state != MIG_STATE_ACTIVE)
383 return;
384
malcd0f2c4c2010-02-07 02:03:50 +0300385 DPRINTF("cancelling migration\n");
aliguori065e2812008-11-11 16:46:33 +0000386
387 s->state = MIG_STATE_CANCELLED;
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100388 qemu_savevm_state_cancel(s->mon, s->file);
aliguori065e2812008-11-11 16:46:33 +0000389
390 migrate_fd_cleanup(s);
391}
392
393void migrate_fd_release(MigrationState *mig_state)
394{
395 FdMigrationState *s = migrate_to_fms(mig_state);
396
malcd0f2c4c2010-02-07 02:03:50 +0300397 DPRINTF("releasing state\n");
aliguori065e2812008-11-11 16:46:33 +0000398
399 if (s->state == MIG_STATE_ACTIVE) {
400 s->state = MIG_STATE_CANCELLED;
401 migrate_fd_cleanup(s);
402 }
Yoshiaki Tamurafaa1f8d2010-06-09 14:44:31 +0900403 qemu_free(s);
aliguori065e2812008-11-11 16:46:33 +0000404}
405
406void migrate_fd_wait_for_unfreeze(void *opaque)
407{
408 FdMigrationState *s = opaque;
409 int ret;
410
malcd0f2c4c2010-02-07 02:03:50 +0300411 DPRINTF("wait for unfreeze\n");
aliguori065e2812008-11-11 16:46:33 +0000412 if (s->state != MIG_STATE_ACTIVE)
413 return;
414
415 do {
416 fd_set wfds;
417
418 FD_ZERO(&wfds);
419 FD_SET(s->fd, &wfds);
420
421 ret = select(s->fd + 1, NULL, &wfds, NULL, NULL);
422 } while (ret == -1 && (s->get_error(s)) == EINTR);
423}
424
425int migrate_fd_close(void *opaque)
426{
427 FdMigrationState *s = opaque;
Uri Lubline19252d2009-06-08 14:28:01 +0300428
429 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
aliguori065e2812008-11-11 16:46:33 +0000430 return s->close(s);
431}