blob: b49964c5e3a3c81a4b8b8d87be8c7923d0f4d21b [file] [log] [blame]
/*
 * QEMU live migration
 *
 * Copyright IBM, Corp. 2008
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */
13
14#include "qemu-common.h"
15#include "migration.h"
aliguori376253e2009-03-05 23:01:23 +000016#include "monitor.h"
aliguori065e2812008-11-11 16:46:33 +000017#include "buffered_file.h"
18#include "sysemu.h"
19#include "block.h"
20#include "qemu_socket.h"
Jan Kiszka25f23642009-11-30 18:21:21 +010021#include "block-migration.h"
Luiz Capitulinoc86a6682009-12-10 17:16:05 -020022#include "qemu-objects.h"
aliguori065e2812008-11-11 16:46:33 +000023
/* Uncomment the next line to get migration trace output on stdout. */
//#define DEBUG_MIGRATION

/*
 * DPRINTF(fmt, ...): when DEBUG_MIGRATION is defined, printf() the message
 * prefixed with "migration: "; otherwise expand to an empty statement.
 * Both forms are wrapped in do { } while (0) so they behave as a single
 * statement after an unbraced if/else.
 */
#ifndef DEBUG_MIGRATION
#define DPRINTF(fmt, ...) \
    do { } while (0)
#else
#define DPRINTF(fmt, ...) \
    do { printf("migration: " fmt, ## __VA_ARGS__); } while (0)
#endif
aliguori5bb79102008-10-13 03:12:02 +000033
34/* Migration speed throttling */
35static uint32_t max_throttle = (32 << 20);
36
37static MigrationState *current_migration;
38
/*
 * Dispatch an incoming-migration request to the transport named by the
 * prefix of @uri ("tcp:" everywhere; "exec:", "unix:" and "fd:" only when
 * not building for WIN32).  The remainder of the URI after the prefix is
 * passed to the transport-specific starter.
 *
 * Returns whatever the selected transport starter returns, or
 * -EPROTONOSUPPORT (after printing a message to stderr) when no known
 * prefix matches.
 */
int qemu_start_incoming_migration(const char *uri)
{
    const char *rest;

    if (strstart(uri, "tcp:", &rest)) {
        return tcp_start_incoming_migration(rest);
    }
#if !defined(WIN32)
    if (strstart(uri, "exec:", &rest)) {
        return exec_start_incoming_migration(rest);
    }
    if (strstart(uri, "unix:", &rest)) {
        return unix_start_incoming_migration(rest);
    }
    if (strstart(uri, "fd:", &rest)) {
        return fd_start_incoming_migration(rest);
    }
#endif

    fprintf(stderr, "unknown migration protocol: %s\n", uri);
    return -EPROTONOSUPPORT;
}
60
Juan Quintela511c0232010-06-09 14:10:55 +020061void process_incoming_migration(QEMUFile *f)
62{
63 if (qemu_loadvm_state(f) < 0) {
64 fprintf(stderr, "load of migration failed\n");
65 exit(0);
66 }
67 qemu_announce_self();
68 DPRINTF("successfully loaded vm state\n");
69
70 if (autostart)
71 vm_start();
72}
73
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020074int do_migrate(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +000075{
aliguori34c9dd82008-10-13 03:14:31 +000076 MigrationState *s = NULL;
77 const char *p;
Luiz Capitulinof18c16d2009-08-28 15:27:14 -030078 int detach = qdict_get_int(qdict, "detach");
79 const char *uri = qdict_get_str(qdict, "uri");
Jan Kiszka13024252009-11-30 18:21:19 +010080
81 if (current_migration &&
82 current_migration->get_status(current_migration) == MIG_STATE_ACTIVE) {
83 monitor_printf(mon, "migration already in progress\n");
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020084 return -1;
Jan Kiszka13024252009-11-30 18:21:19 +010085 }
86
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020087 if (strstart(uri, "tcp:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010088 s = tcp_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020089 (int)qdict_get_int(qdict, "blk"),
90 (int)qdict_get_int(qdict, "inc"));
aliguori065e2812008-11-11 16:46:33 +000091#if !defined(WIN32)
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020092 } else if (strstart(uri, "exec:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010093 s = exec_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020094 (int)qdict_get_int(qdict, "blk"),
95 (int)qdict_get_int(qdict, "inc"));
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020096 } else if (strstart(uri, "unix:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010097 s = unix_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020098 (int)qdict_get_int(qdict, "blk"),
99 (int)qdict_get_int(qdict, "inc"));
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -0200100 } else if (strstart(uri, "fd:", &p)) {
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200101 s = fd_start_outgoing_migration(mon, p, max_throttle, detach,
102 (int)qdict_get_int(qdict, "blk"),
103 (int)qdict_get_int(qdict, "inc"));
aliguori065e2812008-11-11 16:46:33 +0000104#endif
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -0200105 } else {
aliguori376253e2009-03-05 23:01:23 +0000106 monitor_printf(mon, "unknown migration protocol: %s\n", uri);
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -0200107 return -1;
aliguori34c9dd82008-10-13 03:14:31 +0000108 }
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -0200109
110 if (s == NULL) {
111 monitor_printf(mon, "migration failed\n");
112 return -1;
113 }
114
115 if (current_migration) {
116 current_migration->release(current_migration);
117 }
118
119 current_migration = s;
120 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000121}
122
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200123int do_migrate_cancel(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000124{
125 MigrationState *s = current_migration;
126
127 if (s)
aliguoriff8d81d2008-10-24 22:10:31 +0000128 s->cancel(s);
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200129
130 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000131}
132
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200133int do_migrate_set_speed(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000134{
135 double d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400136 FdMigrationState *s;
aliguori5bb79102008-10-13 03:12:02 +0000137
Markus Armbruster5667c492010-01-25 14:23:04 +0100138 d = qdict_get_double(qdict, "value");
139 d = MAX(0, MIN(UINT32_MAX, d));
140 max_throttle = d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400141
Jan Kiszka5d39c792009-11-30 18:21:19 +0100142 s = migrate_to_fms(current_migration);
143 if (s && s->file) {
Glauber Costadaa91de2009-05-20 18:26:58 -0400144 qemu_file_set_rate_limit(s->file, max_throttle);
145 }
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200146
147 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000148}
149
/*
 * Number of nanoseconds we are willing to have the guest down for during
 * migration.  Nanoseconds are used because that is the finest resolution
 * get_clock() can achieve; this is an internal unit only, anything shown
 * to the user must be expressed in seconds.
 * The default of 30,000,000 ns equals 30 milliseconds.
 */
static uint64_t max_downtime = 30 * 1000 * 1000;

/* Return the currently configured maximum downtime, in nanoseconds. */
uint64_t migrate_max_downtime(void)
{
    const uint64_t downtime_ns = max_downtime;

    return downtime_ns;
}
160
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200161int do_migrate_set_downtime(Monitor *mon, const QDict *qdict,
162 QObject **ret_data)
Glauber Costa2ea42952009-05-28 15:22:58 -0400163{
Glauber Costa2ea42952009-05-28 15:22:58 -0400164 double d;
165
Markus Armbrusterb0fbf7d2010-01-25 14:23:07 +0100166 d = qdict_get_double(qdict, "value") * 1e9;
167 d = MAX(0, MIN(UINT64_MAX, d));
Glauber Costa2ea42952009-05-28 15:22:58 -0400168 max_downtime = (uint64_t)d;
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200169
170 return 0;
Glauber Costa2ea42952009-05-28 15:22:58 -0400171}
172
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200173static void migrate_print_status(Monitor *mon, const char *name,
174 const QDict *status_dict)
aliguori5bb79102008-10-13 03:12:02 +0000175{
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200176 QDict *qdict;
177
178 qdict = qobject_to_qdict(qdict_get(status_dict, name));
179
180 monitor_printf(mon, "transferred %s: %" PRIu64 " kbytes\n", name,
181 qdict_get_int(qdict, "transferred") >> 10);
182 monitor_printf(mon, "remaining %s: %" PRIu64 " kbytes\n", name,
183 qdict_get_int(qdict, "remaining") >> 10);
184 monitor_printf(mon, "total %s: %" PRIu64 " kbytes\n", name,
185 qdict_get_int(qdict, "total") >> 10);
186}
187
188void do_info_migrate_print(Monitor *mon, const QObject *data)
189{
190 QDict *qdict;
191
192 qdict = qobject_to_qdict(data);
193
194 monitor_printf(mon, "Migration status: %s\n",
195 qdict_get_str(qdict, "status"));
196
197 if (qdict_haskey(qdict, "ram")) {
198 migrate_print_status(mon, "ram", qdict);
199 }
200
201 if (qdict_haskey(qdict, "disk")) {
202 migrate_print_status(mon, "disk", qdict);
203 }
204}
205
206static void migrate_put_status(QDict *qdict, const char *name,
207 uint64_t trans, uint64_t rem, uint64_t total)
208{
209 QObject *obj;
210
211 obj = qobject_from_jsonf("{ 'transferred': %" PRId64 ", "
212 "'remaining': %" PRId64 ", "
213 "'total': %" PRId64 " }", trans, rem, total);
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200214 qdict_put_obj(qdict, name, obj);
215}
216
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200217void do_info_migrate(Monitor *mon, QObject **ret_data)
218{
219 QDict *qdict;
aliguori5bb79102008-10-13 03:12:02 +0000220 MigrationState *s = current_migration;
aliguori376253e2009-03-05 23:01:23 +0000221
aliguori5bb79102008-10-13 03:12:02 +0000222 if (s) {
aliguoriff8d81d2008-10-24 22:10:31 +0000223 switch (s->get_status(s)) {
224 case MIG_STATE_ACTIVE:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200225 qdict = qdict_new();
226 qdict_put(qdict, "status", qstring_from_str("active"));
227
228 migrate_put_status(qdict, "ram", ram_bytes_transferred(),
229 ram_bytes_remaining(), ram_bytes_total());
230
Jan Kiszka25f23642009-11-30 18:21:21 +0100231 if (blk_mig_active()) {
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200232 migrate_put_status(qdict, "disk", blk_mig_bytes_transferred(),
233 blk_mig_bytes_remaining(),
234 blk_mig_bytes_total());
Jan Kiszka25f23642009-11-30 18:21:21 +0100235 }
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200236
237 *ret_data = QOBJECT(qdict);
aliguoriff8d81d2008-10-24 22:10:31 +0000238 break;
239 case MIG_STATE_COMPLETED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200240 *ret_data = qobject_from_jsonf("{ 'status': 'completed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000241 break;
242 case MIG_STATE_ERROR:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200243 *ret_data = qobject_from_jsonf("{ 'status': 'failed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000244 break;
245 case MIG_STATE_CANCELLED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200246 *ret_data = qobject_from_jsonf("{ 'status': 'cancelled' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000247 break;
248 }
aliguori5bb79102008-10-13 03:12:02 +0000249 }
250}
251
aliguori065e2812008-11-11 16:46:33 +0000252/* shared migration helpers */
253
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100254void migrate_fd_monitor_suspend(FdMigrationState *s, Monitor *mon)
aliguori731b0362009-03-05 23:01:42 +0000255{
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100256 s->mon = mon;
257 if (monitor_suspend(mon) == 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300258 DPRINTF("suspending monitor\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100259 } else {
260 monitor_printf(mon, "terminal does not allow synchronous "
aliguoricde76ee2009-03-05 23:01:51 +0000261 "migration, continuing detached\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100262 }
aliguori731b0362009-03-05 23:01:42 +0000263}
264
aliguori065e2812008-11-11 16:46:33 +0000265void migrate_fd_error(FdMigrationState *s)
266{
malcd0f2c4c2010-02-07 02:03:50 +0300267 DPRINTF("setting error state\n");
aliguori065e2812008-11-11 16:46:33 +0000268 s->state = MIG_STATE_ERROR;
269 migrate_fd_cleanup(s);
270}
271
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500272int migrate_fd_cleanup(FdMigrationState *s)
aliguori065e2812008-11-11 16:46:33 +0000273{
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500274 int ret = 0;
275
aliguori065e2812008-11-11 16:46:33 +0000276 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
277
278 if (s->file) {
malcd0f2c4c2010-02-07 02:03:50 +0300279 DPRINTF("closing file\n");
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500280 if (qemu_fclose(s->file) != 0) {
281 ret = -1;
282 }
Jan Kiszka5d39c792009-11-30 18:21:19 +0100283 s->file = NULL;
aliguori065e2812008-11-11 16:46:33 +0000284 }
285
286 if (s->fd != -1)
287 close(s->fd);
288
289 /* Don't resume monitor until we've flushed all of the buffers */
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100290 if (s->mon) {
291 monitor_resume(s->mon);
292 }
aliguori065e2812008-11-11 16:46:33 +0000293
294 s->fd = -1;
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500295
296 return ret;
aliguori065e2812008-11-11 16:46:33 +0000297}
298
299void migrate_fd_put_notify(void *opaque)
300{
301 FdMigrationState *s = opaque;
302
303 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
304 qemu_file_put_notify(s->file);
305}
306
307ssize_t migrate_fd_put_buffer(void *opaque, const void *data, size_t size)
308{
309 FdMigrationState *s = opaque;
310 ssize_t ret;
311
312 do {
313 ret = s->write(s, data, size);
Uri Lublin95b134e2009-05-19 14:08:53 +0300314 } while (ret == -1 && ((s->get_error(s)) == EINTR));
aliguori065e2812008-11-11 16:46:33 +0000315
316 if (ret == -1)
317 ret = -(s->get_error(s));
318
319 if (ret == -EAGAIN)
320 qemu_set_fd_handler2(s->fd, NULL, NULL, migrate_fd_put_notify, s);
321
322 return ret;
323}
324
325void migrate_fd_connect(FdMigrationState *s)
326{
327 int ret;
328
329 s->file = qemu_fopen_ops_buffered(s,
330 s->bandwidth_limit,
331 migrate_fd_put_buffer,
332 migrate_fd_put_ready,
333 migrate_fd_wait_for_unfreeze,
334 migrate_fd_close);
335
malcd0f2c4c2010-02-07 02:03:50 +0300336 DPRINTF("beginning savevm\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100337 ret = qemu_savevm_state_begin(s->mon, s->file, s->mig_state.blk,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200338 s->mig_state.shared);
aliguori065e2812008-11-11 16:46:33 +0000339 if (ret < 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300340 DPRINTF("failed, %d\n", ret);
aliguori065e2812008-11-11 16:46:33 +0000341 migrate_fd_error(s);
342 return;
343 }
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200344
aliguori065e2812008-11-11 16:46:33 +0000345 migrate_fd_put_ready(s);
346}
347
348void migrate_fd_put_ready(void *opaque)
349{
350 FdMigrationState *s = opaque;
351
352 if (s->state != MIG_STATE_ACTIVE) {
malcd0f2c4c2010-02-07 02:03:50 +0300353 DPRINTF("put_ready returning because of non-active state\n");
aliguori065e2812008-11-11 16:46:33 +0000354 return;
355 }
356
malcd0f2c4c2010-02-07 02:03:50 +0300357 DPRINTF("iterate\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100358 if (qemu_savevm_state_iterate(s->mon, s->file) == 1) {
aliguorib161d122009-04-05 19:30:33 +0000359 int state;
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500360 int old_vm_running = vm_running;
361
malcd0f2c4c2010-02-07 02:03:50 +0300362 DPRINTF("done iterating\n");
aliguori065e2812008-11-11 16:46:33 +0000363 vm_stop(0);
364
Glauber Costa08846572009-07-06 09:32:09 -0400365 qemu_aio_flush();
aliguori065e2812008-11-11 16:46:33 +0000366 bdrv_flush_all();
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100367 if ((qemu_savevm_state_complete(s->mon, s->file)) < 0) {
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500368 if (old_vm_running) {
369 vm_start();
370 }
aliguorib161d122009-04-05 19:30:33 +0000371 state = MIG_STATE_ERROR;
372 } else {
373 state = MIG_STATE_COMPLETED;
374 }
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500375 if (migrate_fd_cleanup(s) < 0) {
376 if (old_vm_running) {
377 vm_start();
378 }
379 state = MIG_STATE_ERROR;
380 }
aliguorib161d122009-04-05 19:30:33 +0000381 s->state = state;
aliguori065e2812008-11-11 16:46:33 +0000382 }
383}
384
385int migrate_fd_get_status(MigrationState *mig_state)
386{
387 FdMigrationState *s = migrate_to_fms(mig_state);
388 return s->state;
389}
390
391void migrate_fd_cancel(MigrationState *mig_state)
392{
393 FdMigrationState *s = migrate_to_fms(mig_state);
394
395 if (s->state != MIG_STATE_ACTIVE)
396 return;
397
malcd0f2c4c2010-02-07 02:03:50 +0300398 DPRINTF("cancelling migration\n");
aliguori065e2812008-11-11 16:46:33 +0000399
400 s->state = MIG_STATE_CANCELLED;
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100401 qemu_savevm_state_cancel(s->mon, s->file);
aliguori065e2812008-11-11 16:46:33 +0000402
403 migrate_fd_cleanup(s);
404}
405
406void migrate_fd_release(MigrationState *mig_state)
407{
408 FdMigrationState *s = migrate_to_fms(mig_state);
409
malcd0f2c4c2010-02-07 02:03:50 +0300410 DPRINTF("releasing state\n");
aliguori065e2812008-11-11 16:46:33 +0000411
412 if (s->state == MIG_STATE_ACTIVE) {
413 s->state = MIG_STATE_CANCELLED;
414 migrate_fd_cleanup(s);
415 }
Yoshiaki Tamurafaa1f8d2010-06-09 14:44:31 +0900416 qemu_free(s);
aliguori065e2812008-11-11 16:46:33 +0000417}
418
419void migrate_fd_wait_for_unfreeze(void *opaque)
420{
421 FdMigrationState *s = opaque;
422 int ret;
423
malcd0f2c4c2010-02-07 02:03:50 +0300424 DPRINTF("wait for unfreeze\n");
aliguori065e2812008-11-11 16:46:33 +0000425 if (s->state != MIG_STATE_ACTIVE)
426 return;
427
428 do {
429 fd_set wfds;
430
431 FD_ZERO(&wfds);
432 FD_SET(s->fd, &wfds);
433
434 ret = select(s->fd + 1, NULL, &wfds, NULL, NULL);
435 } while (ret == -1 && (s->get_error(s)) == EINTR);
436}
437
438int migrate_fd_close(void *opaque)
439{
440 FdMigrationState *s = opaque;
Uri Lubline19252d2009-06-08 14:28:01 +0300441
442 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
aliguori065e2812008-11-11 16:46:33 +0000443 return s->close(s);
444}