blob: f20315fcfd4f4f5331545078617684860fff39b4 [file] [log] [blame]
/*
 * QEMU live migration
 *
 * Copyright IBM, Corp. 2008
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */
13
14#include "qemu-common.h"
15#include "migration.h"
aliguori376253e2009-03-05 23:01:23 +000016#include "monitor.h"
aliguori065e2812008-11-11 16:46:33 +000017#include "buffered_file.h"
18#include "sysemu.h"
19#include "block.h"
20#include "qemu_socket.h"
Jan Kiszka25f23642009-11-30 18:21:21 +010021#include "block-migration.h"
Luiz Capitulinoc86a6682009-12-10 17:16:05 -020022#include "qemu-objects.h"
aliguori065e2812008-11-11 16:46:33 +000023
24//#define DEBUG_MIGRATION
25
/*
 * DPRINTF(): debug tracing for this file.
 *
 * With DEBUG_MIGRATION defined, the message is printed on stdout with a
 * "migration: " prefix.  Otherwise the macro expands to an empty statement,
 * so its arguments are not evaluated.
 */
#if defined(DEBUG_MIGRATION)
#define DPRINTF(fmt, ...)                                   \
    do {                                                    \
        printf("migration: " fmt, ## __VA_ARGS__);          \
    } while (0)
#else
#define DPRINTF(fmt, ...)                                   \
    do {                                                    \
    } while (0)
#endif
aliguori5bb79102008-10-13 03:12:02 +000033
34/* Migration speed throttling */
35static uint32_t max_throttle = (32 << 20);
36
37static MigrationState *current_migration;
38
/*
 * Start an incoming migration for the given URI.
 *
 * The URI prefix selects the transport, and the text following the prefix
 * is handed to that transport's start routine.  When WIN32 is defined only
 * "tcp:" is recognised.  A URI with no recognised prefix is reported on
 * stderr.
 */
void qemu_start_incoming_migration(const char *uri)
{
    const char *rest;

    if (strstart(uri, "tcp:", &rest)) {
        tcp_start_incoming_migration(rest);
        return;
    }

#if !defined(WIN32)
    if (strstart(uri, "exec:", &rest)) {
        exec_start_incoming_migration(rest);
        return;
    }

    if (strstart(uri, "unix:", &rest)) {
        unix_start_incoming_migration(rest);
        return;
    }

    if (strstart(uri, "fd:", &rest)) {
        fd_start_incoming_migration(rest);
        return;
    }
#endif

    fprintf(stderr, "unknown migration protocol: %s\n", uri);
}
56
Luiz Capitulino5f79da02009-10-16 12:23:45 -030057void do_migrate(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +000058{
aliguori34c9dd82008-10-13 03:14:31 +000059 MigrationState *s = NULL;
60 const char *p;
Luiz Capitulinof18c16d2009-08-28 15:27:14 -030061 int detach = qdict_get_int(qdict, "detach");
62 const char *uri = qdict_get_str(qdict, "uri");
Jan Kiszka13024252009-11-30 18:21:19 +010063
64 if (current_migration &&
65 current_migration->get_status(current_migration) == MIG_STATE_ACTIVE) {
66 monitor_printf(mon, "migration already in progress\n");
67 return;
68 }
69
aliguori34c9dd82008-10-13 03:14:31 +000070 if (strstart(uri, "tcp:", &p))
Jan Kiszkaf327aa02009-11-30 18:21:21 +010071 s = tcp_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020072 (int)qdict_get_int(qdict, "blk"),
73 (int)qdict_get_int(qdict, "inc"));
aliguori065e2812008-11-11 16:46:33 +000074#if !defined(WIN32)
75 else if (strstart(uri, "exec:", &p))
Jan Kiszkaf327aa02009-11-30 18:21:21 +010076 s = exec_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020077 (int)qdict_get_int(qdict, "blk"),
78 (int)qdict_get_int(qdict, "inc"));
Chris Lalancette4951f652009-08-05 17:24:29 +020079 else if (strstart(uri, "unix:", &p))
Jan Kiszkaf327aa02009-11-30 18:21:21 +010080 s = unix_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020081 (int)qdict_get_int(qdict, "blk"),
82 (int)qdict_get_int(qdict, "inc"));
Paolo Bonzini5ac1fad2009-08-18 15:56:25 +020083 else if (strstart(uri, "fd:", &p))
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020084 s = fd_start_outgoing_migration(mon, p, max_throttle, detach,
85 (int)qdict_get_int(qdict, "blk"),
86 (int)qdict_get_int(qdict, "inc"));
aliguori065e2812008-11-11 16:46:33 +000087#endif
aliguori34c9dd82008-10-13 03:14:31 +000088 else
aliguori376253e2009-03-05 23:01:23 +000089 monitor_printf(mon, "unknown migration protocol: %s\n", uri);
aliguori34c9dd82008-10-13 03:14:31 +000090
91 if (s == NULL)
aliguori376253e2009-03-05 23:01:23 +000092 monitor_printf(mon, "migration failed\n");
aliguori34c9dd82008-10-13 03:14:31 +000093 else {
aliguoriff8d81d2008-10-24 22:10:31 +000094 if (current_migration)
95 current_migration->release(current_migration);
aliguori34c9dd82008-10-13 03:14:31 +000096
aliguoriff8d81d2008-10-24 22:10:31 +000097 current_migration = s;
aliguori34c9dd82008-10-13 03:14:31 +000098 }
aliguori5bb79102008-10-13 03:12:02 +000099}
100
Luiz Capitulino911d2962009-10-16 12:23:47 -0300101void do_migrate_cancel(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000102{
103 MigrationState *s = current_migration;
104
105 if (s)
aliguoriff8d81d2008-10-24 22:10:31 +0000106 s->cancel(s);
aliguori5bb79102008-10-13 03:12:02 +0000107}
108
Markus Armbruster5fd90832010-01-25 14:23:05 +0100109void do_migrate_set_speed(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000110{
111 double d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400112 FdMigrationState *s;
aliguori5bb79102008-10-13 03:12:02 +0000113
Markus Armbruster5667c492010-01-25 14:23:04 +0100114 d = qdict_get_double(qdict, "value");
115 d = MAX(0, MIN(UINT32_MAX, d));
116 max_throttle = d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400117
Jan Kiszka5d39c792009-11-30 18:21:19 +0100118 s = migrate_to_fms(current_migration);
119 if (s && s->file) {
Glauber Costadaa91de2009-05-20 18:26:58 -0400120 qemu_file_set_rate_limit(s->file, max_throttle);
121 }
aliguori5bb79102008-10-13 03:12:02 +0000122}
123
/*
 * Number of nanoseconds we are willing to let the guest be down for
 * migration.  Nanoseconds are used because that is the maximum resolution
 * get_clock() can achieve.  This is an internal unit only: every
 * user-visible value must be expressed in seconds.
 *
 * The initial value is 30000000 ns, i.e. 30 ms.
 */
static uint64_t max_downtime = 30000000;
129
130uint64_t migrate_max_downtime(void)
131{
132 return max_downtime;
133}
134
Markus Armbrusterc6027f52010-01-25 14:23:08 +0100135void do_migrate_set_downtime(Monitor *mon, const QDict *qdict,
136 QObject **ret_data)
Glauber Costa2ea42952009-05-28 15:22:58 -0400137{
Glauber Costa2ea42952009-05-28 15:22:58 -0400138 double d;
139
Markus Armbrusterb0fbf7d2010-01-25 14:23:07 +0100140 d = qdict_get_double(qdict, "value") * 1e9;
141 d = MAX(0, MIN(UINT64_MAX, d));
Glauber Costa2ea42952009-05-28 15:22:58 -0400142 max_downtime = (uint64_t)d;
143}
144
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200145static void migrate_print_status(Monitor *mon, const char *name,
146 const QDict *status_dict)
aliguori5bb79102008-10-13 03:12:02 +0000147{
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200148 QDict *qdict;
149
150 qdict = qobject_to_qdict(qdict_get(status_dict, name));
151
152 monitor_printf(mon, "transferred %s: %" PRIu64 " kbytes\n", name,
153 qdict_get_int(qdict, "transferred") >> 10);
154 monitor_printf(mon, "remaining %s: %" PRIu64 " kbytes\n", name,
155 qdict_get_int(qdict, "remaining") >> 10);
156 monitor_printf(mon, "total %s: %" PRIu64 " kbytes\n", name,
157 qdict_get_int(qdict, "total") >> 10);
158}
159
160void do_info_migrate_print(Monitor *mon, const QObject *data)
161{
162 QDict *qdict;
163
164 qdict = qobject_to_qdict(data);
165
166 monitor_printf(mon, "Migration status: %s\n",
167 qdict_get_str(qdict, "status"));
168
169 if (qdict_haskey(qdict, "ram")) {
170 migrate_print_status(mon, "ram", qdict);
171 }
172
173 if (qdict_haskey(qdict, "disk")) {
174 migrate_print_status(mon, "disk", qdict);
175 }
176}
177
178static void migrate_put_status(QDict *qdict, const char *name,
179 uint64_t trans, uint64_t rem, uint64_t total)
180{
181 QObject *obj;
182
183 obj = qobject_from_jsonf("{ 'transferred': %" PRId64 ", "
184 "'remaining': %" PRId64 ", "
185 "'total': %" PRId64 " }", trans, rem, total);
186 assert(obj != NULL);
187
188 qdict_put_obj(qdict, name, obj);
189}
190
191/**
192 * do_info_migrate(): Migration status
193 *
194 * Return a QDict. If migration is active there will be another
195 * QDict with RAM migration status and if block migration is active
196 * another one with block migration status.
197 *
198 * The main QDict contains the following:
199 *
200 * - "status": migration status
201 * - "ram": only present if "status" is "active", it is a QDict with the
202 * following RAM information (in bytes):
203 * - "transferred": amount transferred
204 * - "remaining": amount remaining
205 * - "total": total
206 * - "disk": only present if "status" is "active" and it is a block migration,
207 * it is a QDict with the following disk information (in bytes):
208 * - "transferred": amount transferred
209 * - "remaining": amount remaining
210 * - "total": total
211 *
212 * Examples:
213 *
214 * 1. Migration is "completed":
215 *
216 * { "status": "completed" }
217 *
218 * 2. Migration is "active" and it is not a block migration:
219 *
220 * { "status": "active",
221 * "ram": { "transferred": 123, "remaining": 123, "total": 246 } }
222 *
223 * 3. Migration is "active" and it is a block migration:
224 *
225 * { "status": "active",
226 * "ram": { "total": 1057024, "remaining": 1053304, "transferred": 3720 },
227 * "disk": { "total": 20971520, "remaining": 20880384, "transferred": 91136 }}
228 */
229void do_info_migrate(Monitor *mon, QObject **ret_data)
230{
231 QDict *qdict;
aliguori5bb79102008-10-13 03:12:02 +0000232 MigrationState *s = current_migration;
aliguori376253e2009-03-05 23:01:23 +0000233
aliguori5bb79102008-10-13 03:12:02 +0000234 if (s) {
aliguoriff8d81d2008-10-24 22:10:31 +0000235 switch (s->get_status(s)) {
236 case MIG_STATE_ACTIVE:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200237 qdict = qdict_new();
238 qdict_put(qdict, "status", qstring_from_str("active"));
239
240 migrate_put_status(qdict, "ram", ram_bytes_transferred(),
241 ram_bytes_remaining(), ram_bytes_total());
242
Jan Kiszka25f23642009-11-30 18:21:21 +0100243 if (blk_mig_active()) {
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200244 migrate_put_status(qdict, "disk", blk_mig_bytes_transferred(),
245 blk_mig_bytes_remaining(),
246 blk_mig_bytes_total());
Jan Kiszka25f23642009-11-30 18:21:21 +0100247 }
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200248
249 *ret_data = QOBJECT(qdict);
aliguoriff8d81d2008-10-24 22:10:31 +0000250 break;
251 case MIG_STATE_COMPLETED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200252 *ret_data = qobject_from_jsonf("{ 'status': 'completed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000253 break;
254 case MIG_STATE_ERROR:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200255 *ret_data = qobject_from_jsonf("{ 'status': 'failed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000256 break;
257 case MIG_STATE_CANCELLED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200258 *ret_data = qobject_from_jsonf("{ 'status': 'cancelled' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000259 break;
260 }
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200261 assert(*ret_data != NULL);
aliguori5bb79102008-10-13 03:12:02 +0000262 }
263}
264
aliguori065e2812008-11-11 16:46:33 +0000265/* shared migration helpers */
266
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100267void migrate_fd_monitor_suspend(FdMigrationState *s, Monitor *mon)
aliguori731b0362009-03-05 23:01:42 +0000268{
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100269 s->mon = mon;
270 if (monitor_suspend(mon) == 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300271 DPRINTF("suspending monitor\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100272 } else {
273 monitor_printf(mon, "terminal does not allow synchronous "
aliguoricde76ee2009-03-05 23:01:51 +0000274 "migration, continuing detached\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100275 }
aliguori731b0362009-03-05 23:01:42 +0000276}
277
aliguori065e2812008-11-11 16:46:33 +0000278void migrate_fd_error(FdMigrationState *s)
279{
malcd0f2c4c2010-02-07 02:03:50 +0300280 DPRINTF("setting error state\n");
aliguori065e2812008-11-11 16:46:33 +0000281 s->state = MIG_STATE_ERROR;
282 migrate_fd_cleanup(s);
283}
284
285void migrate_fd_cleanup(FdMigrationState *s)
286{
287 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
288
289 if (s->file) {
malcd0f2c4c2010-02-07 02:03:50 +0300290 DPRINTF("closing file\n");
aliguori065e2812008-11-11 16:46:33 +0000291 qemu_fclose(s->file);
Jan Kiszka5d39c792009-11-30 18:21:19 +0100292 s->file = NULL;
aliguori065e2812008-11-11 16:46:33 +0000293 }
294
295 if (s->fd != -1)
296 close(s->fd);
297
298 /* Don't resume monitor until we've flushed all of the buffers */
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100299 if (s->mon) {
300 monitor_resume(s->mon);
301 }
aliguori065e2812008-11-11 16:46:33 +0000302
303 s->fd = -1;
304}
305
306void migrate_fd_put_notify(void *opaque)
307{
308 FdMigrationState *s = opaque;
309
310 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
311 qemu_file_put_notify(s->file);
312}
313
314ssize_t migrate_fd_put_buffer(void *opaque, const void *data, size_t size)
315{
316 FdMigrationState *s = opaque;
317 ssize_t ret;
318
319 do {
320 ret = s->write(s, data, size);
Uri Lublin95b134e2009-05-19 14:08:53 +0300321 } while (ret == -1 && ((s->get_error(s)) == EINTR));
aliguori065e2812008-11-11 16:46:33 +0000322
323 if (ret == -1)
324 ret = -(s->get_error(s));
325
326 if (ret == -EAGAIN)
327 qemu_set_fd_handler2(s->fd, NULL, NULL, migrate_fd_put_notify, s);
328
329 return ret;
330}
331
332void migrate_fd_connect(FdMigrationState *s)
333{
334 int ret;
335
336 s->file = qemu_fopen_ops_buffered(s,
337 s->bandwidth_limit,
338 migrate_fd_put_buffer,
339 migrate_fd_put_ready,
340 migrate_fd_wait_for_unfreeze,
341 migrate_fd_close);
342
malcd0f2c4c2010-02-07 02:03:50 +0300343 DPRINTF("beginning savevm\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100344 ret = qemu_savevm_state_begin(s->mon, s->file, s->mig_state.blk,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200345 s->mig_state.shared);
aliguori065e2812008-11-11 16:46:33 +0000346 if (ret < 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300347 DPRINTF("failed, %d\n", ret);
aliguori065e2812008-11-11 16:46:33 +0000348 migrate_fd_error(s);
349 return;
350 }
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200351
aliguori065e2812008-11-11 16:46:33 +0000352 migrate_fd_put_ready(s);
353}
354
355void migrate_fd_put_ready(void *opaque)
356{
357 FdMigrationState *s = opaque;
358
359 if (s->state != MIG_STATE_ACTIVE) {
malcd0f2c4c2010-02-07 02:03:50 +0300360 DPRINTF("put_ready returning because of non-active state\n");
aliguori065e2812008-11-11 16:46:33 +0000361 return;
362 }
363
malcd0f2c4c2010-02-07 02:03:50 +0300364 DPRINTF("iterate\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100365 if (qemu_savevm_state_iterate(s->mon, s->file) == 1) {
aliguorib161d122009-04-05 19:30:33 +0000366 int state;
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500367 int old_vm_running = vm_running;
368
malcd0f2c4c2010-02-07 02:03:50 +0300369 DPRINTF("done iterating\n");
aliguori065e2812008-11-11 16:46:33 +0000370 vm_stop(0);
371
Glauber Costa08846572009-07-06 09:32:09 -0400372 qemu_aio_flush();
aliguori065e2812008-11-11 16:46:33 +0000373 bdrv_flush_all();
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100374 if ((qemu_savevm_state_complete(s->mon, s->file)) < 0) {
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500375 if (old_vm_running) {
376 vm_start();
377 }
aliguorib161d122009-04-05 19:30:33 +0000378 state = MIG_STATE_ERROR;
379 } else {
380 state = MIG_STATE_COMPLETED;
381 }
aliguori065e2812008-11-11 16:46:33 +0000382 migrate_fd_cleanup(s);
aliguorib161d122009-04-05 19:30:33 +0000383 s->state = state;
aliguori065e2812008-11-11 16:46:33 +0000384 }
385}
386
387int migrate_fd_get_status(MigrationState *mig_state)
388{
389 FdMigrationState *s = migrate_to_fms(mig_state);
390 return s->state;
391}
392
393void migrate_fd_cancel(MigrationState *mig_state)
394{
395 FdMigrationState *s = migrate_to_fms(mig_state);
396
397 if (s->state != MIG_STATE_ACTIVE)
398 return;
399
malcd0f2c4c2010-02-07 02:03:50 +0300400 DPRINTF("cancelling migration\n");
aliguori065e2812008-11-11 16:46:33 +0000401
402 s->state = MIG_STATE_CANCELLED;
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100403 qemu_savevm_state_cancel(s->mon, s->file);
aliguori065e2812008-11-11 16:46:33 +0000404
405 migrate_fd_cleanup(s);
406}
407
408void migrate_fd_release(MigrationState *mig_state)
409{
410 FdMigrationState *s = migrate_to_fms(mig_state);
411
malcd0f2c4c2010-02-07 02:03:50 +0300412 DPRINTF("releasing state\n");
aliguori065e2812008-11-11 16:46:33 +0000413
414 if (s->state == MIG_STATE_ACTIVE) {
415 s->state = MIG_STATE_CANCELLED;
416 migrate_fd_cleanup(s);
417 }
418 free(s);
419}
420
421void migrate_fd_wait_for_unfreeze(void *opaque)
422{
423 FdMigrationState *s = opaque;
424 int ret;
425
malcd0f2c4c2010-02-07 02:03:50 +0300426 DPRINTF("wait for unfreeze\n");
aliguori065e2812008-11-11 16:46:33 +0000427 if (s->state != MIG_STATE_ACTIVE)
428 return;
429
430 do {
431 fd_set wfds;
432
433 FD_ZERO(&wfds);
434 FD_SET(s->fd, &wfds);
435
436 ret = select(s->fd + 1, NULL, &wfds, NULL, NULL);
437 } while (ret == -1 && (s->get_error(s)) == EINTR);
438}
439
440int migrate_fd_close(void *opaque)
441{
442 FdMigrationState *s = opaque;
Uri Lubline19252d2009-06-08 14:28:01 +0300443
444 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
aliguori065e2812008-11-11 16:46:33 +0000445 return s->close(s);
446}