blob: 4ab637a1fe4556663b653e7fce854c329846104f [file] [log] [blame]
aliguori5bb79102008-10-13 03:12:02 +00001/*
2 * QEMU live migration
3 *
4 * Copyright IBM, Corp. 2008
5 *
6 * Authors:
7 * Anthony Liguori <aliguori@us.ibm.com>
8 *
9 * This work is licensed under the terms of the GNU GPL, version 2. See
10 * the COPYING file in the top-level directory.
11 *
Paolo Bonzini6b620ca2012-01-13 17:44:23 +010012 * Contributions after 2012-01-13 are licensed under the terms of the
13 * GNU GPL, version 2 or (at your option) any later version.
aliguori5bb79102008-10-13 03:12:02 +000014 */
15
Peter Maydell1393a482016-01-26 18:16:54 +000016#include "qemu/osdep.h"
Veronia Bahaaf348b6d2016-03-20 19:16:19 +020017#include "qemu/cutils.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010018#include "qemu/error-report.h"
Juan Quintela795c40b2017-04-06 12:00:28 +020019#include "migration/blocker.h"
Juan Quintelaf4dbe1b2017-04-05 15:54:10 +020020#include "exec.h"
Juan Quintela7fcac4a2017-04-05 15:58:29 +020021#include "fd.h"
Juan Quintela61e8b142017-04-05 17:40:11 +020022#include "socket.h"
Juan Quintelae1a3ece2017-04-17 20:32:36 +020023#include "rdma.h"
Juan Quintela7b1e1a22017-04-17 20:26:27 +020024#include "ram.h"
Juan Quintela84a899d2017-04-24 18:53:30 +020025#include "migration/global_state.h"
Juan Quintelac4b63b72017-04-24 19:02:44 +020026#include "migration/misc.h"
Juan Quintela6666c962017-04-24 20:07:27 +020027#include "migration.h"
Juan Quintela20a519a2017-04-20 14:48:46 +020028#include "savevm.h"
Juan Quintela40014d82017-04-17 19:34:36 +020029#include "qemu-file-channel.h"
Juan Quintela08a0aee2017-04-20 18:52:18 +020030#include "qemu-file.h"
Juan Quintela987772d2017-04-17 19:02:59 +020031#include "migration/vmstate.h"
Paolo Bonzini737e1502012-12-17 18:19:44 +010032#include "block/block.h"
Markus Armbrustere688df62018-02-01 12:18:31 +010033#include "qapi/error.h"
Markus Armbruster9af23982018-02-11 10:36:01 +010034#include "qapi/qapi-commands-migration.h"
35#include "qapi/qapi-events-migration.h"
Markus Armbrustercc7a8ea2015-03-17 17:22:46 +010036#include "qapi/qmp/qerror.h"
Markus Armbruster15280c32018-02-01 12:18:36 +010037#include "qapi/qmp/qnull.h"
Paolo Bonziniab28bd22015-07-09 08:55:38 +020038#include "qemu/rcu.h"
Juan Quintela2c9e6fe2017-04-21 14:31:22 +020039#include "block.h"
Juan Quintelabe07b0a2017-04-20 13:12:24 +020040#include "postcopy-ram.h"
Juan Quintela766bd172012-07-23 05:45:29 +020041#include "qemu/thread.h"
Kazuya Saitoc09e5bb2013-02-22 17:36:19 +010042#include "trace.h"
Juan Quintela51180422017-04-24 20:50:19 +020043#include "exec/target_page.h"
Daniel P. Berrange61b67d42016-04-27 11:05:01 +010044#include "io/channel-buffer.h"
zhanghailiang35a6ed42016-10-27 14:42:52 +080045#include "migration/colo.h"
Peter Xu4ffdb332017-06-27 12:10:18 +080046#include "hw/boards.h"
Peter Xu9d18af92017-06-27 12:10:19 +080047#include "monitor/monitor.h"
aliguori065e2812008-11-11 16:46:33 +000048
/* Migration transfer speed throttling */
#define MAX_THROTTLE  (32 << 20)

/*
 * Amount of time to allocate to each "chunk" of bandwidth-throttled
 * data.
 */
#define BUFFER_DELAY     100
#define XFER_LIMIT_RATIO (1000 / BUFFER_DELAY)

/*
 * Time in milliseconds we are allowed to stop the source
 * for sending the last part.
 */
#define DEFAULT_MIGRATE_SET_DOWNTIME 300

/* Maximum migrate downtime is 2000 seconds; the second macro is in ms */
#define MAX_MIGRATE_DOWNTIME_SECONDS 2000
#define MAX_MIGRATE_DOWNTIME (MAX_MIGRATE_DOWNTIME_SECONDS * 1000)

/* Default compression thread count */
#define DEFAULT_MIGRATE_COMPRESS_THREAD_COUNT 8
/*
 * Default decompression thread count; decompression is usually at
 * least 4 times as fast as compression.
 */
#define DEFAULT_MIGRATE_DECOMPRESS_THREAD_COUNT 2
/* 0 means no compression, 1 means best speed, ... 9 means best ratio */
#define DEFAULT_MIGRATE_COMPRESS_LEVEL 1
/* Default auto-converge CPU throttle migration parameters */
#define DEFAULT_MIGRATE_CPU_THROTTLE_INITIAL 20
#define DEFAULT_MIGRATE_CPU_THROTTLE_INCREMENT 10

/* Migration XBZRLE default cache size */
#define DEFAULT_MIGRATE_XBZRLE_CACHE_SIZE (64 * 1024 * 1024)

/*
 * The delay time (in ms) between two COLO checkpoints.
 * Note: Please change this default value to 10000 when we support
 * hybrid mode.
 */
#define DEFAULT_MIGRATE_X_CHECKPOINT_DELAY 200
#define DEFAULT_MIGRATE_MULTIFD_CHANNELS 2
#define DEFAULT_MIGRATE_MULTIFD_PAGE_COUNT 16
zhanghailiang68b53592016-10-27 14:43:01 +080084
Gerd Hoffmann99a0db92010-12-13 17:30:12 +010085static NotifierList migration_state_notifiers =
86 NOTIFIER_LIST_INITIALIZER(migration_state_notifiers);
87
Dr. David Alan Gilbertadde2202015-02-19 11:40:27 +000088static bool deferred_incoming;
89
/*
 * Messages sent on the return path from destination to source.
 * The numeric value of each type is what goes on the wire, so the
 * values are spelled out explicitly.
 */
enum mig_rp_message_type {
    MIG_RP_MSG_INVALID      = 0, /* Must be 0 */
    MIG_RP_MSG_SHUT         = 1, /* sibling will not send any more RP messages */
    MIG_RP_MSG_PONG         = 2, /* Response to a PING; data (seq: be32) */

    MIG_RP_MSG_REQ_PAGES_ID = 3, /* data (start: be64, len: be32, id: string) */
    MIG_RP_MSG_REQ_PAGES    = 4, /* data (start: be64, len: be32) */

    MIG_RP_MSG_MAX          = 5
};
101
Juan Quintela17549e82011-10-05 13:50:43 +0200102/* When we add fault tolerance, we could have several
103 migrations at once. For now we don't need to add
104 dynamic creation of migration */
105
Peter Xue5cb7e72017-06-27 12:10:13 +0800106static MigrationState *current_migration;
107
Peter Xu8b0b29d2017-07-18 11:39:06 +0800108static bool migration_object_check(MigrationState *ms, Error **errp);
Dr. David Alan Gilbert0331c8c2017-10-20 10:05:56 +0100109static int migration_maybe_pause(MigrationState *s,
110 int *current_active_state,
111 int new_state);
Peter Xu8b0b29d2017-07-18 11:39:06 +0800112
Peter Xue5cb7e72017-06-27 12:10:13 +0800113void migration_object_init(void)
114{
Peter Xu4ffdb332017-06-27 12:10:18 +0800115 MachineState *ms = MACHINE(qdev_get_machine());
Peter Xu8b0b29d2017-07-18 11:39:06 +0800116 Error *err = NULL;
Peter Xu4ffdb332017-06-27 12:10:18 +0800117
Peter Xue5cb7e72017-06-27 12:10:13 +0800118 /* This can only be called once. */
119 assert(!current_migration);
120 current_migration = MIGRATION_OBJ(object_new(TYPE_MIGRATION));
Peter Xu4ffdb332017-06-27 12:10:18 +0800121
Peter Xu8b0b29d2017-07-18 11:39:06 +0800122 if (!migration_object_check(current_migration, &err)) {
123 error_report_err(err);
124 exit(1);
125 }
126
Peter Xu4ffdb332017-06-27 12:10:18 +0800127 /*
128 * We cannot really do this in migration_instance_init() since at
129 * that time global properties are not yet applied, then this
130 * value will be definitely replaced by something else.
131 */
132 if (ms->enforce_config_section) {
133 current_migration->send_configuration = true;
134 }
Peter Xue5cb7e72017-06-27 12:10:13 +0800135}
136
Vladimir Sementsov-Ogievskiy1f895602017-12-28 12:16:16 +0300137void migration_object_finalize(void)
138{
139 object_unref(OBJECT(current_migration));
140}
141
Dr. David Alan Gilbertbca78562015-05-21 13:24:14 +0100142/* For outgoing */
Juan Quintela859bc752012-08-13 09:42:49 +0200143MigrationState *migrate_get_current(void)
Juan Quintela17549e82011-10-05 13:50:43 +0200144{
Peter Xue5cb7e72017-06-27 12:10:13 +0800145 /* This can only be called after the object created. */
146 assert(current_migration);
147 return current_migration;
Juan Quintela17549e82011-10-05 13:50:43 +0200148}
149
Dr. David Alan Gilbertbca78562015-05-21 13:24:14 +0100150MigrationIncomingState *migration_incoming_get_current(void)
151{
Juan Quintelab4b076d2017-01-23 22:32:06 +0100152 static bool once;
153 static MigrationIncomingState mis_current;
Dr. David Alan Gilbertbca78562015-05-21 13:24:14 +0100154
Juan Quintelab4b076d2017-01-23 22:32:06 +0100155 if (!once) {
156 mis_current.state = MIGRATION_STATUS_NONE;
157 memset(&mis_current, 0, sizeof(MigrationIncomingState));
Dr. David Alan Gilbert00fa4fc2018-03-12 17:21:04 +0000158 mis_current.postcopy_remote_fds = g_array_new(FALSE, TRUE,
159 sizeof(struct PostCopyFD));
Juan Quintelab4b076d2017-01-23 22:32:06 +0100160 qemu_mutex_init(&mis_current.rp_mutex);
161 qemu_event_init(&mis_current.main_thread_load_event, false);
Peter Xub411b842018-05-02 18:47:20 +0800162 qemu_sem_init(&mis_current.postcopy_pause_sem_dst, 0);
Peter Xu3a7804c2018-05-02 18:47:22 +0800163 qemu_sem_init(&mis_current.postcopy_pause_sem_fault, 0);
Vladimir Sementsov-Ogievskiyb35ebdf2018-03-13 15:34:01 -0400164
165 init_dirty_bitmap_incoming_migration();
166
Juan Quintelab4b076d2017-01-23 22:32:06 +0100167 once = true;
168 }
169 return &mis_current;
Dr. David Alan Gilbertbca78562015-05-21 13:24:14 +0100170}
171
172void migration_incoming_state_destroy(void)
173{
Juan Quintelab4b076d2017-01-23 22:32:06 +0100174 struct MigrationIncomingState *mis = migration_incoming_get_current();
175
Peter Xu34826552017-05-19 14:43:29 +0800176 if (mis->to_src_file) {
Peter Xu660819b2017-05-19 14:43:30 +0800177 /* Tell source that we are done */
178 migrate_send_rp_shut(mis, qemu_file_get_error(mis->from_src_file) != 0);
Peter Xu34826552017-05-19 14:43:29 +0800179 qemu_fclose(mis->to_src_file);
180 mis->to_src_file = NULL;
181 }
182
Peter Xu660819b2017-05-19 14:43:30 +0800183 if (mis->from_src_file) {
184 qemu_fclose(mis->from_src_file);
185 mis->from_src_file = NULL;
186 }
Dr. David Alan Gilbert00fa4fc2018-03-12 17:21:04 +0000187 if (mis->postcopy_remote_fds) {
188 g_array_free(mis->postcopy_remote_fds, TRUE);
189 mis->postcopy_remote_fds = NULL;
190 }
Peter Xu660819b2017-05-19 14:43:30 +0800191
Dr. David Alan Gilbert5089e182017-08-25 15:19:39 +0100192 qemu_event_reset(&mis->main_thread_load_event);
Dr. David Alan Gilbertbca78562015-05-21 13:24:14 +0100193}
194
Juan Quintelab05dc722015-07-07 14:44:05 +0200195static void migrate_generate_event(int new_state)
196{
197 if (migrate_use_events()) {
198 qapi_event_send_migration(new_state, &error_abort);
Juan Quintelab05dc722015-07-07 14:44:05 +0200199 }
200}
201
Dr. David Alan Gilbertadde2202015-02-19 11:40:27 +0000202/*
203 * Called on -incoming with a defer: uri.
204 * The migration can be started later after any parameters have been
205 * changed.
206 */
207static void deferred_incoming_migration(Error **errp)
208{
209 if (deferred_incoming) {
210 error_setg(errp, "Incoming migration already deferred");
211 }
212 deferred_incoming = true;
213}
214
Juan Quintelada6f1792017-04-24 17:37:14 +0200215/*
216 * Send a message on the return channel back to the source
217 * of the migration.
218 */
Peter Xud6208e32018-02-08 18:31:12 +0800219static int migrate_send_rp_message(MigrationIncomingState *mis,
220 enum mig_rp_message_type message_type,
221 uint16_t len, void *data)
Juan Quintelada6f1792017-04-24 17:37:14 +0200222{
Peter Xud6208e32018-02-08 18:31:12 +0800223 int ret = 0;
224
Juan Quintelada6f1792017-04-24 17:37:14 +0200225 trace_migrate_send_rp_message((int)message_type, len);
226 qemu_mutex_lock(&mis->rp_mutex);
Peter Xud6208e32018-02-08 18:31:12 +0800227
228 /*
229 * It's possible that the file handle got lost due to network
230 * failures.
231 */
232 if (!mis->to_src_file) {
233 ret = -EIO;
234 goto error;
235 }
236
Juan Quintelada6f1792017-04-24 17:37:14 +0200237 qemu_put_be16(mis->to_src_file, (unsigned int)message_type);
238 qemu_put_be16(mis->to_src_file, len);
239 qemu_put_buffer(mis->to_src_file, data, len);
240 qemu_fflush(mis->to_src_file);
Peter Xud6208e32018-02-08 18:31:12 +0800241
242 /* It's possible that qemu file got error during sending */
243 ret = qemu_file_get_error(mis->to_src_file);
244
245error:
Juan Quintelada6f1792017-04-24 17:37:14 +0200246 qemu_mutex_unlock(&mis->rp_mutex);
Peter Xud6208e32018-02-08 18:31:12 +0800247 return ret;
Juan Quintelada6f1792017-04-24 17:37:14 +0200248}
249
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +0000250/* Request a range of pages from the source VM at the given
251 * start address.
252 * rbname: Name of the RAMBlock to request the page in, if NULL it's the same
253 * as the last request (a name must have been given previously)
254 * Start: Address offset within the RB
255 * Len: Length in bytes required - must be a multiple of pagesize
256 */
Peter Xud6208e32018-02-08 18:31:12 +0800257int migrate_send_rp_req_pages(MigrationIncomingState *mis, const char *rbname,
258 ram_addr_t start, size_t len)
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +0000259{
Stefan Weilcb8d4c82016-03-23 15:59:57 +0100260 uint8_t bufc[12 + 1 + 255]; /* start (8), len (4), rbname up to 256 */
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +0000261 size_t msglen = 12; /* start + len */
Peter Xud6208e32018-02-08 18:31:12 +0800262 enum mig_rp_message_type msg_type;
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +0000263
264 *(uint64_t *)bufc = cpu_to_be64((uint64_t)start);
265 *(uint32_t *)(bufc + 8) = cpu_to_be32((uint32_t)len);
266
267 if (rbname) {
268 int rbname_len = strlen(rbname);
269 assert(rbname_len < 256);
270
271 bufc[msglen++] = rbname_len;
272 memcpy(bufc + msglen, rbname, rbname_len);
273 msglen += rbname_len;
Peter Xud6208e32018-02-08 18:31:12 +0800274 msg_type = MIG_RP_MSG_REQ_PAGES_ID;
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +0000275 } else {
Peter Xud6208e32018-02-08 18:31:12 +0800276 msg_type = MIG_RP_MSG_REQ_PAGES;
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +0000277 }
Peter Xud6208e32018-02-08 18:31:12 +0800278
279 return migrate_send_rp_message(mis, msg_type, msglen, bufc);
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +0000280}
281
Paolo Bonzini43eaae22012-10-02 18:21:18 +0200282void qemu_start_incoming_migration(const char *uri, Error **errp)
aliguori5bb79102008-10-13 03:12:02 +0000283{
aliguori34c9dd82008-10-13 03:14:31 +0000284 const char *p;
285
Juan Quintela7cf1fe62015-05-20 17:15:42 +0200286 qapi_event_send_migration(MIGRATION_STATUS_SETUP, &error_abort);
Dr. David Alan Gilbertadde2202015-02-19 11:40:27 +0000287 if (!strcmp(uri, "defer")) {
288 deferred_incoming_migration(errp);
289 } else if (strstart(uri, "tcp:", &p)) {
Paolo Bonzini43eaae22012-10-02 18:21:18 +0200290 tcp_start_incoming_migration(p, errp);
Michael R. Hines2da776d2013-07-22 10:01:54 -0400291#ifdef CONFIG_RDMA
Dr. David Alan Gilbertadde2202015-02-19 11:40:27 +0000292 } else if (strstart(uri, "rdma:", &p)) {
Michael R. Hines2da776d2013-07-22 10:01:54 -0400293 rdma_start_incoming_migration(p, errp);
294#endif
Dr. David Alan Gilbertadde2202015-02-19 11:40:27 +0000295 } else if (strstart(uri, "exec:", &p)) {
Paolo Bonzini43eaae22012-10-02 18:21:18 +0200296 exec_start_incoming_migration(p, errp);
Dr. David Alan Gilbertadde2202015-02-19 11:40:27 +0000297 } else if (strstart(uri, "unix:", &p)) {
Paolo Bonzini43eaae22012-10-02 18:21:18 +0200298 unix_start_incoming_migration(p, errp);
Dr. David Alan Gilbertadde2202015-02-19 11:40:27 +0000299 } else if (strstart(uri, "fd:", &p)) {
Paolo Bonzini43eaae22012-10-02 18:21:18 +0200300 fd_start_incoming_migration(p, errp);
Dr. David Alan Gilbertadde2202015-02-19 11:40:27 +0000301 } else {
Markus Armbruster312fd5f2013-02-08 21:22:16 +0100302 error_setg(errp, "unknown migration protocol: %s", uri);
Juan Quintela8ca5e802010-06-09 14:10:54 +0200303 }
aliguori5bb79102008-10-13 03:12:02 +0000304}
305
Denis V. Lunev0aa6aef2016-02-24 11:53:38 +0300306static void process_incoming_migration_bh(void *opaque)
307{
308 Error *local_err = NULL;
309 MigrationIncomingState *mis = opaque;
310
Dr. David Alan Gilberta18a73d2018-04-10 15:28:42 +0100311 /* Make sure all file formats flush their mutable metadata.
312 * If we get an error here, just don't restart the VM yet. */
313 bdrv_invalidate_cache_all(&local_err);
314 if (local_err) {
315 error_report_err(local_err);
316 local_err = NULL;
317 autostart = false;
Kevin Wolfd35ff5e2017-04-04 17:29:03 +0200318 }
319
Denis V. Lunev0aa6aef2016-02-24 11:53:38 +0300320 /*
321 * This must happen after all error conditions are dealt with and
322 * we're sure the VM is going to be running on this host.
323 */
324 qemu_announce_self();
325
Juan Quintelaf986c3d2016-01-14 16:52:55 +0100326 if (multifd_load_cleanup(&local_err) != 0) {
327 error_report_err(local_err);
328 autostart = false;
329 }
Denis V. Lunev0aa6aef2016-02-24 11:53:38 +0300330 /* If global state section was not received or we are in running
331 state, we need to obey autostart. Any other state is set with
332 runstate_set. */
333
Vladimir Sementsov-Ogievskiyb35ebdf2018-03-13 15:34:01 -0400334 dirty_bitmap_mig_before_vm_start();
335
Denis V. Lunev0aa6aef2016-02-24 11:53:38 +0300336 if (!global_state_received() ||
337 global_state_get_runstate() == RUN_STATE_RUNNING) {
338 if (autostart) {
339 vm_start();
340 } else {
341 runstate_set(RUN_STATE_PAUSED);
342 }
343 } else {
344 runstate_set(global_state_get_runstate());
345 }
Denis V. Lunev0aa6aef2016-02-24 11:53:38 +0300346 /*
347 * This must happen after any state changes since as soon as an external
348 * observer sees this event they might start to prod at the VM assuming
349 * it's ready to use.
350 */
351 migrate_set_state(&mis->state, MIGRATION_STATUS_ACTIVE,
352 MIGRATION_STATUS_COMPLETED);
353 qemu_bh_delete(mis->bh);
354 migration_incoming_state_destroy();
355}
356
Paolo Bonzini82a4da72012-08-07 10:57:43 +0200357static void process_incoming_migration_co(void *opaque)
Juan Quintela511c0232010-06-09 14:10:55 +0200358{
Juan Quintelab4b076d2017-01-23 22:32:06 +0100359 MigrationIncomingState *mis = migration_incoming_get_current();
Dr. David Alan Gilberte9bef232015-11-05 18:11:21 +0000360 PostcopyState ps;
Paolo Bonzini1c12e1f2012-08-07 10:51:51 +0200361 int ret;
362
Juan Quintela4f0fae72017-07-24 12:42:02 +0200363 assert(mis->from_src_file);
Dr. David Alan Gilbert67f11b52017-02-24 18:28:34 +0000364 mis->largest_page_size = qemu_ram_pagesize_largest();
Dr. David Alan Gilbert093e3c42015-11-05 18:10:52 +0000365 postcopy_state_set(POSTCOPY_INCOMING_NONE);
zhanghailiang93d7af62015-12-16 11:47:34 +0000366 migrate_set_state(&mis->state, MIGRATION_STATUS_NONE,
367 MIGRATION_STATUS_ACTIVE);
Juan Quintela4f0fae72017-07-24 12:42:02 +0200368 ret = qemu_loadvm_state(mis->from_src_file);
Dr. David Alan Gilbertbca78562015-05-21 13:24:14 +0100369
Dr. David Alan Gilberte9bef232015-11-05 18:11:21 +0000370 ps = postcopy_state_get();
371 trace_process_incoming_migration_co_end(ret, ps);
372 if (ps != POSTCOPY_INCOMING_NONE) {
373 if (ps == POSTCOPY_INCOMING_ADVISE) {
374 /*
375 * Where a migration had postcopy enabled (and thus went to advise)
376 * but managed to complete within the precopy period, we can use
377 * the normal exit.
378 */
379 postcopy_ram_incoming_cleanup(mis);
380 } else if (ret >= 0) {
381 /*
382 * Postcopy was started, cleanup should happen at the end of the
383 * postcopy thread.
384 */
385 trace_process_incoming_migration_co_postcopy_end_main();
386 return;
387 }
388 /* Else if something went wrong then just fall out of the normal exit */
389 }
390
zhanghailiang25d0c162016-10-27 14:42:55 +0800391 /* we get COLO info, and know if we are in COLO mode */
392 if (!ret && migration_incoming_enable_colo()) {
393 mis->migration_incoming_co = qemu_coroutine_self();
394 qemu_thread_create(&mis->colo_incoming_thread, "COLO incoming",
395 colo_process_incoming_thread, mis, QEMU_THREAD_JOINABLE);
396 mis->have_colo_incoming_thread = true;
397 qemu_coroutine_yield();
398
399 /* Wait checkpoint incoming thread exit before free resource */
400 qemu_thread_join(&mis->colo_incoming_thread);
401 }
402
Paolo Bonzini1c12e1f2012-08-07 10:51:51 +0200403 if (ret < 0) {
Juan Quintelaf986c3d2016-01-14 16:52:55 +0100404 Error *local_err = NULL;
405
zhanghailiang93d7af62015-12-16 11:47:34 +0000406 migrate_set_state(&mis->state, MIGRATION_STATUS_ACTIVE,
407 MIGRATION_STATUS_FAILED);
Peter Lievendb80fac2014-06-10 11:29:16 +0200408 error_report("load of migration failed: %s", strerror(-ret));
Dr. David Alan Gilbert3a0f2ce2017-07-17 12:09:32 +0100409 qemu_fclose(mis->from_src_file);
Juan Quintelaf986c3d2016-01-14 16:52:55 +0100410 if (multifd_load_cleanup(&local_err) != 0) {
411 error_report_err(local_err);
412 }
Eric Blake4aead692013-04-16 15:50:41 -0600413 exit(EXIT_FAILURE);
Juan Quintela511c0232010-06-09 14:10:55 +0200414 }
Denis V. Lunev0aa6aef2016-02-24 11:53:38 +0300415 mis->bh = qemu_bh_new(process_incoming_migration_bh, mis);
416 qemu_bh_schedule(mis->bh);
Juan Quintela511c0232010-06-09 14:10:55 +0200417}
418
Juan Quintelae595a012017-07-17 12:30:25 +0200419static void migration_incoming_setup(QEMUFile *f)
Paolo Bonzini82a4da72012-08-07 10:57:43 +0200420{
Juan Quintela4f0fae72017-07-24 12:42:02 +0200421 MigrationIncomingState *mis = migration_incoming_get_current();
Paolo Bonzini82a4da72012-08-07 10:57:43 +0200422
Juan Quintelaf986c3d2016-01-14 16:52:55 +0100423 if (multifd_load_setup() != 0) {
424 /* We haven't been able to create multifd threads
425 nothing better to do */
426 exit(EXIT_FAILURE);
427 }
428
Juan Quintela4f0fae72017-07-24 12:42:02 +0200429 if (!mis->from_src_file) {
430 mis->from_src_file = f;
431 }
Daniel P. Berrange06ad5132016-04-27 11:04:56 +0100432 qemu_file_set_blocking(f, false);
Juan Quintelae595a012017-07-17 12:30:25 +0200433}
434
Juan Quintela36c2f8b2018-03-07 08:40:52 +0100435void migration_incoming_process(void)
Juan Quintelae595a012017-07-17 12:30:25 +0200436{
437 Coroutine *co = qemu_coroutine_create(process_incoming_migration_co, NULL);
Paolo Bonzini0b8b8752016-07-04 19:10:01 +0200438 qemu_coroutine_enter(co);
Paolo Bonzini82a4da72012-08-07 10:57:43 +0200439}
440
Juan Quintelae595a012017-07-17 12:30:25 +0200441void migration_fd_process_incoming(QEMUFile *f)
442{
443 migration_incoming_setup(f);
444 migration_incoming_process();
445}
446
Juan Quintela4f0fae72017-07-24 12:42:02 +0200447void migration_ioc_process_incoming(QIOChannel *ioc)
448{
449 MigrationIncomingState *mis = migration_incoming_get_current();
450
451 if (!mis->from_src_file) {
452 QEMUFile *f = qemu_fopen_channel_input(ioc);
Juan Quintela36c2f8b2018-03-07 08:40:52 +0100453 migration_incoming_setup(f);
Juan Quintela71bb07d2018-02-19 19:01:03 +0100454 return;
Juan Quintela4f0fae72017-07-24 12:42:02 +0200455 }
Juan Quintela71bb07d2018-02-19 19:01:03 +0100456 multifd_recv_new_channel(ioc);
Juan Quintela4f0fae72017-07-24 12:42:02 +0200457}
458
/**
 * @migration_has_all_channels: We have received all channels that we need
 *
 * Returns true when we have got connections to all the channels that
 * we need for migration, as reported by
 * multifd_recv_all_channels_created().
 */
bool migration_has_all_channels(void)
{
    return multifd_recv_all_channels_created();
}
473
Dr. David Alan Gilbert6decec92015-11-05 18:10:47 +0000474/*
Dr. David Alan Gilbert6decec92015-11-05 18:10:47 +0000475 * Send a 'SHUT' message on the return channel with the given value
476 * to indicate that we've finished with the RP. Non-0 value indicates
477 * error.
478 */
479void migrate_send_rp_shut(MigrationIncomingState *mis,
480 uint32_t value)
481{
482 uint32_t buf;
483
484 buf = cpu_to_be32(value);
485 migrate_send_rp_message(mis, MIG_RP_MSG_SHUT, sizeof(buf), &buf);
486}
487
488/*
489 * Send a 'PONG' message on the return channel with the given value
490 * (normally in response to a 'PING')
491 */
492void migrate_send_rp_pong(MigrationIncomingState *mis,
493 uint32_t value)
494{
495 uint32_t buf;
496
497 buf = cpu_to_be32(value);
498 migrate_send_rp_message(mis, MIG_RP_MSG_PONG, sizeof(buf), &buf);
499}
500
Orit Wassermanbbf6da32012-08-06 21:42:47 +0300501MigrationCapabilityStatusList *qmp_query_migrate_capabilities(Error **errp)
502{
503 MigrationCapabilityStatusList *head = NULL;
504 MigrationCapabilityStatusList *caps;
505 MigrationState *s = migrate_get_current();
506 int i;
507
Michael Tokarev387eede2013-10-05 13:18:28 +0400508 caps = NULL; /* silence compiler warning */
Eric Blake7fb1cf12015-11-18 01:52:57 -0700509 for (i = 0; i < MIGRATION_CAPABILITY__MAX; i++) {
Dr. David Alan Gilberted1701c2017-05-15 15:05:29 +0100510#ifndef CONFIG_LIVE_BLOCK_MIGRATION
511 if (i == MIGRATION_CAPABILITY_BLOCK) {
512 continue;
513 }
514#endif
Orit Wassermanbbf6da32012-08-06 21:42:47 +0300515 if (head == NULL) {
516 head = g_malloc0(sizeof(*caps));
517 caps = head;
518 } else {
519 caps->next = g_malloc0(sizeof(*caps));
520 caps = caps->next;
521 }
522 caps->value =
523 g_malloc(sizeof(*caps->value));
524 caps->value->capability = i;
525 caps->value->state = s->enabled_capabilities[i];
526 }
527
528 return head;
529}
530
Liang Li85de8322015-03-23 16:32:28 +0800531MigrationParameters *qmp_query_migrate_parameters(Error **errp)
532{
533 MigrationParameters *params;
534 MigrationState *s = migrate_get_current();
535
Markus Armbrustere87fae42017-07-18 12:57:38 +0200536 /* TODO use QAPI_CLONE() instead of duplicating it inline */
Liang Li85de8322015-03-23 16:32:28 +0800537 params = g_malloc0(sizeof(*params));
Eric Blakede63ab62016-09-08 22:14:15 -0500538 params->has_compress_level = true;
Daniel P. Berrange2594f562016-04-27 11:05:14 +0100539 params->compress_level = s->parameters.compress_level;
Eric Blakede63ab62016-09-08 22:14:15 -0500540 params->has_compress_threads = true;
Daniel P. Berrange2594f562016-04-27 11:05:14 +0100541 params->compress_threads = s->parameters.compress_threads;
Eric Blakede63ab62016-09-08 22:14:15 -0500542 params->has_decompress_threads = true;
Daniel P. Berrange2594f562016-04-27 11:05:14 +0100543 params->decompress_threads = s->parameters.decompress_threads;
Eric Blakede63ab62016-09-08 22:14:15 -0500544 params->has_cpu_throttle_initial = true;
Daniel P. Berrange2594f562016-04-27 11:05:14 +0100545 params->cpu_throttle_initial = s->parameters.cpu_throttle_initial;
Eric Blakede63ab62016-09-08 22:14:15 -0500546 params->has_cpu_throttle_increment = true;
Daniel P. Berrange2594f562016-04-27 11:05:14 +0100547 params->cpu_throttle_increment = s->parameters.cpu_throttle_increment;
Markus Armbruster8cc99dc2017-07-18 12:04:54 +0200548 params->has_tls_creds = true;
Daniel P. Berrange69ef1f32016-04-27 11:05:15 +0100549 params->tls_creds = g_strdup(s->parameters.tls_creds);
Markus Armbruster8cc99dc2017-07-18 12:04:54 +0200550 params->has_tls_hostname = true;
Daniel P. Berrange69ef1f32016-04-27 11:05:15 +0100551 params->tls_hostname = g_strdup(s->parameters.tls_hostname);
Ashijeet Acharya2ff30252016-09-15 21:50:28 +0530552 params->has_max_bandwidth = true;
553 params->max_bandwidth = s->parameters.max_bandwidth;
554 params->has_downtime_limit = true;
555 params->downtime_limit = s->parameters.downtime_limit;
zhanghailiangfe39a4d2016-11-02 15:42:09 +0800556 params->has_x_checkpoint_delay = true;
zhanghailiang68b53592016-10-27 14:43:01 +0800557 params->x_checkpoint_delay = s->parameters.x_checkpoint_delay;
Juan Quintela2833c592017-04-05 18:32:37 +0200558 params->has_block_incremental = true;
559 params->block_incremental = s->parameters.block_incremental;
Juan Quintela4075fb12016-01-15 08:56:17 +0100560 params->has_x_multifd_channels = true;
561 params->x_multifd_channels = s->parameters.x_multifd_channels;
Juan Quintela0fb86602017-04-27 10:48:25 +0200562 params->has_x_multifd_page_count = true;
563 params->x_multifd_page_count = s->parameters.x_multifd_page_count;
Juan Quintela73af8dd2017-10-05 21:30:10 +0200564 params->has_xbzrle_cache_size = true;
565 params->xbzrle_cache_size = s->parameters.xbzrle_cache_size;
Liang Li85de8322015-03-23 16:32:28 +0800566
567 return params;
568}
569
Dr. David Alan Gilbertf6844b92015-11-05 18:10:48 +0000570/*
571 * Return true if we're already in the middle of a migration
572 * (i.e. any of the active or setup states)
573 */
574static bool migration_is_setup_or_active(int state)
575{
576 switch (state) {
577 case MIGRATION_STATUS_ACTIVE:
Dr. David Alan Gilbert9ec055a2015-11-05 18:10:58 +0000578 case MIGRATION_STATUS_POSTCOPY_ACTIVE:
Peter Xua688d2c2018-05-02 18:47:18 +0800579 case MIGRATION_STATUS_POSTCOPY_PAUSED:
Peter Xu135b87b2018-05-02 18:47:25 +0800580 case MIGRATION_STATUS_POSTCOPY_RECOVER:
Dr. David Alan Gilbertf6844b92015-11-05 18:10:48 +0000581 case MIGRATION_STATUS_SETUP:
Dr. David Alan Gilbert31e06072017-10-20 10:05:51 +0100582 case MIGRATION_STATUS_PRE_SWITCHOVER:
583 case MIGRATION_STATUS_DEVICE:
Dr. David Alan Gilbertf6844b92015-11-05 18:10:48 +0000584 return true;
585
586 default:
587 return false;
588
589 }
590}
591
Dr. David Alan Gilberta22463a2016-06-13 12:16:41 +0100592static void populate_ram_info(MigrationInfo *info, MigrationState *s)
593{
594 info->has_ram = true;
595 info->ram = g_malloc0(sizeof(*info->ram));
Juan Quintela93604472017-06-06 19:49:03 +0200596 info->ram->transferred = ram_counters.transferred;
Dr. David Alan Gilberta22463a2016-06-13 12:16:41 +0100597 info->ram->total = ram_bytes_total();
Juan Quintela93604472017-06-06 19:49:03 +0200598 info->ram->duplicate = ram_counters.duplicate;
Juan Quintelabedf53c2017-03-13 20:35:54 +0100599 /* legacy value. It is not used anymore */
600 info->ram->skipped = 0;
Juan Quintela93604472017-06-06 19:49:03 +0200601 info->ram->normal = ram_counters.normal;
602 info->ram->normal_bytes = ram_counters.normal *
Juan Quintela20afaed2017-03-21 09:09:14 +0100603 qemu_target_page_size();
Dr. David Alan Gilberta22463a2016-06-13 12:16:41 +0100604 info->ram->mbps = s->mbps;
Juan Quintela93604472017-06-06 19:49:03 +0200605 info->ram->dirty_sync_count = ram_counters.dirty_sync_count;
606 info->ram->postcopy_requests = ram_counters.postcopy_requests;
Chao Fan030ce1f2017-03-21 10:22:43 +0800607 info->ram->page_size = qemu_target_page_size();
Dr. David Alan Gilberta22463a2016-06-13 12:16:41 +0100608
Juan Quintela114f5ae2017-05-04 10:09:21 +0200609 if (migrate_use_xbzrle()) {
610 info->has_xbzrle_cache = true;
611 info->xbzrle_cache = g_malloc0(sizeof(*info->xbzrle_cache));
612 info->xbzrle_cache->cache_size = migrate_xbzrle_cache_size();
Juan Quintela93604472017-06-06 19:49:03 +0200613 info->xbzrle_cache->bytes = xbzrle_counters.bytes;
614 info->xbzrle_cache->pages = xbzrle_counters.pages;
615 info->xbzrle_cache->cache_miss = xbzrle_counters.cache_miss;
616 info->xbzrle_cache->cache_miss_rate = xbzrle_counters.cache_miss_rate;
617 info->xbzrle_cache->overflow = xbzrle_counters.overflow;
Juan Quintela114f5ae2017-05-04 10:09:21 +0200618 }
619
Juan Quintela338182c2017-05-03 13:16:38 +0200620 if (cpu_throttle_active()) {
621 info->has_cpu_throttle_percentage = true;
622 info->cpu_throttle_percentage = cpu_throttle_get_percentage();
623 }
624
Dr. David Alan Gilberta22463a2016-06-13 12:16:41 +0100625 if (s->state != MIGRATION_STATUS_COMPLETED) {
626 info->ram->remaining = ram_bytes_remaining();
Juan Quintela93604472017-06-06 19:49:03 +0200627 info->ram->dirty_pages_rate = ram_counters.dirty_pages_rate;
Dr. David Alan Gilberta22463a2016-06-13 12:16:41 +0100628 }
629}
630
Juan Quintela930ac042017-05-04 10:21:46 +0200631static void populate_disk_info(MigrationInfo *info)
632{
633 if (blk_mig_active()) {
634 info->has_disk = true;
635 info->disk = g_malloc0(sizeof(*info->disk));
636 info->disk->transferred = blk_mig_bytes_transferred();
637 info->disk->remaining = blk_mig_bytes_remaining();
638 info->disk->total = blk_mig_bytes_total();
639 }
640}
641
Alexey Perevalov65ace062018-03-22 21:17:27 +0300642static void fill_source_migration_info(MigrationInfo *info)
aliguori5bb79102008-10-13 03:12:02 +0000643{
Juan Quintela17549e82011-10-05 13:50:43 +0200644 MigrationState *s = migrate_get_current();
aliguori376253e2009-03-05 23:01:23 +0000645
Juan Quintela17549e82011-10-05 13:50:43 +0200646 switch (s->state) {
zhanghailiang31194732015-03-13 16:08:38 +0800647 case MIGRATION_STATUS_NONE:
Juan Quintela17549e82011-10-05 13:50:43 +0200648 /* no migration has happened ever */
Alexey Perevalov65ace062018-03-22 21:17:27 +0300649 /* do not overwrite destination migration status */
650 return;
Juan Quintela17549e82011-10-05 13:50:43 +0200651 break;
zhanghailiang31194732015-03-13 16:08:38 +0800652 case MIGRATION_STATUS_SETUP:
Michael R. Hines29ae8a42013-07-22 10:01:57 -0400653 info->has_status = true;
Michael R. Hinesed4fbd12013-07-22 10:01:58 -0400654 info->has_total_time = false;
Michael R. Hines29ae8a42013-07-22 10:01:57 -0400655 break;
zhanghailiang31194732015-03-13 16:08:38 +0800656 case MIGRATION_STATUS_ACTIVE:
657 case MIGRATION_STATUS_CANCELLING:
Dr. David Alan Gilbert9ec055a2015-11-05 18:10:58 +0000658 case MIGRATION_STATUS_POSTCOPY_ACTIVE:
Dr. David Alan Gilbert31e06072017-10-20 10:05:51 +0100659 case MIGRATION_STATUS_PRE_SWITCHOVER:
660 case MIGRATION_STATUS_DEVICE:
Peter Xua688d2c2018-05-02 18:47:18 +0800661 case MIGRATION_STATUS_POSTCOPY_PAUSED:
Peter Xu135b87b2018-05-02 18:47:25 +0800662 case MIGRATION_STATUS_POSTCOPY_RECOVER:
Juan Quintelac8f9f4f2017-06-06 19:21:29 +0200663 /* TODO add some postcopy stats */
Dr. David Alan Gilbert9ec055a2015-11-05 18:10:58 +0000664 info->has_status = true;
665 info->has_total_time = true;
666 info->total_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME)
Peter Xu4af246a2018-01-03 20:20:08 +0800667 - s->start_time;
Dr. David Alan Gilbert9ec055a2015-11-05 18:10:58 +0000668 info->has_expected_downtime = true;
669 info->expected_downtime = s->expected_downtime;
670 info->has_setup_time = true;
671 info->setup_time = s->setup_time;
672
Dr. David Alan Gilberta22463a2016-06-13 12:16:41 +0100673 populate_ram_info(info, s);
Juan Quintela930ac042017-05-04 10:21:46 +0200674 populate_disk_info(info);
Dr. David Alan Gilbert9ec055a2015-11-05 18:10:58 +0000675 break;
zhanghailiang0b827d52016-10-27 14:42:54 +0800676 case MIGRATION_STATUS_COLO:
677 info->has_status = true;
678 /* TODO: display COLO specific information (checkpoint info etc.) */
679 break;
zhanghailiang31194732015-03-13 16:08:38 +0800680 case MIGRATION_STATUS_COMPLETED:
Luiz Capitulino791e7c82011-09-13 17:37:16 -0300681 info->has_status = true;
Pawit Pornkitprasan00c14992013-07-19 11:23:45 +0900682 info->has_total_time = true;
Juan Quintela7aa939a2012-08-18 13:17:10 +0200683 info->total_time = s->total_time;
Juan Quintela9c5a9fc2012-08-13 09:35:16 +0200684 info->has_downtime = true;
685 info->downtime = s->downtime;
Michael R. Hinesed4fbd12013-07-22 10:01:58 -0400686 info->has_setup_time = true;
687 info->setup_time = s->setup_time;
Juan Quintelad5f8a572012-05-21 22:01:07 +0200688
Dr. David Alan Gilberta22463a2016-06-13 12:16:41 +0100689 populate_ram_info(info, s);
Juan Quintela17549e82011-10-05 13:50:43 +0200690 break;
zhanghailiang31194732015-03-13 16:08:38 +0800691 case MIGRATION_STATUS_FAILED:
Luiz Capitulino791e7c82011-09-13 17:37:16 -0300692 info->has_status = true;
Daniel P. Berranged59ce6f2016-04-27 11:05:00 +0100693 if (s->error) {
694 info->has_error_desc = true;
695 info->error_desc = g_strdup(error_get_pretty(s->error));
696 }
Juan Quintela17549e82011-10-05 13:50:43 +0200697 break;
zhanghailiang31194732015-03-13 16:08:38 +0800698 case MIGRATION_STATUS_CANCELLED:
Luiz Capitulino791e7c82011-09-13 17:37:16 -0300699 info->has_status = true;
Juan Quintela17549e82011-10-05 13:50:43 +0200700 break;
aliguori5bb79102008-10-13 03:12:02 +0000701 }
zhanghailiangcde63fb2015-03-13 16:08:41 +0800702 info->status = s->state;
aliguori5bb79102008-10-13 03:12:02 +0000703}
704
Peter Xu4a842142017-07-18 11:39:08 +0800705/**
706 * @migration_caps_check - check capability validity
707 *
708 * @cap_list: old capability list, array of bool
709 * @params: new capabilities to be applied soon
710 * @errp: set *errp if the check failed, with reason
711 *
712 * Returns true if check passed, otherwise false.
713 */
714static bool migrate_caps_check(bool *cap_list,
715 MigrationCapabilityStatusList *params,
716 Error **errp)
Orit Wasserman00458432012-08-06 21:42:48 +0300717{
Orit Wasserman00458432012-08-06 21:42:48 +0300718 MigrationCapabilityStatusList *cap;
Peter Xu4a842142017-07-18 11:39:08 +0800719 bool old_postcopy_cap;
Alexey Perevalovd7651f12017-09-19 19:47:56 +0300720 MigrationIncomingState *mis = migration_incoming_get_current();
Orit Wasserman00458432012-08-06 21:42:48 +0300721
Peter Xu4a842142017-07-18 11:39:08 +0800722 old_postcopy_cap = cap_list[MIGRATION_CAPABILITY_POSTCOPY_RAM];
Orit Wasserman00458432012-08-06 21:42:48 +0300723
724 for (cap = params; cap; cap = cap->next) {
Peter Xu4a842142017-07-18 11:39:08 +0800725 cap_list[cap->value->capability] = cap->value->state;
Orit Wasserman00458432012-08-06 21:42:48 +0300726 }
Dr. David Alan Gilbert53dd3702015-11-05 18:10:51 +0000727
Peter Xu4a842142017-07-18 11:39:08 +0800728#ifndef CONFIG_LIVE_BLOCK_MIGRATION
729 if (cap_list[MIGRATION_CAPABILITY_BLOCK]) {
730 error_setg(errp, "QEMU compiled without old-style (blk/-b, inc/-i) "
731 "block migration");
732 error_append_hint(errp, "Use drive_mirror+NBD instead.\n");
733 return false;
734 }
735#endif
736
737 if (cap_list[MIGRATION_CAPABILITY_POSTCOPY_RAM]) {
738 if (cap_list[MIGRATION_CAPABILITY_COMPRESS]) {
Dr. David Alan Gilbert53dd3702015-11-05 18:10:51 +0000739 /* The decompression threads asynchronously write into RAM
740 * rather than use the atomic copies needed to avoid
741 * userfaulting. It should be possible to fix the decompression
742 * threads for compatibility in future.
743 */
Peter Xu4a842142017-07-18 11:39:08 +0800744 error_setg(errp, "Postcopy is not currently compatible "
745 "with compression");
746 return false;
Dr. David Alan Gilbert53dd3702015-11-05 18:10:51 +0000747 }
Peter Xu4a842142017-07-18 11:39:08 +0800748
Dr. David Alan Gilbert096631b2016-06-13 12:16:45 +0100749 /* This check is reasonably expensive, so only when it's being
750 * set the first time, also it's only the destination that needs
751 * special support.
752 */
753 if (!old_postcopy_cap && runstate_check(RUN_STATE_INMIGRATE) &&
Alexey Perevalovd7651f12017-09-19 19:47:56 +0300754 !postcopy_ram_supported_by_host(mis)) {
Dr. David Alan Gilbert096631b2016-06-13 12:16:45 +0100755 /* postcopy_ram_supported_by_host will have emitted a more
756 * detailed message
757 */
Peter Xu4a842142017-07-18 11:39:08 +0800758 error_setg(errp, "Postcopy is not supported");
759 return false;
Dr. David Alan Gilbert096631b2016-06-13 12:16:45 +0100760 }
Dr. David Alan Gilbert53dd3702015-11-05 18:10:51 +0000761 }
Peter Xu4a842142017-07-18 11:39:08 +0800762
763 return true;
764}
765
Alexey Perevalov65ace062018-03-22 21:17:27 +0300766static void fill_destination_migration_info(MigrationInfo *info)
767{
768 MigrationIncomingState *mis = migration_incoming_get_current();
769
770 switch (mis->state) {
771 case MIGRATION_STATUS_NONE:
772 return;
773 break;
774 case MIGRATION_STATUS_SETUP:
775 case MIGRATION_STATUS_CANCELLING:
776 case MIGRATION_STATUS_CANCELLED:
777 case MIGRATION_STATUS_ACTIVE:
778 case MIGRATION_STATUS_POSTCOPY_ACTIVE:
779 case MIGRATION_STATUS_FAILED:
780 case MIGRATION_STATUS_COLO:
781 info->has_status = true;
782 break;
783 case MIGRATION_STATUS_COMPLETED:
784 info->has_status = true;
785 fill_destination_postcopy_migration_info(info);
786 break;
787 }
788 info->status = mis->state;
789}
790
791MigrationInfo *qmp_query_migrate(Error **errp)
792{
793 MigrationInfo *info = g_malloc0(sizeof(*info));
794
795 fill_destination_migration_info(info);
796 fill_source_migration_info(info);
797
798 return info;
799}
800
Peter Xu4a842142017-07-18 11:39:08 +0800801void qmp_migrate_set_capabilities(MigrationCapabilityStatusList *params,
802 Error **errp)
803{
804 MigrationState *s = migrate_get_current();
805 MigrationCapabilityStatusList *cap;
Peter Xudd0ee302018-03-05 17:49:38 +0800806 bool cap_list[MIGRATION_CAPABILITY__MAX];
Peter Xu4a842142017-07-18 11:39:08 +0800807
808 if (migration_is_setup_or_active(s->state)) {
809 error_setg(errp, QERR_MIGRATION_ACTIVE);
810 return;
811 }
812
Peter Xudd0ee302018-03-05 17:49:38 +0800813 memcpy(cap_list, s->enabled_capabilities, sizeof(cap_list));
814 if (!migrate_caps_check(cap_list, params, errp)) {
Peter Xu4a842142017-07-18 11:39:08 +0800815 return;
816 }
817
818 for (cap = params; cap; cap = cap->next) {
819 s->enabled_capabilities[cap->value->capability] = cap->value->state;
820 }
Orit Wasserman00458432012-08-06 21:42:48 +0300821}
822
Peter Xu16d063b2017-07-18 11:39:04 +0800823/*
824 * Check whether the parameters are valid. Error will be put into errp
825 * (if provided). Return true if valid, otherwise false.
826 */
827static bool migrate_params_check(MigrationParameters *params, Error **errp)
Liang Li85de8322015-03-23 16:32:28 +0800828{
Eric Blake7f375e02016-09-08 22:14:16 -0500829 if (params->has_compress_level &&
Juan Quintela741d4082017-12-01 13:08:38 +0100830 (params->compress_level > 9)) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +0100831 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "compress_level",
832 "is invalid, it should be in the range of 0 to 9");
Peter Xu16d063b2017-07-18 11:39:04 +0800833 return false;
Liang Li85de8322015-03-23 16:32:28 +0800834 }
Peter Xu16d063b2017-07-18 11:39:04 +0800835
Juan Quintela741d4082017-12-01 13:08:38 +0100836 if (params->has_compress_threads && (params->compress_threads < 1)) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +0100837 error_setg(errp, QERR_INVALID_PARAMETER_VALUE,
838 "compress_threads",
839 "is invalid, it should be in the range of 1 to 255");
Peter Xu16d063b2017-07-18 11:39:04 +0800840 return false;
Liang Li85de8322015-03-23 16:32:28 +0800841 }
Peter Xu16d063b2017-07-18 11:39:04 +0800842
Juan Quintela741d4082017-12-01 13:08:38 +0100843 if (params->has_decompress_threads && (params->decompress_threads < 1)) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +0100844 error_setg(errp, QERR_INVALID_PARAMETER_VALUE,
845 "decompress_threads",
846 "is invalid, it should be in the range of 1 to 255");
Peter Xu16d063b2017-07-18 11:39:04 +0800847 return false;
Liang Li85de8322015-03-23 16:32:28 +0800848 }
Peter Xu16d063b2017-07-18 11:39:04 +0800849
Eric Blake7f375e02016-09-08 22:14:16 -0500850 if (params->has_cpu_throttle_initial &&
851 (params->cpu_throttle_initial < 1 ||
852 params->cpu_throttle_initial > 99)) {
Jason J. Herne1626fee2015-09-08 13:12:34 -0400853 error_setg(errp, QERR_INVALID_PARAMETER_VALUE,
Jason J. Herned85a31d2016-04-21 14:07:18 -0400854 "cpu_throttle_initial",
Jason J. Herne1626fee2015-09-08 13:12:34 -0400855 "an integer in the range of 1 to 99");
Peter Xu16d063b2017-07-18 11:39:04 +0800856 return false;
Jason J. Herne1626fee2015-09-08 13:12:34 -0400857 }
Peter Xu16d063b2017-07-18 11:39:04 +0800858
Eric Blake7f375e02016-09-08 22:14:16 -0500859 if (params->has_cpu_throttle_increment &&
860 (params->cpu_throttle_increment < 1 ||
861 params->cpu_throttle_increment > 99)) {
Jason J. Herne1626fee2015-09-08 13:12:34 -0400862 error_setg(errp, QERR_INVALID_PARAMETER_VALUE,
Jason J. Herned85a31d2016-04-21 14:07:18 -0400863 "cpu_throttle_increment",
Jason J. Herne1626fee2015-09-08 13:12:34 -0400864 "an integer in the range of 1 to 99");
Peter Xu16d063b2017-07-18 11:39:04 +0800865 return false;
Jason J. Herne1626fee2015-09-08 13:12:34 -0400866 }
Peter Xu16d063b2017-07-18 11:39:04 +0800867
Juan Quintela741d4082017-12-01 13:08:38 +0100868 if (params->has_max_bandwidth && (params->max_bandwidth > SIZE_MAX)) {
Ashijeet Acharya2ff30252016-09-15 21:50:28 +0530869 error_setg(errp, "Parameter 'max_bandwidth' expects an integer in the"
870 " range of 0 to %zu bytes/second", SIZE_MAX);
Peter Xu16d063b2017-07-18 11:39:04 +0800871 return false;
Ashijeet Acharya2ff30252016-09-15 21:50:28 +0530872 }
Peter Xu16d063b2017-07-18 11:39:04 +0800873
Ashijeet Acharya2ff30252016-09-15 21:50:28 +0530874 if (params->has_downtime_limit &&
Juan Quintela741d4082017-12-01 13:08:38 +0100875 (params->downtime_limit > MAX_MIGRATE_DOWNTIME)) {
Daniel Henrique Barboza87c9cc12017-02-22 12:17:29 -0300876 error_setg(errp, "Parameter 'downtime_limit' expects an integer in "
877 "the range of 0 to %d milliseconds",
878 MAX_MIGRATE_DOWNTIME);
Peter Xu16d063b2017-07-18 11:39:04 +0800879 return false;
Ashijeet Acharya2ff30252016-09-15 21:50:28 +0530880 }
Peter Xu16d063b2017-07-18 11:39:04 +0800881
Juan Quintela741d4082017-12-01 13:08:38 +0100882 /* x_checkpoint_delay is now always positive */
883
884 if (params->has_x_multifd_channels && (params->x_multifd_channels < 1)) {
Juan Quintela4075fb12016-01-15 08:56:17 +0100885 error_setg(errp, QERR_INVALID_PARAMETER_VALUE,
886 "multifd_channels",
887 "is invalid, it should be in the range of 1 to 255");
888 return false;
889 }
Juan Quintela0fb86602017-04-27 10:48:25 +0200890 if (params->has_x_multifd_page_count &&
Juan Quintela741d4082017-12-01 13:08:38 +0100891 (params->x_multifd_page_count < 1 ||
892 params->x_multifd_page_count > 10000)) {
Juan Quintela0fb86602017-04-27 10:48:25 +0200893 error_setg(errp, QERR_INVALID_PARAMETER_VALUE,
894 "multifd_page_count",
895 "is invalid, it should be in the range of 1 to 10000");
896 return false;
897 }
Peter Xu16d063b2017-07-18 11:39:04 +0800898
Juan Quintela73af8dd2017-10-05 21:30:10 +0200899 if (params->has_xbzrle_cache_size &&
900 (params->xbzrle_cache_size < qemu_target_page_size() ||
901 !is_power_of_2(params->xbzrle_cache_size))) {
902 error_setg(errp, QERR_INVALID_PARAMETER_VALUE,
903 "xbzrle_cache_size",
904 "is invalid, it should be bigger than target page size"
905 " and a power of two");
906 return false;
907 }
908
Peter Xu16d063b2017-07-18 11:39:04 +0800909 return true;
910}
911
Markus Armbruster1bda8b32017-07-18 13:42:11 +0200912static void migrate_params_test_apply(MigrateSetParameters *params,
913 MigrationParameters *dest)
914{
915 *dest = migrate_get_current()->parameters;
916
917 /* TODO use QAPI_CLONE() instead of duplicating it inline */
918
919 if (params->has_compress_level) {
920 dest->compress_level = params->compress_level;
921 }
922
923 if (params->has_compress_threads) {
924 dest->compress_threads = params->compress_threads;
925 }
926
927 if (params->has_decompress_threads) {
928 dest->decompress_threads = params->decompress_threads;
929 }
930
931 if (params->has_cpu_throttle_initial) {
932 dest->cpu_throttle_initial = params->cpu_throttle_initial;
933 }
934
935 if (params->has_cpu_throttle_increment) {
936 dest->cpu_throttle_increment = params->cpu_throttle_increment;
937 }
938
939 if (params->has_tls_creds) {
Markus Armbruster01fa5592017-07-18 14:42:04 +0200940 assert(params->tls_creds->type == QTYPE_QSTRING);
941 dest->tls_creds = g_strdup(params->tls_creds->u.s);
Markus Armbruster1bda8b32017-07-18 13:42:11 +0200942 }
943
944 if (params->has_tls_hostname) {
Markus Armbruster01fa5592017-07-18 14:42:04 +0200945 assert(params->tls_hostname->type == QTYPE_QSTRING);
946 dest->tls_hostname = g_strdup(params->tls_hostname->u.s);
Markus Armbruster1bda8b32017-07-18 13:42:11 +0200947 }
948
949 if (params->has_max_bandwidth) {
950 dest->max_bandwidth = params->max_bandwidth;
951 }
952
953 if (params->has_downtime_limit) {
954 dest->downtime_limit = params->downtime_limit;
955 }
956
957 if (params->has_x_checkpoint_delay) {
958 dest->x_checkpoint_delay = params->x_checkpoint_delay;
959 }
960
961 if (params->has_block_incremental) {
962 dest->block_incremental = params->block_incremental;
963 }
Juan Quintela5e7577a2017-10-09 18:07:56 +0200964 if (params->has_x_multifd_channels) {
965 dest->x_multifd_channels = params->x_multifd_channels;
966 }
967 if (params->has_x_multifd_page_count) {
968 dest->x_multifd_page_count = params->x_multifd_page_count;
969 }
Juan Quintela73af8dd2017-10-05 21:30:10 +0200970 if (params->has_xbzrle_cache_size) {
971 dest->xbzrle_cache_size = params->xbzrle_cache_size;
972 }
Markus Armbruster1bda8b32017-07-18 13:42:11 +0200973}
974
Juan Quintela73af8dd2017-10-05 21:30:10 +0200975static void migrate_params_apply(MigrateSetParameters *params, Error **errp)
Peter Xu16d063b2017-07-18 11:39:04 +0800976{
977 MigrationState *s = migrate_get_current();
978
Markus Armbrustere87fae42017-07-18 12:57:38 +0200979 /* TODO use QAPI_CLONE() instead of duplicating it inline */
980
Eric Blake7f375e02016-09-08 22:14:16 -0500981 if (params->has_compress_level) {
982 s->parameters.compress_level = params->compress_level;
Liang Li85de8322015-03-23 16:32:28 +0800983 }
Peter Xu476c72a2017-07-18 11:39:05 +0800984
Eric Blake7f375e02016-09-08 22:14:16 -0500985 if (params->has_compress_threads) {
986 s->parameters.compress_threads = params->compress_threads;
Liang Li85de8322015-03-23 16:32:28 +0800987 }
Peter Xu476c72a2017-07-18 11:39:05 +0800988
Eric Blake7f375e02016-09-08 22:14:16 -0500989 if (params->has_decompress_threads) {
990 s->parameters.decompress_threads = params->decompress_threads;
Liang Li85de8322015-03-23 16:32:28 +0800991 }
Peter Xu476c72a2017-07-18 11:39:05 +0800992
Eric Blake7f375e02016-09-08 22:14:16 -0500993 if (params->has_cpu_throttle_initial) {
994 s->parameters.cpu_throttle_initial = params->cpu_throttle_initial;
Jason J. Herne1626fee2015-09-08 13:12:34 -0400995 }
Peter Xu476c72a2017-07-18 11:39:05 +0800996
Eric Blake7f375e02016-09-08 22:14:16 -0500997 if (params->has_cpu_throttle_increment) {
998 s->parameters.cpu_throttle_increment = params->cpu_throttle_increment;
Jason J. Herne1626fee2015-09-08 13:12:34 -0400999 }
Peter Xu476c72a2017-07-18 11:39:05 +08001000
Eric Blake7f375e02016-09-08 22:14:16 -05001001 if (params->has_tls_creds) {
Daniel P. Berrange69ef1f32016-04-27 11:05:15 +01001002 g_free(s->parameters.tls_creds);
Markus Armbruster01fa5592017-07-18 14:42:04 +02001003 assert(params->tls_creds->type == QTYPE_QSTRING);
1004 s->parameters.tls_creds = g_strdup(params->tls_creds->u.s);
Daniel P. Berrange69ef1f32016-04-27 11:05:15 +01001005 }
Peter Xu476c72a2017-07-18 11:39:05 +08001006
Eric Blake7f375e02016-09-08 22:14:16 -05001007 if (params->has_tls_hostname) {
Daniel P. Berrange69ef1f32016-04-27 11:05:15 +01001008 g_free(s->parameters.tls_hostname);
Markus Armbruster01fa5592017-07-18 14:42:04 +02001009 assert(params->tls_hostname->type == QTYPE_QSTRING);
1010 s->parameters.tls_hostname = g_strdup(params->tls_hostname->u.s);
Daniel P. Berrange69ef1f32016-04-27 11:05:15 +01001011 }
Peter Xu476c72a2017-07-18 11:39:05 +08001012
Ashijeet Acharya2ff30252016-09-15 21:50:28 +05301013 if (params->has_max_bandwidth) {
1014 s->parameters.max_bandwidth = params->max_bandwidth;
1015 if (s->to_dst_file) {
1016 qemu_file_set_rate_limit(s->to_dst_file,
1017 s->parameters.max_bandwidth / XFER_LIMIT_RATIO);
1018 }
1019 }
Peter Xu476c72a2017-07-18 11:39:05 +08001020
Ashijeet Acharya2ff30252016-09-15 21:50:28 +05301021 if (params->has_downtime_limit) {
1022 s->parameters.downtime_limit = params->downtime_limit;
1023 }
zhanghailiang68b53592016-10-27 14:43:01 +08001024
1025 if (params->has_x_checkpoint_delay) {
1026 s->parameters.x_checkpoint_delay = params->x_checkpoint_delay;
zhanghailiang479125d2017-01-17 20:57:42 +08001027 if (migration_in_colo_state()) {
1028 colo_checkpoint_notify(s);
1029 }
zhanghailiang68b53592016-10-27 14:43:01 +08001030 }
Peter Xu476c72a2017-07-18 11:39:05 +08001031
Juan Quintela2833c592017-04-05 18:32:37 +02001032 if (params->has_block_incremental) {
1033 s->parameters.block_incremental = params->block_incremental;
1034 }
Juan Quintela4075fb12016-01-15 08:56:17 +01001035 if (params->has_x_multifd_channels) {
1036 s->parameters.x_multifd_channels = params->x_multifd_channels;
1037 }
Juan Quintela0fb86602017-04-27 10:48:25 +02001038 if (params->has_x_multifd_page_count) {
1039 s->parameters.x_multifd_page_count = params->x_multifd_page_count;
1040 }
Juan Quintela73af8dd2017-10-05 21:30:10 +02001041 if (params->has_xbzrle_cache_size) {
1042 s->parameters.xbzrle_cache_size = params->xbzrle_cache_size;
1043 xbzrle_cache_resize(params->xbzrle_cache_size, errp);
1044 }
Liang Li85de8322015-03-23 16:32:28 +08001045}
1046
Markus Armbruster1bda8b32017-07-18 13:42:11 +02001047void qmp_migrate_set_parameters(MigrateSetParameters *params, Error **errp)
Peter Xu476c72a2017-07-18 11:39:05 +08001048{
Markus Armbruster1bda8b32017-07-18 13:42:11 +02001049 MigrationParameters tmp;
1050
Markus Armbruster01fa5592017-07-18 14:42:04 +02001051 /* TODO Rewrite "" to null instead */
1052 if (params->has_tls_creds
1053 && params->tls_creds->type == QTYPE_QNULL) {
Marc-André Lureaucb3e7f02018-04-19 17:01:43 +02001054 qobject_unref(params->tls_creds->u.n);
Markus Armbruster01fa5592017-07-18 14:42:04 +02001055 params->tls_creds->type = QTYPE_QSTRING;
1056 params->tls_creds->u.s = strdup("");
1057 }
1058 /* TODO Rewrite "" to null instead */
1059 if (params->has_tls_hostname
1060 && params->tls_hostname->type == QTYPE_QNULL) {
Marc-André Lureaucb3e7f02018-04-19 17:01:43 +02001061 qobject_unref(params->tls_hostname->u.n);
Markus Armbruster01fa5592017-07-18 14:42:04 +02001062 params->tls_hostname->type = QTYPE_QSTRING;
1063 params->tls_hostname->u.s = strdup("");
1064 }
1065
Markus Armbruster1bda8b32017-07-18 13:42:11 +02001066 migrate_params_test_apply(params, &tmp);
1067
1068 if (!migrate_params_check(&tmp, errp)) {
Peter Xu476c72a2017-07-18 11:39:05 +08001069 /* Invalid parameter */
1070 return;
1071 }
1072
Juan Quintela73af8dd2017-10-05 21:30:10 +02001073 migrate_params_apply(params, errp);
Peter Xu476c72a2017-07-18 11:39:05 +08001074}
1075
Daniel P. Berrange2594f562016-04-27 11:05:14 +01001076
Dr. David Alan Gilbert4886a1b2015-11-05 18:10:56 +00001077void qmp_migrate_start_postcopy(Error **errp)
1078{
1079 MigrationState *s = migrate_get_current();
1080
Vladimir Sementsov-Ogievskiy16b0fd32018-03-13 15:34:01 -04001081 if (!migrate_postcopy()) {
Dr. David Alan Gilberta54d3402015-11-12 11:34:44 +00001082 error_setg(errp, "Enable postcopy with migrate_set_capability before"
Dr. David Alan Gilbert4886a1b2015-11-05 18:10:56 +00001083 " the start of migration");
1084 return;
1085 }
1086
1087 if (s->state == MIGRATION_STATUS_NONE) {
1088 error_setg(errp, "Postcopy must be started after migration has been"
1089 " started");
1090 return;
1091 }
1092 /*
1093 * we don't error if migration has finished since that would be racy
1094 * with issuing this command.
1095 */
1096 atomic_set(&s->start_postcopy, true);
1097}
1098
aliguori065e2812008-11-11 16:46:33 +00001099/* shared migration helpers */
1100
zhanghailiang48781e52015-12-16 11:47:33 +00001101void migrate_set_state(int *state, int old_state, int new_state)
Zhanghaoyu (A)51cf4c12013-11-07 11:01:15 +00001102{
Peter Xua31fede2017-08-30 16:32:01 +08001103 assert(new_state < MIGRATION_STATUS__MAX);
zhanghailiang48781e52015-12-16 11:47:33 +00001104 if (atomic_cmpxchg(state, old_state, new_state) == old_state) {
Peter Xua31fede2017-08-30 16:32:01 +08001105 trace_migrate_set_state(MigrationStatus_str(new_state));
Juan Quintelab05dc722015-07-07 14:44:05 +02001106 migrate_generate_event(new_state);
Zhanghaoyu (A)51cf4c12013-11-07 11:01:15 +00001107 }
1108}
1109
Peter Xu4e4a3d32017-07-18 11:39:09 +08001110static MigrationCapabilityStatusList *migrate_cap_add(
1111 MigrationCapabilityStatusList *list,
1112 MigrationCapability index,
1113 bool state)
Juan Quintela2833c592017-04-05 18:32:37 +02001114{
1115 MigrationCapabilityStatusList *cap;
1116
1117 cap = g_new0(MigrationCapabilityStatusList, 1);
1118 cap->value = g_new0(MigrationCapabilityStatus, 1);
Peter Xu4e4a3d32017-07-18 11:39:09 +08001119 cap->value->capability = index;
1120 cap->value->state = state;
1121 cap->next = list;
1122
1123 return cap;
1124}
1125
1126void migrate_set_block_enabled(bool value, Error **errp)
1127{
1128 MigrationCapabilityStatusList *cap;
1129
1130 cap = migrate_cap_add(NULL, MIGRATION_CAPABILITY_BLOCK, value);
Juan Quintela2833c592017-04-05 18:32:37 +02001131 qmp_migrate_set_capabilities(cap, errp);
1132 qapi_free_MigrationCapabilityStatusList(cap);
1133}
1134
1135static void migrate_set_block_incremental(MigrationState *s, bool value)
1136{
1137 s->parameters.block_incremental = value;
1138}
1139
1140static void block_cleanup_parameters(MigrationState *s)
1141{
1142 if (s->must_remove_block_options) {
1143 /* setting to false can never fail */
1144 migrate_set_block_enabled(false, &error_abort);
1145 migrate_set_block_incremental(s, false);
1146 s->must_remove_block_options = false;
1147 }
1148}
1149
Paolo Bonzinibb1fadc2013-02-22 17:36:21 +01001150static void migrate_fd_cleanup(void *opaque)
aliguori065e2812008-11-11 16:46:33 +00001151{
Paolo Bonzinibb1fadc2013-02-22 17:36:21 +01001152 MigrationState *s = opaque;
1153
1154 qemu_bh_delete(s->cleanup_bh);
1155 s->cleanup_bh = NULL;
1156
Peter Xu0ceccd82018-01-03 20:20:06 +08001157 qemu_savevm_state_cleanup();
1158
zhanghailiang89a02a92016-01-15 11:37:42 +08001159 if (s->to_dst_file) {
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001160 Error *local_err = NULL;
1161
Alexey Kardashevskiy9013dca2014-03-11 10:42:29 +11001162 trace_migrate_fd_cleanup();
Paolo Bonzini404a7c02013-02-22 17:36:46 +01001163 qemu_mutex_unlock_iothread();
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00001164 if (s->migration_thread_running) {
1165 qemu_thread_join(&s->thread);
1166 s->migration_thread_running = false;
1167 }
Paolo Bonzini404a7c02013-02-22 17:36:46 +01001168 qemu_mutex_lock_iothread();
1169
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001170 if (multifd_save_cleanup(&local_err) != 0) {
1171 error_report_err(local_err);
1172 }
zhanghailiang89a02a92016-01-15 11:37:42 +08001173 qemu_fclose(s->to_dst_file);
1174 s->to_dst_file = NULL;
aliguori065e2812008-11-11 16:46:33 +00001175 }
1176
Dr. David Alan Gilbert9ec055a2015-11-05 18:10:58 +00001177 assert((s->state != MIGRATION_STATUS_ACTIVE) &&
1178 (s->state != MIGRATION_STATUS_POSTCOPY_ACTIVE));
Paolo Bonzini7a2c1722013-02-22 17:36:09 +01001179
Liang Li94f5a432015-11-02 15:37:00 +08001180 if (s->state == MIGRATION_STATUS_CANCELLING) {
zhanghailiang48781e52015-12-16 11:47:33 +00001181 migrate_set_state(&s->state, MIGRATION_STATUS_CANCELLING,
Liang Li94f5a432015-11-02 15:37:00 +08001182 MIGRATION_STATUS_CANCELLED);
Paolo Bonzini7a2c1722013-02-22 17:36:09 +01001183 }
Paolo Bonzinia3fa1d72013-02-22 17:36:18 +01001184
Juan Quintela87db1a72017-09-05 12:50:22 +02001185 if (s->error) {
1186 /* It is used on info migrate. We can't free it */
1187 error_report_err(error_copy(s->error));
1188 }
Paolo Bonzinia3fa1d72013-02-22 17:36:18 +01001189 notifier_list_notify(&migration_state_notifiers, s);
Juan Quintela2833c592017-04-05 18:32:37 +02001190 block_cleanup_parameters(s);
aliguori065e2812008-11-11 16:46:33 +00001191}
1192
Juan Quintela87db1a72017-09-05 12:50:22 +02001193void migrate_set_error(MigrationState *s, const Error *error)
1194{
1195 qemu_mutex_lock(&s->error_mutex);
1196 if (!s->error) {
1197 s->error = error_copy(error);
1198 }
1199 qemu_mutex_unlock(&s->error_mutex);
1200}
1201
Daniel P. Berranged59ce6f2016-04-27 11:05:00 +01001202void migrate_fd_error(MigrationState *s, const Error *error)
aliguori065e2812008-11-11 16:46:33 +00001203{
Peter Maydell25174052016-10-21 18:41:45 +01001204 trace_migrate_fd_error(error_get_pretty(error));
zhanghailiang89a02a92016-01-15 11:37:42 +08001205 assert(s->to_dst_file == NULL);
zhanghailiang48781e52015-12-16 11:47:33 +00001206 migrate_set_state(&s->state, MIGRATION_STATUS_SETUP,
1207 MIGRATION_STATUS_FAILED);
Juan Quintela87db1a72017-09-05 12:50:22 +02001208 migrate_set_error(s, error);
Juan Quintela458cf282011-02-22 23:32:54 +01001209}
1210
Juan Quintela0edda1c2010-05-11 16:28:39 +02001211static void migrate_fd_cancel(MigrationState *s)
aliguori065e2812008-11-11 16:46:33 +00001212{
Zhanghaoyu (A)6f2b8112013-11-07 08:21:23 +00001213 int old_state ;
zhanghailiang89a02a92016-01-15 11:37:42 +08001214 QEMUFile *f = migrate_get_current()->to_dst_file;
Alexey Kardashevskiy9013dca2014-03-11 10:42:29 +11001215 trace_migrate_fd_cancel();
aliguori065e2812008-11-11 16:46:33 +00001216
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001217 if (s->rp_state.from_dst_file) {
1218 /* shutdown the rp socket, so causing the rp thread to shutdown */
1219 qemu_file_shutdown(s->rp_state.from_dst_file);
1220 }
1221
Zhanghaoyu (A)6f2b8112013-11-07 08:21:23 +00001222 do {
1223 old_state = s->state;
Dr. David Alan Gilbertf6844b92015-11-05 18:10:48 +00001224 if (!migration_is_setup_or_active(old_state)) {
Zhanghaoyu (A)6f2b8112013-11-07 08:21:23 +00001225 break;
1226 }
Dr. David Alan Gilberta7b36b42017-10-20 10:05:55 +01001227 /* If the migration is paused, kick it out of the pause */
1228 if (old_state == MIGRATION_STATUS_PRE_SWITCHOVER) {
1229 qemu_sem_post(&s->pause_sem);
1230 }
zhanghailiang48781e52015-12-16 11:47:33 +00001231 migrate_set_state(&s->state, old_state, MIGRATION_STATUS_CANCELLING);
zhanghailiang31194732015-03-13 16:08:38 +08001232 } while (s->state != MIGRATION_STATUS_CANCELLING);
Dr. David Alan Gilberta26ba262015-01-08 11:11:32 +00001233
1234 /*
1235 * If we're unlucky the migration code might be stuck somewhere in a
1236 * send/write while the network has failed and is waiting to timeout;
1237 * if we've got shutdown(2) available then we can force it to quit.
1238 * The outgoing qemu file gets closed in migrate_fd_cleanup that is
1239 * called in a bh, so there is no race against this cancel.
1240 */
zhanghailiang31194732015-03-13 16:08:38 +08001241 if (s->state == MIGRATION_STATUS_CANCELLING && f) {
Dr. David Alan Gilberta26ba262015-01-08 11:11:32 +00001242 qemu_file_shutdown(f);
1243 }
zhanghailiang1d2acc32017-01-24 15:59:52 +08001244 if (s->state == MIGRATION_STATUS_CANCELLING && s->block_inactive) {
1245 Error *local_err = NULL;
1246
1247 bdrv_invalidate_cache_all(&local_err);
1248 if (local_err) {
1249 error_report_err(local_err);
1250 } else {
1251 s->block_inactive = false;
1252 }
1253 }
aliguori065e2812008-11-11 16:46:33 +00001254}
1255
Gerd Hoffmann99a0db92010-12-13 17:30:12 +01001256void add_migration_state_change_notifier(Notifier *notify)
1257{
1258 notifier_list_add(&migration_state_notifiers, notify);
1259}
1260
1261void remove_migration_state_change_notifier(Notifier *notify)
1262{
Paolo Bonzini31552522012-01-13 17:34:01 +01001263 notifier_remove(notify);
Gerd Hoffmann99a0db92010-12-13 17:30:12 +01001264}
1265
Stefan Hajnoczi02edd2e2013-07-29 15:01:58 +02001266bool migration_in_setup(MigrationState *s)
Gerd Hoffmannafe2df62011-10-25 13:50:11 +02001267{
zhanghailiang31194732015-03-13 16:08:38 +08001268 return s->state == MIGRATION_STATUS_SETUP;
Gerd Hoffmannafe2df62011-10-25 13:50:11 +02001269}
1270
Juan Quintela70736932011-02-23 00:43:59 +01001271bool migration_has_finished(MigrationState *s)
Gerd Hoffmann99a0db92010-12-13 17:30:12 +01001272{
zhanghailiang31194732015-03-13 16:08:38 +08001273 return s->state == MIGRATION_STATUS_COMPLETED;
Gerd Hoffmann99a0db92010-12-13 17:30:12 +01001274}
Juan Quintela0edda1c2010-05-11 16:28:39 +02001275
Gerd Hoffmannafe2df62011-10-25 13:50:11 +02001276bool migration_has_failed(MigrationState *s)
1277{
zhanghailiang31194732015-03-13 16:08:38 +08001278 return (s->state == MIGRATION_STATUS_CANCELLED ||
1279 s->state == MIGRATION_STATUS_FAILED);
Gerd Hoffmannafe2df62011-10-25 13:50:11 +02001280}
1281
Juan Quintela57273092017-03-20 22:25:28 +01001282bool migration_in_postcopy(void)
Dr. David Alan Gilbert9ec055a2015-11-05 18:10:58 +00001283{
Juan Quintela57273092017-03-20 22:25:28 +01001284 MigrationState *s = migrate_get_current();
1285
Dr. David Alan Gilbert9ec055a2015-11-05 18:10:58 +00001286 return (s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE);
1287}
1288
Dr. David Alan Gilbertb82fc322016-02-22 17:17:32 +00001289bool migration_in_postcopy_after_devices(MigrationState *s)
1290{
Juan Quintela57273092017-03-20 22:25:28 +01001291 return migration_in_postcopy() && s->postcopy_after_devices;
Dr. David Alan Gilbertb82fc322016-02-22 17:17:32 +00001292}
1293
Juan Quintelafab35002017-03-22 17:36:57 +01001294bool migration_is_idle(void)
Ashijeet Acharyafe44dc92017-01-16 17:01:53 +05301295{
Juan Quintelafab35002017-03-22 17:36:57 +01001296 MigrationState *s = migrate_get_current();
Ashijeet Acharyafe44dc92017-01-16 17:01:53 +05301297
1298 switch (s->state) {
1299 case MIGRATION_STATUS_NONE:
1300 case MIGRATION_STATUS_CANCELLED:
1301 case MIGRATION_STATUS_COMPLETED:
1302 case MIGRATION_STATUS_FAILED:
1303 return true;
1304 case MIGRATION_STATUS_SETUP:
1305 case MIGRATION_STATUS_CANCELLING:
1306 case MIGRATION_STATUS_ACTIVE:
1307 case MIGRATION_STATUS_POSTCOPY_ACTIVE:
1308 case MIGRATION_STATUS_COLO:
Dr. David Alan Gilbert31e06072017-10-20 10:05:51 +01001309 case MIGRATION_STATUS_PRE_SWITCHOVER:
1310 case MIGRATION_STATUS_DEVICE:
Ashijeet Acharyafe44dc92017-01-16 17:01:53 +05301311 return false;
1312 case MIGRATION_STATUS__MAX:
1313 g_assert_not_reached();
1314 }
1315
1316 return false;
1317}
1318
Peter Xu3e0c8052018-02-08 18:31:15 +08001319void migrate_init(MigrationState *s)
Juan Quintela0edda1c2010-05-11 16:28:39 +02001320{
Dr. David Alan Gilbert389775d2015-11-12 15:38:27 +00001321 /*
1322 * Reinitialise all migration state, except
1323 * parameters/capabilities that the user set, and
1324 * locks.
1325 */
1326 s->bytes_xfer = 0;
1327 s->xfer_limit = 0;
1328 s->cleanup_bh = 0;
zhanghailiang89a02a92016-01-15 11:37:42 +08001329 s->to_dst_file = NULL;
Dr. David Alan Gilbert389775d2015-11-12 15:38:27 +00001330 s->state = MIGRATION_STATUS_NONE;
Dr. David Alan Gilbert389775d2015-11-12 15:38:27 +00001331 s->rp_state.from_dst_file = NULL;
1332 s->rp_state.error = false;
1333 s->mbps = 0.0;
1334 s->downtime = 0;
1335 s->expected_downtime = 0;
Dr. David Alan Gilbert389775d2015-11-12 15:38:27 +00001336 s->setup_time = 0;
Dr. David Alan Gilbert389775d2015-11-12 15:38:27 +00001337 s->start_postcopy = false;
Dr. David Alan Gilbertb82fc322016-02-22 17:17:32 +00001338 s->postcopy_after_devices = false;
Dr. David Alan Gilbert389775d2015-11-12 15:38:27 +00001339 s->migration_thread_running = false;
Daniel P. Berranged59ce6f2016-04-27 11:05:00 +01001340 error_free(s->error);
1341 s->error = NULL;
Juan Quintela1299c632011-11-09 21:29:01 +01001342
zhanghailiang48781e52015-12-16 11:47:33 +00001343 migrate_set_state(&s->state, MIGRATION_STATUS_NONE, MIGRATION_STATUS_SETUP);
Juan Quintela0edda1c2010-05-11 16:28:39 +02001344
Peter Xu4af246a2018-01-03 20:20:08 +08001345 s->start_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME);
1346 s->total_time = 0;
Peter Xu7287cbd2018-01-03 20:20:09 +08001347 s->vm_was_running = false;
Peter Xub15df1a2018-01-03 20:20:13 +08001348 s->iteration_initial_bytes = 0;
1349 s->threshold_size = 0;
Juan Quintela0edda1c2010-05-11 16:28:39 +02001350}
Juan Quintelacab30142011-02-22 23:54:21 +01001351
Anthony Liguorifa2756b2011-11-14 15:09:43 -06001352static GSList *migration_blockers;
1353
Ashijeet Acharyafe44dc92017-01-16 17:01:53 +05301354int migrate_add_blocker(Error *reason, Error **errp)
Anthony Liguorifa2756b2011-11-14 15:09:43 -06001355{
Peter Xu3df663e2017-06-27 12:10:15 +08001356 if (migrate_get_current()->only_migratable) {
Ashijeet Acharyab67b8c32017-01-16 17:01:54 +05301357 error_propagate(errp, error_copy(reason));
1358 error_prepend(errp, "disallowing migration blocker "
1359 "(--only_migratable) for: ");
1360 return -EACCES;
1361 }
1362
Juan Quintelafab35002017-03-22 17:36:57 +01001363 if (migration_is_idle()) {
Ashijeet Acharyafe44dc92017-01-16 17:01:53 +05301364 migration_blockers = g_slist_prepend(migration_blockers, reason);
1365 return 0;
1366 }
1367
1368 error_propagate(errp, error_copy(reason));
1369 error_prepend(errp, "disallowing migration blocker (migration in "
1370 "progress) for: ");
1371 return -EBUSY;
Anthony Liguorifa2756b2011-11-14 15:09:43 -06001372}
1373
1374void migrate_del_blocker(Error *reason)
1375{
1376 migration_blockers = g_slist_remove(migration_blockers, reason);
1377}
1378
Dr. David Alan Gilbertbf1ae1f2015-02-19 11:40:28 +00001379void qmp_migrate_incoming(const char *uri, Error **errp)
1380{
1381 Error *local_err = NULL;
Dr. David Alan Gilbert4debb5f2015-02-26 14:54:41 +00001382 static bool once = true;
Dr. David Alan Gilbertbf1ae1f2015-02-19 11:40:28 +00001383
1384 if (!deferred_incoming) {
Dr. David Alan Gilbert4debb5f2015-02-26 14:54:41 +00001385 error_setg(errp, "For use with '-incoming defer'");
Dr. David Alan Gilbertbf1ae1f2015-02-19 11:40:28 +00001386 return;
1387 }
Dr. David Alan Gilbert4debb5f2015-02-26 14:54:41 +00001388 if (!once) {
1389 error_setg(errp, "The incoming migration has already been started");
1390 }
Dr. David Alan Gilbertbf1ae1f2015-02-19 11:40:28 +00001391
1392 qemu_start_incoming_migration(uri, &local_err);
1393
1394 if (local_err) {
1395 error_propagate(errp, local_err);
1396 return;
1397 }
1398
Dr. David Alan Gilbert4debb5f2015-02-26 14:54:41 +00001399 once = false;
Dr. David Alan Gilbertbf1ae1f2015-02-19 11:40:28 +00001400}
1401
Greg Kurz24f39022016-05-04 21:44:19 +02001402bool migration_is_blocked(Error **errp)
1403{
1404 if (qemu_savevm_state_blocked(errp)) {
1405 return true;
1406 }
1407
1408 if (migration_blockers) {
Eduardo Habkost250561e2017-06-08 10:39:05 -03001409 error_propagate(errp, error_copy(migration_blockers->data));
Greg Kurz24f39022016-05-04 21:44:19 +02001410 return true;
1411 }
1412
1413 return false;
1414}
1415
Peter Xud3e35b82018-05-02 18:47:24 +08001416/* Returns true if continue to migrate, or false if error detected */
1417static bool migrate_prepare(MigrationState *s, bool blk, bool blk_inc,
1418 bool resume, Error **errp)
1419{
1420 Error *local_err = NULL;
1421
1422 if (resume) {
1423 if (s->state != MIGRATION_STATUS_POSTCOPY_PAUSED) {
1424 error_setg(errp, "Cannot resume if there is no "
1425 "paused migration");
1426 return false;
1427 }
1428 /* This is a resume, skip init status */
1429 return true;
1430 }
1431
1432 if (migration_is_setup_or_active(s->state) ||
1433 s->state == MIGRATION_STATUS_CANCELLING ||
1434 s->state == MIGRATION_STATUS_COLO) {
1435 error_setg(errp, QERR_MIGRATION_ACTIVE);
1436 return false;
1437 }
1438
1439 if (runstate_check(RUN_STATE_INMIGRATE)) {
1440 error_setg(errp, "Guest is waiting for an incoming migration");
1441 return false;
1442 }
1443
1444 if (migration_is_blocked(errp)) {
1445 return false;
1446 }
1447
1448 if (blk || blk_inc) {
1449 if (migrate_use_block() || migrate_use_block_incremental()) {
1450 error_setg(errp, "Command options are incompatible with "
1451 "current migration capabilities");
1452 return false;
1453 }
1454 migrate_set_block_enabled(true, &local_err);
1455 if (local_err) {
1456 error_propagate(errp, local_err);
1457 return false;
1458 }
1459 s->must_remove_block_options = true;
1460 }
1461
1462 if (blk_inc) {
1463 migrate_set_block_incremental(s, true);
1464 }
1465
1466 migrate_init(s);
1467
1468 return true;
1469}
1470
Luiz Capitulinoe1c37d02011-12-05 14:48:01 -02001471void qmp_migrate(const char *uri, bool has_blk, bool blk,
1472 bool has_inc, bool inc, bool has_detach, bool detach,
Peter Xu7a4da282018-05-02 18:47:23 +08001473 bool has_resume, bool resume, Error **errp)
Juan Quintelacab30142011-02-22 23:54:21 +01001474{
Paolo Bonzinibe7059c2012-10-03 14:34:33 +02001475 Error *local_err = NULL;
Juan Quintela17549e82011-10-05 13:50:43 +02001476 MigrationState *s = migrate_get_current();
Juan Quintelacab30142011-02-22 23:54:21 +01001477 const char *p;
Juan Quintelacab30142011-02-22 23:54:21 +01001478
Peter Xud3e35b82018-05-02 18:47:24 +08001479 if (!migrate_prepare(s, has_blk && blk, has_inc && inc,
1480 has_resume && resume, errp)) {
1481 /* Error detected, put into errp */
Luiz Capitulinoe1c37d02011-12-05 14:48:01 -02001482 return;
Juan Quintelacab30142011-02-22 23:54:21 +01001483 }
Juan Quintelacab30142011-02-22 23:54:21 +01001484
1485 if (strstart(uri, "tcp:", &p)) {
Paolo Bonzinif37afb52012-10-02 10:02:46 +02001486 tcp_start_outgoing_migration(s, p, &local_err);
Michael R. Hines2da776d2013-07-22 10:01:54 -04001487#ifdef CONFIG_RDMA
Michael R. Hines41310c62013-12-19 04:52:01 +08001488 } else if (strstart(uri, "rdma:", &p)) {
Michael R. Hines2da776d2013-07-22 10:01:54 -04001489 rdma_start_outgoing_migration(s, p, &local_err);
1490#endif
Juan Quintelacab30142011-02-22 23:54:21 +01001491 } else if (strstart(uri, "exec:", &p)) {
Paolo Bonzinif37afb52012-10-02 10:02:46 +02001492 exec_start_outgoing_migration(s, p, &local_err);
Juan Quintelacab30142011-02-22 23:54:21 +01001493 } else if (strstart(uri, "unix:", &p)) {
Paolo Bonzinif37afb52012-10-02 10:02:46 +02001494 unix_start_outgoing_migration(s, p, &local_err);
Juan Quintelacab30142011-02-22 23:54:21 +01001495 } else if (strstart(uri, "fd:", &p)) {
Paolo Bonzinif37afb52012-10-02 10:02:46 +02001496 fd_start_outgoing_migration(s, p, &local_err);
Juan Quintelacab30142011-02-22 23:54:21 +01001497 } else {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001498 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "uri",
1499 "a valid migration protocol");
zhanghailiang48781e52015-12-16 11:47:33 +00001500 migrate_set_state(&s->state, MIGRATION_STATUS_SETUP,
1501 MIGRATION_STATUS_FAILED);
Dr. David Alan Gilbert09576e72018-03-16 20:21:14 +00001502 block_cleanup_parameters(s);
Luiz Capitulinoe1c37d02011-12-05 14:48:01 -02001503 return;
Juan Quintelacab30142011-02-22 23:54:21 +01001504 }
1505
Paolo Bonzinif37afb52012-10-02 10:02:46 +02001506 if (local_err) {
Daniel P. Berranged59ce6f2016-04-27 11:05:00 +01001507 migrate_fd_error(s, local_err);
Paolo Bonzinif37afb52012-10-02 10:02:46 +02001508 error_propagate(errp, local_err);
Luiz Capitulinoe1c37d02011-12-05 14:48:01 -02001509 return;
Juan Quintela1299c632011-11-09 21:29:01 +01001510 }
Juan Quintelacab30142011-02-22 23:54:21 +01001511}
1512
Luiz Capitulino6cdedb02011-11-27 22:54:09 -02001513void qmp_migrate_cancel(Error **errp)
Juan Quintelacab30142011-02-22 23:54:21 +01001514{
Juan Quintela17549e82011-10-05 13:50:43 +02001515 migrate_fd_cancel(migrate_get_current());
Juan Quintelacab30142011-02-22 23:54:21 +01001516}
1517
Dr. David Alan Gilbert89cfc022017-10-20 10:05:53 +01001518void qmp_migrate_continue(MigrationStatus state, Error **errp)
1519{
1520 MigrationState *s = migrate_get_current();
1521 if (s->state != state) {
1522 error_setg(errp, "Migration not in expected state: %s",
1523 MigrationStatus_str(s->state));
1524 return;
1525 }
1526 qemu_sem_post(&s->pause_sem);
1527}
1528
Orit Wasserman9e1ba4c2012-08-06 21:42:54 +03001529void qmp_migrate_set_cache_size(int64_t value, Error **errp)
1530{
Juan Quintela73af8dd2017-10-05 21:30:10 +02001531 MigrateSetParameters p = {
1532 .has_xbzrle_cache_size = true,
1533 .xbzrle_cache_size = value,
1534 };
Orit Wasserman9e1ba4c2012-08-06 21:42:54 +03001535
Juan Quintela73af8dd2017-10-05 21:30:10 +02001536 qmp_migrate_set_parameters(&p, errp);
Orit Wasserman9e1ba4c2012-08-06 21:42:54 +03001537}
1538
1539int64_t qmp_query_migrate_cache_size(Error **errp)
1540{
1541 return migrate_xbzrle_cache_size();
1542}
1543
Luiz Capitulino3dc85382011-11-28 11:59:37 -02001544void qmp_migrate_set_speed(int64_t value, Error **errp)
Juan Quintelacab30142011-02-22 23:54:21 +01001545{
Markus Armbruster1bda8b32017-07-18 13:42:11 +02001546 MigrateSetParameters p = {
Ashijeet Acharya2ff30252016-09-15 21:50:28 +05301547 .has_max_bandwidth = true,
1548 .max_bandwidth = value,
1549 };
Juan Quintelacab30142011-02-22 23:54:21 +01001550
Ashijeet Acharya2ff30252016-09-15 21:50:28 +05301551 qmp_migrate_set_parameters(&p, errp);
Juan Quintelacab30142011-02-22 23:54:21 +01001552}
1553
Luiz Capitulino4f0a9932011-11-27 23:18:01 -02001554void qmp_migrate_set_downtime(double value, Error **errp)
Juan Quintelacab30142011-02-22 23:54:21 +01001555{
Daniel Henrique Barboza87c9cc12017-02-22 12:17:29 -03001556 if (value < 0 || value > MAX_MIGRATE_DOWNTIME_SECONDS) {
1557 error_setg(errp, "Parameter 'downtime_limit' expects an integer in "
1558 "the range of 0 to %d seconds",
1559 MAX_MIGRATE_DOWNTIME_SECONDS);
1560 return;
1561 }
1562
Ashijeet Acharya2ff30252016-09-15 21:50:28 +05301563 value *= 1000; /* Convert to milliseconds */
1564 value = MAX(0, MIN(INT64_MAX, value));
1565
Markus Armbruster1bda8b32017-07-18 13:42:11 +02001566 MigrateSetParameters p = {
Ashijeet Acharya2ff30252016-09-15 21:50:28 +05301567 .has_downtime_limit = true,
1568 .downtime_limit = value,
1569 };
1570
1571 qmp_migrate_set_parameters(&p, errp);
aliguori5bb79102008-10-13 03:12:02 +00001572}
Orit Wasserman17ad9b32012-08-06 21:42:53 +03001573
Pavel Butsykin53f09a12017-02-03 18:23:20 +03001574bool migrate_release_ram(void)
1575{
1576 MigrationState *s;
1577
1578 s = migrate_get_current();
1579
1580 return s->enabled_capabilities[MIGRATION_CAPABILITY_RELEASE_RAM];
1581}
1582
Dr. David Alan Gilbert53dd3702015-11-05 18:10:51 +00001583bool migrate_postcopy_ram(void)
1584{
1585 MigrationState *s;
1586
1587 s = migrate_get_current();
1588
Dr. David Alan Gilbert32c3db52016-03-11 09:53:36 +00001589 return s->enabled_capabilities[MIGRATION_CAPABILITY_POSTCOPY_RAM];
Dr. David Alan Gilbert53dd3702015-11-05 18:10:51 +00001590}
1591
/* True when either postcopy RAM or dirty-bitmap migration is enabled. */
bool migrate_postcopy(void)
{
    if (migrate_postcopy_ram()) {
        return true;
    }
    return migrate_dirty_bitmaps();
}
1596
Chegu Vinodbde1e2e2013-06-24 03:49:42 -06001597bool migrate_auto_converge(void)
1598{
1599 MigrationState *s;
1600
1601 s = migrate_get_current();
1602
1603 return s->enabled_capabilities[MIGRATION_CAPABILITY_AUTO_CONVERGE];
1604}
1605
Peter Lieven323004a2013-07-18 09:48:50 +02001606bool migrate_zero_blocks(void)
1607{
1608 MigrationState *s;
1609
1610 s = migrate_get_current();
1611
1612 return s->enabled_capabilities[MIGRATION_CAPABILITY_ZERO_BLOCKS];
1613}
1614
Alexey Perevalovf22f9282018-03-22 21:17:22 +03001615bool migrate_postcopy_blocktime(void)
1616{
1617 MigrationState *s;
1618
1619 s = migrate_get_current();
1620
1621 return s->enabled_capabilities[MIGRATION_CAPABILITY_POSTCOPY_BLOCKTIME];
1622}
1623
Liang Li8706d2d2015-03-23 16:32:17 +08001624bool migrate_use_compression(void)
1625{
Liang Lidde4e692015-03-23 16:32:26 +08001626 MigrationState *s;
1627
1628 s = migrate_get_current();
1629
1630 return s->enabled_capabilities[MIGRATION_CAPABILITY_COMPRESS];
Liang Li8706d2d2015-03-23 16:32:17 +08001631}
1632
1633int migrate_compress_level(void)
1634{
1635 MigrationState *s;
1636
1637 s = migrate_get_current();
1638
Daniel P. Berrange2594f562016-04-27 11:05:14 +01001639 return s->parameters.compress_level;
Liang Li8706d2d2015-03-23 16:32:17 +08001640}
1641
1642int migrate_compress_threads(void)
1643{
1644 MigrationState *s;
1645
1646 s = migrate_get_current();
1647
Daniel P. Berrange2594f562016-04-27 11:05:14 +01001648 return s->parameters.compress_threads;
Liang Li8706d2d2015-03-23 16:32:17 +08001649}
1650
Liang Li3fcb38c2015-03-23 16:32:18 +08001651int migrate_decompress_threads(void)
1652{
1653 MigrationState *s;
1654
1655 s = migrate_get_current();
1656
Daniel P. Berrange2594f562016-04-27 11:05:14 +01001657 return s->parameters.decompress_threads;
Liang Li3fcb38c2015-03-23 16:32:18 +08001658}
1659
Vladimir Sementsov-Ogievskiy55efc8c2018-03-13 15:34:00 -04001660bool migrate_dirty_bitmaps(void)
1661{
1662 MigrationState *s;
1663
1664 s = migrate_get_current();
1665
1666 return s->enabled_capabilities[MIGRATION_CAPABILITY_DIRTY_BITMAPS];
1667}
1668
Juan Quintelab05dc722015-07-07 14:44:05 +02001669bool migrate_use_events(void)
1670{
1671 MigrationState *s;
1672
1673 s = migrate_get_current();
1674
1675 return s->enabled_capabilities[MIGRATION_CAPABILITY_EVENTS];
1676}
1677
Juan Quintela30126bb2016-01-14 12:23:00 +01001678bool migrate_use_multifd(void)
1679{
1680 MigrationState *s;
1681
1682 s = migrate_get_current();
1683
1684 return s->enabled_capabilities[MIGRATION_CAPABILITY_X_MULTIFD];
1685}
1686
Dr. David Alan Gilbert93fbd032017-10-20 10:05:50 +01001687bool migrate_pause_before_switchover(void)
1688{
1689 MigrationState *s;
1690
1691 s = migrate_get_current();
1692
1693 return s->enabled_capabilities[
1694 MIGRATION_CAPABILITY_PAUSE_BEFORE_SWITCHOVER];
1695}
1696
Juan Quintela4075fb12016-01-15 08:56:17 +01001697int migrate_multifd_channels(void)
1698{
1699 MigrationState *s;
1700
1701 s = migrate_get_current();
1702
1703 return s->parameters.x_multifd_channels;
1704}
1705
Juan Quintela0fb86602017-04-27 10:48:25 +02001706int migrate_multifd_page_count(void)
1707{
1708 MigrationState *s;
1709
1710 s = migrate_get_current();
1711
1712 return s->parameters.x_multifd_page_count;
1713}
1714
Orit Wasserman17ad9b32012-08-06 21:42:53 +03001715int migrate_use_xbzrle(void)
1716{
1717 MigrationState *s;
1718
1719 s = migrate_get_current();
1720
1721 return s->enabled_capabilities[MIGRATION_CAPABILITY_XBZRLE];
1722}
1723
1724int64_t migrate_xbzrle_cache_size(void)
1725{
1726 MigrationState *s;
1727
1728 s = migrate_get_current();
1729
Juan Quintela73af8dd2017-10-05 21:30:10 +02001730 return s->parameters.xbzrle_cache_size;
Orit Wasserman17ad9b32012-08-06 21:42:53 +03001731}
Juan Quintela0d82d0e2012-10-03 14:18:33 +02001732
Juan Quintela2833c592017-04-05 18:32:37 +02001733bool migrate_use_block(void)
1734{
1735 MigrationState *s;
1736
1737 s = migrate_get_current();
1738
1739 return s->enabled_capabilities[MIGRATION_CAPABILITY_BLOCK];
1740}
1741
Peter Xuc788ada2017-06-26 18:28:55 +08001742bool migrate_use_return_path(void)
1743{
1744 MigrationState *s;
1745
1746 s = migrate_get_current();
1747
1748 return s->enabled_capabilities[MIGRATION_CAPABILITY_RETURN_PATH];
1749}
1750
Juan Quintela2833c592017-04-05 18:32:37 +02001751bool migrate_use_block_incremental(void)
1752{
1753 MigrationState *s;
1754
1755 s = migrate_get_current();
1756
1757 return s->parameters.block_incremental;
1758}
1759
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001760/* migration thread support */
1761/*
1762 * Something bad happened to the RP stream, mark an error
1763 * The caller shall print or trace something to indicate why
1764 */
1765static void mark_source_rp_bad(MigrationState *s)
1766{
1767 s->rp_state.error = true;
1768}
1769
1770static struct rp_cmd_args {
1771 ssize_t len; /* -1 = variable */
1772 const char *name;
1773} rp_cmd_args[] = {
1774 [MIG_RP_MSG_INVALID] = { .len = -1, .name = "INVALID" },
1775 [MIG_RP_MSG_SHUT] = { .len = 4, .name = "SHUT" },
1776 [MIG_RP_MSG_PONG] = { .len = 4, .name = "PONG" },
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +00001777 [MIG_RP_MSG_REQ_PAGES] = { .len = 12, .name = "REQ_PAGES" },
1778 [MIG_RP_MSG_REQ_PAGES_ID] = { .len = -1, .name = "REQ_PAGES_ID" },
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001779 [MIG_RP_MSG_MAX] = { .len = -1, .name = "MAX" },
1780};
1781
1782/*
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +00001783 * Process a request for pages received on the return path,
1784 * We're allowed to send more than requested (e.g. to round to our page size)
1785 * and we don't need to send pages that have already been sent.
1786 */
1787static void migrate_handle_rp_req_pages(MigrationState *ms, const char* rbname,
1788 ram_addr_t start, size_t len)
1789{
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00001790 long our_host_ps = getpagesize();
1791
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +00001792 trace_migrate_handle_rp_req_pages(rbname, start, len);
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00001793
1794 /*
1795 * Since we currently insist on matching page sizes, just sanity check
1796 * we're being asked for whole host pages.
1797 */
1798 if (start & (our_host_ps-1) ||
1799 (len & (our_host_ps-1))) {
1800 error_report("%s: Misaligned page request, start: " RAM_ADDR_FMT
1801 " len: %zd", __func__, start, len);
1802 mark_source_rp_bad(ms);
1803 return;
1804 }
1805
Juan Quintela96506892017-03-14 18:41:03 +01001806 if (ram_save_queue_pages(rbname, start, len)) {
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00001807 mark_source_rp_bad(ms);
1808 }
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +00001809}
1810
Peter Xu14b17422018-05-02 18:47:21 +08001811/* Return true to retry, false to quit */
1812static bool postcopy_pause_return_path_thread(MigrationState *s)
1813{
1814 trace_postcopy_pause_return_path();
1815
1816 qemu_sem_wait(&s->postcopy_pause_rp_sem);
1817
1818 trace_postcopy_pause_return_path_continued();
1819
1820 return true;
1821}
1822
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +00001823/*
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001824 * Handles messages sent on the return path towards the source VM
1825 *
1826 */
1827static void *source_return_path_thread(void *opaque)
1828{
1829 MigrationState *ms = opaque;
1830 QEMUFile *rp = ms->rp_state.from_dst_file;
1831 uint16_t header_len, header_type;
Peter Xu568b01c2016-03-09 14:12:12 +08001832 uint8_t buf[512];
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001833 uint32_t tmp32, sibling_error;
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +00001834 ram_addr_t start = 0; /* =0 to silence warning */
1835 size_t len = 0, expected_len;
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001836 int res;
1837
1838 trace_source_return_path_thread_entry();
Peter Xu14b17422018-05-02 18:47:21 +08001839
1840retry:
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001841 while (!ms->rp_state.error && !qemu_file_get_error(rp) &&
1842 migration_is_setup_or_active(ms->state)) {
1843 trace_source_return_path_thread_loop_top();
1844 header_type = qemu_get_be16(rp);
1845 header_len = qemu_get_be16(rp);
1846
Peter Xu7a9ddfb2018-02-08 18:31:05 +08001847 if (qemu_file_get_error(rp)) {
1848 mark_source_rp_bad(ms);
1849 goto out;
1850 }
1851
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001852 if (header_type >= MIG_RP_MSG_MAX ||
1853 header_type == MIG_RP_MSG_INVALID) {
1854 error_report("RP: Received invalid message 0x%04x length 0x%04x",
1855 header_type, header_len);
1856 mark_source_rp_bad(ms);
1857 goto out;
1858 }
1859
1860 if ((rp_cmd_args[header_type].len != -1 &&
1861 header_len != rp_cmd_args[header_type].len) ||
Peter Xu568b01c2016-03-09 14:12:12 +08001862 header_len > sizeof(buf)) {
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001863 error_report("RP: Received '%s' message (0x%04x) with"
1864 "incorrect length %d expecting %zu",
1865 rp_cmd_args[header_type].name, header_type, header_len,
1866 (size_t)rp_cmd_args[header_type].len);
1867 mark_source_rp_bad(ms);
1868 goto out;
1869 }
1870
1871 /* We know we've got a valid header by this point */
1872 res = qemu_get_buffer(rp, buf, header_len);
1873 if (res != header_len) {
1874 error_report("RP: Failed reading data for message 0x%04x"
1875 " read %d expected %d",
1876 header_type, res, header_len);
1877 mark_source_rp_bad(ms);
1878 goto out;
1879 }
1880
1881 /* OK, we have the message and the data */
1882 switch (header_type) {
1883 case MIG_RP_MSG_SHUT:
Peter Maydell4d885132016-06-10 17:09:22 +01001884 sibling_error = ldl_be_p(buf);
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001885 trace_source_return_path_thread_shut(sibling_error);
1886 if (sibling_error) {
1887 error_report("RP: Sibling indicated error %d", sibling_error);
1888 mark_source_rp_bad(ms);
1889 }
1890 /*
1891 * We'll let the main thread deal with closing the RP
1892 * we could do a shutdown(2) on it, but we're the only user
1893 * anyway, so there's nothing gained.
1894 */
1895 goto out;
1896
1897 case MIG_RP_MSG_PONG:
Peter Maydell4d885132016-06-10 17:09:22 +01001898 tmp32 = ldl_be_p(buf);
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001899 trace_source_return_path_thread_pong(tmp32);
1900 break;
1901
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +00001902 case MIG_RP_MSG_REQ_PAGES:
Peter Maydell4d885132016-06-10 17:09:22 +01001903 start = ldq_be_p(buf);
1904 len = ldl_be_p(buf + 8);
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +00001905 migrate_handle_rp_req_pages(ms, NULL, start, len);
1906 break;
1907
1908 case MIG_RP_MSG_REQ_PAGES_ID:
1909 expected_len = 12 + 1; /* header + termination */
1910
1911 if (header_len >= expected_len) {
Peter Maydell4d885132016-06-10 17:09:22 +01001912 start = ldq_be_p(buf);
1913 len = ldl_be_p(buf + 8);
Dr. David Alan Gilbert1e2d90e2015-11-05 18:11:07 +00001914 /* Now we expect an idstr */
1915 tmp32 = buf[12]; /* Length of the following idstr */
1916 buf[13 + tmp32] = '\0';
1917 expected_len += tmp32;
1918 }
1919 if (header_len != expected_len) {
1920 error_report("RP: Req_Page_id with length %d expecting %zd",
1921 header_len, expected_len);
1922 mark_source_rp_bad(ms);
1923 goto out;
1924 }
1925 migrate_handle_rp_req_pages(ms, (char *)&buf[13], start, len);
1926 break;
1927
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001928 default:
1929 break;
1930 }
1931 }
Peter Xu14b17422018-05-02 18:47:21 +08001932
1933out:
1934 res = qemu_file_get_error(rp);
1935 if (res) {
1936 if (res == -EIO) {
1937 /*
1938 * Maybe there is something we can do: it looks like a
1939 * network down issue, and we pause for a recovery.
1940 */
1941 if (postcopy_pause_return_path_thread(ms)) {
1942 /* Reload rp, reset the rest */
1943 rp = ms->rp_state.from_dst_file;
1944 ms->rp_state.error = false;
1945 goto retry;
1946 }
1947 }
1948
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001949 trace_source_return_path_thread_bad_end();
1950 mark_source_rp_bad(ms);
1951 }
1952
1953 trace_source_return_path_thread_end();
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001954 ms->rp_state.from_dst_file = NULL;
1955 qemu_fclose(rp);
1956 return NULL;
1957}
1958
Peter Xud3e35b82018-05-02 18:47:24 +08001959static int open_return_path_on_source(MigrationState *ms,
1960 bool create_thread)
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001961{
1962
zhanghailiang89a02a92016-01-15 11:37:42 +08001963 ms->rp_state.from_dst_file = qemu_file_get_return_path(ms->to_dst_file);
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001964 if (!ms->rp_state.from_dst_file) {
1965 return -1;
1966 }
1967
1968 trace_open_return_path_on_source();
Peter Xud3e35b82018-05-02 18:47:24 +08001969
1970 if (!create_thread) {
1971 /* We're done */
1972 return 0;
1973 }
1974
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001975 qemu_thread_create(&ms->rp_state.rp_thread, "return path",
1976 source_return_path_thread, ms, QEMU_THREAD_JOINABLE);
1977
1978 trace_open_return_path_on_source_continue();
1979
1980 return 0;
1981}
1982
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001983/* Returns 0 if the RP was ok, otherwise there was an error on the RP */
1984static int await_return_path_close_on_source(MigrationState *ms)
1985{
1986 /*
1987 * If this is a normal exit then the destination will send a SHUT and the
1988 * rp_thread will exit, however if there's an error we need to cause
1989 * it to exit.
1990 */
zhanghailiang89a02a92016-01-15 11:37:42 +08001991 if (qemu_file_get_error(ms->to_dst_file) && ms->rp_state.from_dst_file) {
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00001992 /*
1993 * shutdown(2), if we have it, will cause it to unblock if it's stuck
1994 * waiting for the destination.
1995 */
1996 qemu_file_shutdown(ms->rp_state.from_dst_file);
1997 mark_source_rp_bad(ms);
1998 }
1999 trace_await_return_path_close_on_source_joining();
2000 qemu_thread_join(&ms->rp_state.rp_thread);
2001 trace_await_return_path_close_on_source_close();
2002 return ms->rp_state.error;
2003}
2004
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002005/*
2006 * Switch from normal iteration to postcopy
2007 * Returns non-0 on error
2008 */
Peter Xu7287cbd2018-01-03 20:20:09 +08002009static int postcopy_start(MigrationState *ms)
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002010{
2011 int ret;
Daniel P. Berrange61b67d42016-04-27 11:05:01 +01002012 QIOChannelBuffer *bioc;
2013 QEMUFile *fb;
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002014 int64_t time_at_stop = qemu_clock_get_ms(QEMU_CLOCK_REALTIME);
Dr. David Alan Gilbertef8d6482017-02-02 15:59:09 +00002015 bool restart_block = false;
Dr. David Alan Gilbert0331c8c2017-10-20 10:05:56 +01002016 int cur_state = MIGRATION_STATUS_ACTIVE;
2017 if (!migrate_pause_before_switchover()) {
2018 migrate_set_state(&ms->state, MIGRATION_STATUS_ACTIVE,
2019 MIGRATION_STATUS_POSTCOPY_ACTIVE);
2020 }
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002021
2022 trace_postcopy_start();
2023 qemu_mutex_lock_iothread();
2024 trace_postcopy_start_set_run();
2025
2026 qemu_system_wakeup_request(QEMU_WAKEUP_REASON_OTHER);
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002027 global_state_store();
2028 ret = vm_stop_force_state(RUN_STATE_FINISH_MIGRATE);
Kevin Wolf76b1c7f2015-12-22 14:07:08 +01002029 if (ret < 0) {
2030 goto fail;
2031 }
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002032
Dr. David Alan Gilbert0331c8c2017-10-20 10:05:56 +01002033 ret = migration_maybe_pause(ms, &cur_state,
2034 MIGRATION_STATUS_POSTCOPY_ACTIVE);
2035 if (ret < 0) {
2036 goto fail;
2037 }
2038
Kevin Wolf76b1c7f2015-12-22 14:07:08 +01002039 ret = bdrv_inactivate_all();
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002040 if (ret < 0) {
2041 goto fail;
2042 }
Dr. David Alan Gilbertef8d6482017-02-02 15:59:09 +00002043 restart_block = true;
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002044
2045 /*
Dr. David Alan Gilbert1c0d2492015-11-11 14:02:27 +00002046 * Cause any non-postcopiable, but iterative devices to
2047 * send out their final data.
2048 */
Fam Zhenga1fbe752017-06-17 00:06:58 +08002049 qemu_savevm_state_complete_precopy(ms->to_dst_file, true, false);
Dr. David Alan Gilbert1c0d2492015-11-11 14:02:27 +00002050
2051 /*
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002052 * in Finish migrate and with the io-lock held everything should
2053 * be quiet, but we've potentially still got dirty pages and we
2054 * need to tell the destination to throw any pages it's already received
2055 * that are dirty
2056 */
Vladimir Sementsov-Ogievskiy58110f02017-07-10 19:30:16 +03002057 if (migrate_postcopy_ram()) {
2058 if (ram_postcopy_send_discard_bitmap(ms)) {
2059 error_report("postcopy send discard bitmap failed");
2060 goto fail;
2061 }
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002062 }
2063
2064 /*
2065 * send rest of state - note things that are doing postcopy
2066 * will notice we're in POSTCOPY_ACTIVE and not actually
2067 * wrap their state up here
2068 */
zhanghailiang89a02a92016-01-15 11:37:42 +08002069 qemu_file_set_rate_limit(ms->to_dst_file, INT64_MAX);
Vladimir Sementsov-Ogievskiy58110f02017-07-10 19:30:16 +03002070 if (migrate_postcopy_ram()) {
2071 /* Ping just for debugging, helps line traces up */
2072 qemu_savevm_send_ping(ms->to_dst_file, 2);
2073 }
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002074
2075 /*
2076 * While loading the device state we may trigger page transfer
2077 * requests and the fd must be free to process those, and thus
2078 * the destination must read the whole device state off the fd before
2079 * it starts processing it. Unfortunately the ad-hoc migration format
2080 * doesn't allow the destination to know the size to read without fully
2081 * parsing it through each devices load-state code (especially the open
2082 * coded devices that use get/put).
2083 * So we wrap the device state up in a package with a length at the start;
2084 * to do this we use a qemu_buf to hold the whole of the device state.
2085 */
Daniel P. Berrange61b67d42016-04-27 11:05:01 +01002086 bioc = qio_channel_buffer_new(4096);
Daniel P. Berrange6f01f132016-09-30 11:57:14 +01002087 qio_channel_set_name(QIO_CHANNEL(bioc), "migration-postcopy-buffer");
Daniel P. Berrange61b67d42016-04-27 11:05:01 +01002088 fb = qemu_fopen_channel_output(QIO_CHANNEL(bioc));
2089 object_unref(OBJECT(bioc));
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002090
Dr. David Alan Gilbertc76201a2015-11-05 18:11:18 +00002091 /*
2092 * Make sure the receiver can get incoming pages before we send the rest
2093 * of the state
2094 */
2095 qemu_savevm_send_postcopy_listen(fb);
2096
Fam Zhenga1fbe752017-06-17 00:06:58 +08002097 qemu_savevm_state_complete_precopy(fb, false, false);
Vladimir Sementsov-Ogievskiy58110f02017-07-10 19:30:16 +03002098 if (migrate_postcopy_ram()) {
2099 qemu_savevm_send_ping(fb, 3);
2100 }
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002101
2102 qemu_savevm_send_postcopy_run(fb);
2103
2104 /* <><> end of stuff going into the package */
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002105
Dr. David Alan Gilbertef8d6482017-02-02 15:59:09 +00002106 /* Last point of recovery; as soon as we send the package the destination
2107 * can open devices and potentially start running.
2108 * Lets just check again we've not got any errors.
2109 */
2110 ret = qemu_file_get_error(ms->to_dst_file);
2111 if (ret) {
2112 error_report("postcopy_start: Migration stream errored (pre package)");
2113 goto fail_closefb;
2114 }
2115
2116 restart_block = false;
2117
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002118 /* Now send that blob */
Daniel P. Berrange61b67d42016-04-27 11:05:01 +01002119 if (qemu_savevm_send_packaged(ms->to_dst_file, bioc->data, bioc->usage)) {
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002120 goto fail_closefb;
2121 }
2122 qemu_fclose(fb);
Dr. David Alan Gilbertb82fc322016-02-22 17:17:32 +00002123
2124 /* Send a notify to give a chance for anything that needs to happen
2125 * at the transition to postcopy and after the device state; in particular
2126 * spice needs to trigger a transition now
2127 */
2128 ms->postcopy_after_devices = true;
2129 notifier_list_notify(&migration_state_notifiers, ms);
2130
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002131 ms->downtime = qemu_clock_get_ms(QEMU_CLOCK_REALTIME) - time_at_stop;
2132
2133 qemu_mutex_unlock_iothread();
2134
Vladimir Sementsov-Ogievskiy58110f02017-07-10 19:30:16 +03002135 if (migrate_postcopy_ram()) {
2136 /*
2137 * Although this ping is just for debug, it could potentially be
2138 * used for getting a better measurement of downtime at the source.
2139 */
2140 qemu_savevm_send_ping(ms->to_dst_file, 4);
2141 }
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002142
Pavel Butsykinced1c612017-02-03 18:23:21 +03002143 if (migrate_release_ram()) {
2144 ram_postcopy_migrated_memory_release(ms);
2145 }
2146
zhanghailiang89a02a92016-01-15 11:37:42 +08002147 ret = qemu_file_get_error(ms->to_dst_file);
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002148 if (ret) {
2149 error_report("postcopy_start: Migration stream errored");
zhanghailiang48781e52015-12-16 11:47:33 +00002150 migrate_set_state(&ms->state, MIGRATION_STATUS_POSTCOPY_ACTIVE,
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002151 MIGRATION_STATUS_FAILED);
2152 }
2153
2154 return ret;
2155
2156fail_closefb:
2157 qemu_fclose(fb);
2158fail:
zhanghailiang48781e52015-12-16 11:47:33 +00002159 migrate_set_state(&ms->state, MIGRATION_STATUS_POSTCOPY_ACTIVE,
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002160 MIGRATION_STATUS_FAILED);
Dr. David Alan Gilbertef8d6482017-02-02 15:59:09 +00002161 if (restart_block) {
2162 /* A failure happened early enough that we know the destination hasn't
2163 * accessed block devices, so we're safe to recover.
2164 */
2165 Error *local_err = NULL;
2166
2167 bdrv_invalidate_cache_all(&local_err);
2168 if (local_err) {
2169 error_report_err(local_err);
2170 }
2171 }
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002172 qemu_mutex_unlock_iothread();
2173 return -1;
2174}
2175
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002176/**
Dr. David Alan Gilberte91d8952017-10-20 10:05:52 +01002177 * migration_maybe_pause: Pause if required to by
2178 * migrate_pause_before_switchover called with the iothread locked
2179 * Returns: 0 on success
2180 */
Dr. David Alan Gilbert0331c8c2017-10-20 10:05:56 +01002181static int migration_maybe_pause(MigrationState *s,
2182 int *current_active_state,
2183 int new_state)
Dr. David Alan Gilberte91d8952017-10-20 10:05:52 +01002184{
2185 if (!migrate_pause_before_switchover()) {
2186 return 0;
2187 }
2188
2189 /* Since leaving this state is not atomic with posting the semaphore
2190 * it's possible that someone could have issued multiple migrate_continue
2191 * and the semaphore is incorrectly positive at this point;
2192 * the docs say it's undefined to reinit a semaphore that's already
2193 * init'd, so use timedwait to eat up any existing posts.
2194 */
2195 while (qemu_sem_timedwait(&s->pause_sem, 1) == 0) {
2196 /* This block intentionally left blank */
2197 }
2198
2199 qemu_mutex_unlock_iothread();
2200 migrate_set_state(&s->state, *current_active_state,
2201 MIGRATION_STATUS_PRE_SWITCHOVER);
2202 qemu_sem_wait(&s->pause_sem);
2203 migrate_set_state(&s->state, MIGRATION_STATUS_PRE_SWITCHOVER,
Dr. David Alan Gilbert0331c8c2017-10-20 10:05:56 +01002204 new_state);
2205 *current_active_state = new_state;
Dr. David Alan Gilberte91d8952017-10-20 10:05:52 +01002206 qemu_mutex_lock_iothread();
2207
Dr. David Alan Gilbert0331c8c2017-10-20 10:05:56 +01002208 return s->state == new_state ? 0 : -EINVAL;
Dr. David Alan Gilberte91d8952017-10-20 10:05:52 +01002209}
2210
2211/**
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002212 * migration_completion: Used by migration_thread when there's not much left.
2213 * The caller 'breaks' the loop when this returns.
2214 *
2215 * @s: Current migration state
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002216 */
Peter Xu2ad87302018-01-03 20:20:14 +08002217static void migration_completion(MigrationState *s)
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002218{
2219 int ret;
Peter Xu2ad87302018-01-03 20:20:14 +08002220 int current_active_state = s->state;
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002221
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002222 if (s->state == MIGRATION_STATUS_ACTIVE) {
2223 qemu_mutex_lock_iothread();
Peter Xu64909f92018-01-03 20:20:10 +08002224 s->downtime_start = qemu_clock_get_ms(QEMU_CLOCK_REALTIME);
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002225 qemu_system_wakeup_request(QEMU_WAKEUP_REASON_OTHER);
Peter Xu7287cbd2018-01-03 20:20:09 +08002226 s->vm_was_running = runstate_is_running();
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002227 ret = global_state_store();
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002228
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002229 if (!ret) {
Fam Zhenga1fbe752017-06-17 00:06:58 +08002230 bool inactivate = !migrate_colo_enabled();
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002231 ret = vm_stop_force_state(RUN_STATE_FINISH_MIGRATE);
Kevin Wolff07fa4c2017-05-22 17:10:38 +02002232 if (ret >= 0) {
Dr. David Alan Gilbert0331c8c2017-10-20 10:05:56 +01002233 ret = migration_maybe_pause(s, &current_active_state,
2234 MIGRATION_STATUS_DEVICE);
Dr. David Alan Gilberte91d8952017-10-20 10:05:52 +01002235 }
2236 if (ret >= 0) {
Kevin Wolff07fa4c2017-05-22 17:10:38 +02002237 qemu_file_set_rate_limit(s->to_dst_file, INT64_MAX);
Fam Zhenga1fbe752017-06-17 00:06:58 +08002238 ret = qemu_savevm_state_complete_precopy(s->to_dst_file, false,
2239 inactivate);
Kevin Wolff07fa4c2017-05-22 17:10:38 +02002240 }
Fam Zhenga1fbe752017-06-17 00:06:58 +08002241 if (inactivate && ret >= 0) {
2242 s->block_inactive = true;
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002243 }
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002244 }
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002245 qemu_mutex_unlock_iothread();
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002246
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002247 if (ret < 0) {
2248 goto fail;
2249 }
2250 } else if (s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE) {
2251 trace_migration_completion_postcopy_end();
2252
zhanghailiang89a02a92016-01-15 11:37:42 +08002253 qemu_savevm_state_complete_postcopy(s->to_dst_file);
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002254 trace_migration_completion_postcopy_end_after_complete();
2255 }
2256
2257 /*
2258 * If rp was opened we must clean up the thread before
2259 * cleaning everything else up (since if there are no failures
2260 * it will wait for the destination to send it's status in
2261 * a SHUT command).
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002262 */
Peter Xu0425dc92017-05-31 18:35:34 +08002263 if (s->rp_state.from_dst_file) {
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002264 int rp_error;
Peter Xu0425dc92017-05-31 18:35:34 +08002265 trace_migration_return_path_end_before();
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002266 rp_error = await_return_path_close_on_source(s);
Peter Xu0425dc92017-05-31 18:35:34 +08002267 trace_migration_return_path_end_after(rp_error);
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002268 if (rp_error) {
Greg Kurzfe904ea2016-05-18 15:44:36 +02002269 goto fail_invalidate;
Dr. David Alan Gilbertb10ac0c2015-11-05 18:11:06 +00002270 }
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002271 }
2272
zhanghailiang89a02a92016-01-15 11:37:42 +08002273 if (qemu_file_get_error(s->to_dst_file)) {
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002274 trace_migration_completion_file_err();
Greg Kurzfe904ea2016-05-18 15:44:36 +02002275 goto fail_invalidate;
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002276 }
2277
zhanghailiang0b827d52016-10-27 14:42:54 +08002278 if (!migrate_colo_enabled()) {
2279 migrate_set_state(&s->state, current_active_state,
2280 MIGRATION_STATUS_COMPLETED);
2281 }
2282
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002283 return;
2284
Greg Kurzfe904ea2016-05-18 15:44:36 +02002285fail_invalidate:
2286 /* If not doing postcopy, vm_start() will be called: let's regain
2287 * control on images.
2288 */
Dr. David Alan Gilbert6039dd52018-02-05 09:13:37 +00002289 if (s->state == MIGRATION_STATUS_ACTIVE ||
2290 s->state == MIGRATION_STATUS_DEVICE) {
Greg Kurzfe904ea2016-05-18 15:44:36 +02002291 Error *local_err = NULL;
2292
zhanghailiang1d2acc32017-01-24 15:59:52 +08002293 qemu_mutex_lock_iothread();
Greg Kurzfe904ea2016-05-18 15:44:36 +02002294 bdrv_invalidate_cache_all(&local_err);
2295 if (local_err) {
2296 error_report_err(local_err);
zhanghailiang1d2acc32017-01-24 15:59:52 +08002297 } else {
2298 s->block_inactive = false;
Greg Kurzfe904ea2016-05-18 15:44:36 +02002299 }
zhanghailiang1d2acc32017-01-24 15:59:52 +08002300 qemu_mutex_unlock_iothread();
Greg Kurzfe904ea2016-05-18 15:44:36 +02002301 }
2302
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002303fail:
zhanghailiang48781e52015-12-16 11:47:33 +00002304 migrate_set_state(&s->state, current_active_state,
2305 MIGRATION_STATUS_FAILED);
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002306}
2307
zhanghailiang35a6ed42016-10-27 14:42:52 +08002308bool migrate_colo_enabled(void)
2309{
2310 MigrationState *s = migrate_get_current();
2311 return s->enabled_capabilities[MIGRATION_CAPABILITY_X_COLO];
2312}
2313
/* Result of the migration thread's per-iteration error check. */
typedef enum MigThrError {
    MIG_THR_ERR_NONE = 0,       /* No error detected */
    MIG_THR_ERR_RECOVERED = 1,  /* Detected error, but resumed successfully */
    MIG_THR_ERR_FATAL = 2,      /* Detected fatal error, need to exit */
} MigThrError;
2322
Peter Xu135b87b2018-05-02 18:47:25 +08002323/* Return zero if success, or <0 for error */
2324static int postcopy_do_resume(MigrationState *s)
2325{
2326 /* TODO: do the resume logic */
2327 return 0;
2328}
2329
Peter Xub23c2ad2018-05-02 18:47:19 +08002330/*
2331 * We don't return until we are in a safe state to continue current
2332 * postcopy migration. Returns MIG_THR_ERR_RECOVERED if recovered, or
2333 * MIG_THR_ERR_FATAL if unrecovery failure happened.
2334 */
2335static MigThrError postcopy_pause(MigrationState *s)
2336{
2337 assert(s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE);
Peter Xub23c2ad2018-05-02 18:47:19 +08002338
Peter Xu135b87b2018-05-02 18:47:25 +08002339 while (true) {
2340 migrate_set_state(&s->state, s->state,
2341 MIGRATION_STATUS_POSTCOPY_PAUSED);
Peter Xub23c2ad2018-05-02 18:47:19 +08002342
Peter Xu135b87b2018-05-02 18:47:25 +08002343 /* Current channel is possibly broken. Release it. */
2344 assert(s->to_dst_file);
2345 qemu_file_shutdown(s->to_dst_file);
2346 qemu_fclose(s->to_dst_file);
2347 s->to_dst_file = NULL;
Peter Xub23c2ad2018-05-02 18:47:19 +08002348
Peter Xu135b87b2018-05-02 18:47:25 +08002349 error_report("Detected IO failure for postcopy. "
2350 "Migration paused.");
2351
2352 /*
2353 * We wait until things fixed up. Then someone will setup the
2354 * status back for us.
2355 */
2356 while (s->state == MIGRATION_STATUS_POSTCOPY_PAUSED) {
2357 qemu_sem_wait(&s->postcopy_pause_sem);
2358 }
2359
2360 if (s->state == MIGRATION_STATUS_POSTCOPY_RECOVER) {
2361 /* Woken up by a recover procedure. Give it a shot */
2362
2363 /*
2364 * Firstly, let's wake up the return path now, with a new
2365 * return path channel.
2366 */
2367 qemu_sem_post(&s->postcopy_pause_rp_sem);
2368
2369 /* Do the resume logic */
2370 if (postcopy_do_resume(s) == 0) {
2371 /* Let's continue! */
2372 trace_postcopy_pause_continued();
2373 return MIG_THR_ERR_RECOVERED;
2374 } else {
2375 /*
2376 * Something wrong happened during the recovery, let's
2377 * pause again. Pause is always better than throwing
2378 * data away.
2379 */
2380 continue;
2381 }
2382 } else {
2383 /* This is not right... Time to quit. */
2384 return MIG_THR_ERR_FATAL;
2385 }
Peter Xub23c2ad2018-05-02 18:47:19 +08002386 }
Peter Xub23c2ad2018-05-02 18:47:19 +08002387}
2388
2389static MigThrError migration_detect_error(MigrationState *s)
2390{
2391 int ret;
2392
2393 /* Try to detect any file errors */
2394 ret = qemu_file_get_error(s->to_dst_file);
2395
2396 if (!ret) {
2397 /* Everything is fine */
2398 return MIG_THR_ERR_NONE;
2399 }
2400
2401 if (s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE && ret == -EIO) {
2402 /*
2403 * For postcopy, we allow the network to be down for a
2404 * while. After that, it can be continued by a
2405 * recovery phase.
2406 */
2407 return postcopy_pause(s);
2408 } else {
2409 /*
2410 * For precopy (or postcopy with error outside IO), we fail
2411 * with no time.
2412 */
2413 migrate_set_state(&s->state, s->state, MIGRATION_STATUS_FAILED);
2414 trace_migration_thread_file_err();
2415
2416 /* Time to stop the migration, now. */
2417 return MIG_THR_ERR_FATAL;
2418 }
2419}
2420
Peter Xucf011f02018-01-03 20:20:11 +08002421static void migration_calculate_complete(MigrationState *s)
2422{
2423 uint64_t bytes = qemu_ftell(s->to_dst_file);
2424 int64_t end_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME);
2425
2426 s->total_time = end_time - s->start_time;
2427 if (!s->downtime) {
2428 /*
2429 * It's still not set, so we are precopy migration. For
2430 * postcopy, downtime is calculated during postcopy_start().
2431 */
2432 s->downtime = end_time - s->downtime_start;
2433 }
2434
2435 if (s->total_time) {
2436 s->mbps = ((double) bytes * 8.0) / s->total_time / 1000;
2437 }
2438}
2439
Peter Xub15df1a2018-01-03 20:20:13 +08002440static void migration_update_counters(MigrationState *s,
2441 int64_t current_time)
2442{
2443 uint64_t transferred, time_spent;
Peter Xub15df1a2018-01-03 20:20:13 +08002444 double bandwidth;
2445
2446 if (current_time < s->iteration_start_time + BUFFER_DELAY) {
2447 return;
2448 }
2449
2450 transferred = qemu_ftell(s->to_dst_file) - s->iteration_initial_bytes;
2451 time_spent = current_time - s->iteration_start_time;
2452 bandwidth = (double)transferred / time_spent;
Wei Wang0781c1e2018-01-22 19:36:39 +08002453 s->threshold_size = bandwidth * s->parameters.downtime_limit;
Peter Xub15df1a2018-01-03 20:20:13 +08002454
2455 s->mbps = (((double) transferred * 8.0) /
2456 ((double) time_spent / 1000.0)) / 1000.0 / 1000.0;
2457
2458 /*
2459 * if we haven't sent anything, we don't want to
2460 * recalculate. 10000 is a small enough number for our purposes
2461 */
2462 if (ram_counters.dirty_pages_rate && transferred > 10000) {
2463 s->expected_downtime = ram_counters.dirty_pages_rate *
2464 qemu_target_page_size() / bandwidth;
2465 }
2466
2467 qemu_file_reset_rate_limit(s->to_dst_file);
2468
2469 s->iteration_start_time = current_time;
2470 s->iteration_initial_bytes = qemu_ftell(s->to_dst_file);
2471
2472 trace_migrate_transferred(transferred, time_spent,
Wei Wang0781c1e2018-01-22 19:36:39 +08002473 bandwidth, s->threshold_size);
Peter Xub15df1a2018-01-03 20:20:13 +08002474}
2475
/*
 * Migration thread iteration status: tells the main loop what to do after
 * one call to migration_iteration_run().
 */
typedef enum {
    /* Resume current iteration */
    MIG_ITERATE_RESUME,
    /* Skip current iteration */
    MIG_ITERATE_SKIP,
    /* Break the loop */
    MIG_ITERATE_BREAK,
} MigIterateState;
2482
2483/*
2484 * Return true if continue to the next iteration directly, false
2485 * otherwise.
2486 */
2487static MigIterateState migration_iteration_run(MigrationState *s)
2488{
Vladimir Sementsov-Ogievskiy47995022018-03-13 15:34:00 -04002489 uint64_t pending_size, pend_pre, pend_compat, pend_post;
Peter Xu2ad87302018-01-03 20:20:14 +08002490 bool in_postcopy = s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE;
2491
Vladimir Sementsov-Ogievskiy47995022018-03-13 15:34:00 -04002492 qemu_savevm_state_pending(s->to_dst_file, s->threshold_size, &pend_pre,
2493 &pend_compat, &pend_post);
2494 pending_size = pend_pre + pend_compat + pend_post;
Peter Xu2ad87302018-01-03 20:20:14 +08002495
2496 trace_migrate_pending(pending_size, s->threshold_size,
Vladimir Sementsov-Ogievskiy47995022018-03-13 15:34:00 -04002497 pend_pre, pend_compat, pend_post);
Peter Xu2ad87302018-01-03 20:20:14 +08002498
2499 if (pending_size && pending_size >= s->threshold_size) {
2500 /* Still a significant amount to transfer */
2501 if (migrate_postcopy() && !in_postcopy &&
Vladimir Sementsov-Ogievskiy47995022018-03-13 15:34:00 -04002502 pend_pre <= s->threshold_size &&
Peter Xu2ad87302018-01-03 20:20:14 +08002503 atomic_read(&s->start_postcopy)) {
2504 if (postcopy_start(s)) {
2505 error_report("%s: postcopy failed to start", __func__);
2506 }
2507 return MIG_ITERATE_SKIP;
2508 }
2509 /* Just another iteration step */
2510 qemu_savevm_state_iterate(s->to_dst_file,
2511 s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE);
2512 } else {
2513 trace_migration_thread_low_pending(pending_size);
2514 migration_completion(s);
2515 return MIG_ITERATE_BREAK;
2516 }
2517
2518 return MIG_ITERATE_RESUME;
2519}
2520
Peter Xu199aa6d2018-01-03 20:20:15 +08002521static void migration_iteration_finish(MigrationState *s)
2522{
2523 /* If we enabled cpu throttling for auto-converge, turn it off. */
2524 cpu_throttle_stop();
2525
2526 qemu_mutex_lock_iothread();
2527 switch (s->state) {
2528 case MIGRATION_STATUS_COMPLETED:
2529 migration_calculate_complete(s);
2530 runstate_set(RUN_STATE_POSTMIGRATE);
2531 break;
2532
2533 case MIGRATION_STATUS_ACTIVE:
2534 /*
2535 * We should really assert here, but since it's during
2536 * migration, let's try to reduce the usage of assertions.
2537 */
2538 if (!migrate_colo_enabled()) {
2539 error_report("%s: critical error: calling COLO code without "
2540 "COLO enabled", __func__);
2541 }
2542 migrate_start_colo_process(s);
2543 /*
2544 * Fixme: we will run VM in COLO no matter its old running state.
2545 * After exited COLO, we will keep running.
2546 */
2547 s->vm_was_running = true;
2548 /* Fallthrough */
2549 case MIGRATION_STATUS_FAILED:
2550 case MIGRATION_STATUS_CANCELLED:
2551 if (s->vm_was_running) {
2552 vm_start();
2553 } else {
2554 if (runstate_check(RUN_STATE_FINISH_MIGRATE)) {
2555 runstate_set(RUN_STATE_POSTMIGRATE);
2556 }
2557 }
2558 break;
2559
2560 default:
2561 /* Should not reach here, but if so, forgive the VM. */
2562 error_report("%s: Unknown ending state %d", __func__, s->state);
2563 break;
2564 }
2565 qemu_bh_schedule(s->cleanup_bh);
2566 qemu_mutex_unlock_iothread();
2567}
2568
Dr. David Alan Gilbert70b20472015-11-05 18:10:49 +00002569/*
2570 * Master migration thread on the source VM.
2571 * It drives the migration and pumps the data down the outgoing channel.
2572 */
Juan Quintela5f496a12013-02-22 17:36:30 +01002573static void *migration_thread(void *opaque)
Juan Quintela0d82d0e2012-10-03 14:18:33 +02002574{
Juan Quintela9848a402012-12-19 09:55:50 +01002575 MigrationState *s = opaque;
Alex Blighbc72ad62013-08-21 16:03:08 +01002576 int64_t setup_start = qemu_clock_get_ms(QEMU_CLOCK_HOST);
Peter Xub23c2ad2018-05-02 18:47:19 +08002577 MigThrError thr_error;
Juan Quintela76f59332012-10-03 20:16:24 +02002578
Paolo Bonziniab28bd22015-07-09 08:55:38 +02002579 rcu_register_thread();
2580
Peter Xub15df1a2018-01-03 20:20:13 +08002581 s->iteration_start_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME);
2582
zhanghailiang89a02a92016-01-15 11:37:42 +08002583 qemu_savevm_state_header(s->to_dst_file);
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002584
Peter Xu62a02652017-06-14 15:55:58 +08002585 /*
2586 * If we opened the return path, we need to make sure dst has it
2587 * opened as well.
2588 */
2589 if (s->rp_state.from_dst_file) {
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002590 /* Now tell the dest that it should open its end so it can reply */
zhanghailiang89a02a92016-01-15 11:37:42 +08002591 qemu_savevm_send_open_return_path(s->to_dst_file);
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002592
2593 /* And do a ping that will make stuff easier to debug */
zhanghailiang89a02a92016-01-15 11:37:42 +08002594 qemu_savevm_send_ping(s->to_dst_file, 1);
Peter Xu0425dc92017-05-31 18:35:34 +08002595 }
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002596
Vladimir Sementsov-Ogievskiy58110f02017-07-10 19:30:16 +03002597 if (migrate_postcopy()) {
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002598 /*
2599 * Tell the destination that we *might* want to do postcopy later;
2600 * if the other end can't do postcopy it should fail now, nice and
2601 * early.
2602 */
zhanghailiang89a02a92016-01-15 11:37:42 +08002603 qemu_savevm_send_postcopy_advise(s->to_dst_file);
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002604 }
2605
Juan Quintela9907e842017-06-28 11:52:24 +02002606 qemu_savevm_state_setup(s->to_dst_file);
Juan Quintela0d82d0e2012-10-03 14:18:33 +02002607
Alex Blighbc72ad62013-08-21 16:03:08 +01002608 s->setup_time = qemu_clock_get_ms(QEMU_CLOCK_HOST) - setup_start;
zhanghailiang48781e52015-12-16 11:47:33 +00002609 migrate_set_state(&s->state, MIGRATION_STATUS_SETUP,
2610 MIGRATION_STATUS_ACTIVE);
Michael R. Hines29ae8a42013-07-22 10:01:57 -04002611
Dr. David Alan Gilbert9ec055a2015-11-05 18:10:58 +00002612 trace_migration_thread_setup_complete();
2613
2614 while (s->state == MIGRATION_STATUS_ACTIVE ||
2615 s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE) {
Juan Quintelaa3e879c2013-02-01 12:39:08 +01002616 int64_t current_time;
Juan Quintela0d82d0e2012-10-03 14:18:33 +02002617
zhanghailiang89a02a92016-01-15 11:37:42 +08002618 if (!qemu_file_rate_limit(s->to_dst_file)) {
Peter Xu2ad87302018-01-03 20:20:14 +08002619 MigIterateState iter_state = migration_iteration_run(s);
2620 if (iter_state == MIG_ITERATE_SKIP) {
2621 continue;
2622 } else if (iter_state == MIG_ITERATE_BREAK) {
Dr. David Alan Gilbert09f6c852015-08-13 11:51:31 +01002623 break;
Juan Quintelac369f402012-10-03 20:33:34 +02002624 }
2625 }
Paolo Bonzinif4410a52013-02-22 17:36:20 +01002626
Peter Xub23c2ad2018-05-02 18:47:19 +08002627 /*
2628 * Try to detect any kind of failures, and see whether we
2629 * should stop the migration now.
2630 */
2631 thr_error = migration_detect_error(s);
2632 if (thr_error == MIG_THR_ERR_FATAL) {
2633 /* Stop migration */
Paolo Bonzinifd45ee22013-02-22 17:36:33 +01002634 break;
Peter Xub23c2ad2018-05-02 18:47:19 +08002635 } else if (thr_error == MIG_THR_ERR_RECOVERED) {
2636 /*
2637 * Just recovered from a e.g. network failure, reset all
2638 * the local variables. This is important to avoid
2639 * breaking transferred_bytes and bandwidth calculation
2640 */
2641 s->iteration_start_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME);
2642 s->iteration_initial_bytes = 0;
Paolo Bonzinifd45ee22013-02-22 17:36:33 +01002643 }
Peter Xub15df1a2018-01-03 20:20:13 +08002644
Alex Blighbc72ad62013-08-21 16:03:08 +01002645 current_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME);
Juan Quintela0d82d0e2012-10-03 14:18:33 +02002646
Peter Xub15df1a2018-01-03 20:20:13 +08002647 migration_update_counters(s, current_time);
Michael R. Hines7e114f82013-06-25 21:35:30 -04002648
zhanghailiang89a02a92016-01-15 11:37:42 +08002649 if (qemu_file_rate_limit(s->to_dst_file)) {
Juan Quintela0d82d0e2012-10-03 14:18:33 +02002650 /* usleep expects microseconds */
Peter Xub15df1a2018-01-03 20:20:13 +08002651 g_usleep((s->iteration_start_time + BUFFER_DELAY -
2652 current_time) * 1000);
Juan Quintela0d82d0e2012-10-03 14:18:33 +02002653 }
Paolo Bonzinia3fa1d72013-02-22 17:36:18 +01002654 }
2655
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002656 trace_migration_thread_after_loop();
Peter Xu199aa6d2018-01-03 20:20:15 +08002657 migration_iteration_finish(s);
Paolo Bonziniab28bd22015-07-09 08:55:38 +02002658 rcu_unregister_thread();
Juan Quintela0d82d0e2012-10-03 14:18:33 +02002659 return NULL;
2660}
2661
Dr. David Alan Gilbertcce80402017-12-15 17:16:54 +00002662void migrate_fd_connect(MigrationState *s, Error *error_in)
Juan Quintela0d82d0e2012-10-03 14:18:33 +02002663{
Peter Xud3e35b82018-05-02 18:47:24 +08002664 int64_t rate_limit;
2665 bool resume = s->state == MIGRATION_STATUS_POSTCOPY_PAUSED;
2666
Ashijeet Acharya2ff30252016-09-15 21:50:28 +05302667 s->expected_downtime = s->parameters.downtime_limit;
Paolo Bonzinibb1fadc2013-02-22 17:36:21 +01002668 s->cleanup_bh = qemu_bh_new(migrate_fd_cleanup, s);
Dr. David Alan Gilbertcce80402017-12-15 17:16:54 +00002669 if (error_in) {
2670 migrate_fd_error(s, error_in);
2671 migrate_fd_cleanup(s);
2672 return;
2673 }
Juan Quintela0d82d0e2012-10-03 14:18:33 +02002674
Peter Xud3e35b82018-05-02 18:47:24 +08002675 if (resume) {
2676 /* This is a resumed migration */
2677 rate_limit = INT64_MAX;
2678 } else {
2679 /* This is a fresh new migration */
2680 rate_limit = s->parameters.max_bandwidth / XFER_LIMIT_RATIO;
2681 s->expected_downtime = s->parameters.downtime_limit;
2682 s->cleanup_bh = qemu_bh_new(migrate_fd_cleanup, s);
Paolo Bonzini442773c2013-02-22 17:36:44 +01002683
Peter Xud3e35b82018-05-02 18:47:24 +08002684 /* Notify before starting migration thread */
2685 notifier_list_notify(&migration_state_notifiers, s);
2686 }
2687
2688 qemu_file_set_rate_limit(s->to_dst_file, rate_limit);
2689 qemu_file_set_blocking(s->to_dst_file, true);
Stefan Hajnoczi9287ac22013-07-29 15:01:57 +02002690
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002691 /*
Peter Xuc788ada2017-06-26 18:28:55 +08002692 * Open the return path. For postcopy, it is used exclusively. For
2693 * precopy, only if user specified "return-path" capability would
2694 * QEMU uses the return path.
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002695 */
Peter Xuc788ada2017-06-26 18:28:55 +08002696 if (migrate_postcopy_ram() || migrate_use_return_path()) {
Peter Xud3e35b82018-05-02 18:47:24 +08002697 if (open_return_path_on_source(s, !resume)) {
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002698 error_report("Unable to open return-path for postcopy");
Peter Xud3e35b82018-05-02 18:47:24 +08002699 migrate_set_state(&s->state, s->state, MIGRATION_STATUS_FAILED);
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002700 migrate_fd_cleanup(s);
2701 return;
2702 }
2703 }
2704
Peter Xud3e35b82018-05-02 18:47:24 +08002705 if (resume) {
Peter Xu135b87b2018-05-02 18:47:25 +08002706 /* Wakeup the main migration thread to do the recovery */
2707 migrate_set_state(&s->state, MIGRATION_STATUS_POSTCOPY_PAUSED,
2708 MIGRATION_STATUS_POSTCOPY_RECOVER);
2709 qemu_sem_post(&s->postcopy_pause_sem);
Peter Xud3e35b82018-05-02 18:47:24 +08002710 return;
2711 }
2712
Juan Quintelaf986c3d2016-01-14 16:52:55 +01002713 if (multifd_save_setup() != 0) {
2714 migrate_set_state(&s->state, MIGRATION_STATUS_SETUP,
2715 MIGRATION_STATUS_FAILED);
2716 migrate_fd_cleanup(s);
2717 return;
2718 }
Pankaj Gupta009fad72017-01-23 19:12:56 +05302719 qemu_thread_create(&s->thread, "live_migration", migration_thread, s,
Paolo Bonzinibb1fadc2013-02-22 17:36:21 +01002720 QEMU_THREAD_JOINABLE);
Dr. David Alan Gilbert1d34e4b2015-11-05 18:11:05 +00002721 s->migration_thread_running = true;
Juan Quintela0d82d0e2012-10-03 14:18:33 +02002722}
Dr. David Alan Gilbert093e3c42015-11-05 18:10:52 +00002723
Peter Xu9d18af92017-06-27 12:10:19 +08002724void migration_global_dump(Monitor *mon)
2725{
2726 MigrationState *ms = migrate_get_current();
2727
Juan Quintela6f0f6422017-10-26 11:49:57 +02002728 monitor_printf(mon, "globals:\n");
2729 monitor_printf(mon, "store-global-state: %s\n",
2730 ms->store_global_state ? "on" : "off");
2731 monitor_printf(mon, "only-migratable: %s\n",
2732 ms->only_migratable ? "on" : "off");
2733 monitor_printf(mon, "send-configuration: %s\n",
2734 ms->send_configuration ? "on" : "off");
2735 monitor_printf(mon, "send-section-footer: %s\n",
2736 ms->send_section_footer ? "on" : "off");
Peter Xu9d18af92017-06-27 12:10:19 +08002737}
2738
Peter Xu20814752017-07-18 11:39:03 +08002739#define DEFINE_PROP_MIG_CAP(name, x) \
2740 DEFINE_PROP_BOOL(name, MigrationState, enabled_capabilities[x], false)
2741
Peter Xu52722982017-06-27 12:10:14 +08002742static Property migration_properties[] = {
2743 DEFINE_PROP_BOOL("store-global-state", MigrationState,
2744 store_global_state, true),
Peter Xu3df663e2017-06-27 12:10:15 +08002745 DEFINE_PROP_BOOL("only-migratable", MigrationState, only_migratable, false),
Peter Xu71dd4c12017-06-27 12:10:16 +08002746 DEFINE_PROP_BOOL("send-configuration", MigrationState,
2747 send_configuration, true),
Peter Xu15c38502017-06-27 12:10:17 +08002748 DEFINE_PROP_BOOL("send-section-footer", MigrationState,
2749 send_section_footer, true),
Peter Xu89632fa2017-07-18 11:39:02 +08002750
2751 /* Migration parameters */
Juan Quintela741d4082017-12-01 13:08:38 +01002752 DEFINE_PROP_UINT8("x-compress-level", MigrationState,
Peter Xu89632fa2017-07-18 11:39:02 +08002753 parameters.compress_level,
2754 DEFAULT_MIGRATE_COMPRESS_LEVEL),
Juan Quintela741d4082017-12-01 13:08:38 +01002755 DEFINE_PROP_UINT8("x-compress-threads", MigrationState,
Peter Xu89632fa2017-07-18 11:39:02 +08002756 parameters.compress_threads,
2757 DEFAULT_MIGRATE_COMPRESS_THREAD_COUNT),
Juan Quintela741d4082017-12-01 13:08:38 +01002758 DEFINE_PROP_UINT8("x-decompress-threads", MigrationState,
Peter Xu89632fa2017-07-18 11:39:02 +08002759 parameters.decompress_threads,
2760 DEFAULT_MIGRATE_DECOMPRESS_THREAD_COUNT),
Juan Quintela741d4082017-12-01 13:08:38 +01002761 DEFINE_PROP_UINT8("x-cpu-throttle-initial", MigrationState,
Peter Xu89632fa2017-07-18 11:39:02 +08002762 parameters.cpu_throttle_initial,
2763 DEFAULT_MIGRATE_CPU_THROTTLE_INITIAL),
Juan Quintela741d4082017-12-01 13:08:38 +01002764 DEFINE_PROP_UINT8("x-cpu-throttle-increment", MigrationState,
Peter Xu89632fa2017-07-18 11:39:02 +08002765 parameters.cpu_throttle_increment,
2766 DEFAULT_MIGRATE_CPU_THROTTLE_INCREMENT),
Juan Quintela741d4082017-12-01 13:08:38 +01002767 DEFINE_PROP_SIZE("x-max-bandwidth", MigrationState,
Peter Xu89632fa2017-07-18 11:39:02 +08002768 parameters.max_bandwidth, MAX_THROTTLE),
Juan Quintela741d4082017-12-01 13:08:38 +01002769 DEFINE_PROP_UINT64("x-downtime-limit", MigrationState,
Peter Xu89632fa2017-07-18 11:39:02 +08002770 parameters.downtime_limit,
2771 DEFAULT_MIGRATE_SET_DOWNTIME),
Juan Quintela741d4082017-12-01 13:08:38 +01002772 DEFINE_PROP_UINT32("x-checkpoint-delay", MigrationState,
Peter Xu89632fa2017-07-18 11:39:02 +08002773 parameters.x_checkpoint_delay,
2774 DEFAULT_MIGRATE_X_CHECKPOINT_DELAY),
Juan Quintela741d4082017-12-01 13:08:38 +01002775 DEFINE_PROP_UINT8("x-multifd-channels", MigrationState,
Juan Quintela4075fb12016-01-15 08:56:17 +01002776 parameters.x_multifd_channels,
2777 DEFAULT_MIGRATE_MULTIFD_CHANNELS),
Juan Quintela741d4082017-12-01 13:08:38 +01002778 DEFINE_PROP_UINT32("x-multifd-page-count", MigrationState,
Juan Quintela0fb86602017-04-27 10:48:25 +02002779 parameters.x_multifd_page_count,
2780 DEFAULT_MIGRATE_MULTIFD_PAGE_COUNT),
Juan Quintela73af8dd2017-10-05 21:30:10 +02002781 DEFINE_PROP_SIZE("xbzrle-cache-size", MigrationState,
2782 parameters.xbzrle_cache_size,
2783 DEFAULT_MIGRATE_XBZRLE_CACHE_SIZE),
Peter Xu20814752017-07-18 11:39:03 +08002784
2785 /* Migration capabilities */
2786 DEFINE_PROP_MIG_CAP("x-xbzrle", MIGRATION_CAPABILITY_XBZRLE),
2787 DEFINE_PROP_MIG_CAP("x-rdma-pin-all", MIGRATION_CAPABILITY_RDMA_PIN_ALL),
2788 DEFINE_PROP_MIG_CAP("x-auto-converge", MIGRATION_CAPABILITY_AUTO_CONVERGE),
2789 DEFINE_PROP_MIG_CAP("x-zero-blocks", MIGRATION_CAPABILITY_ZERO_BLOCKS),
2790 DEFINE_PROP_MIG_CAP("x-compress", MIGRATION_CAPABILITY_COMPRESS),
2791 DEFINE_PROP_MIG_CAP("x-events", MIGRATION_CAPABILITY_EVENTS),
2792 DEFINE_PROP_MIG_CAP("x-postcopy-ram", MIGRATION_CAPABILITY_POSTCOPY_RAM),
2793 DEFINE_PROP_MIG_CAP("x-colo", MIGRATION_CAPABILITY_X_COLO),
2794 DEFINE_PROP_MIG_CAP("x-release-ram", MIGRATION_CAPABILITY_RELEASE_RAM),
2795 DEFINE_PROP_MIG_CAP("x-block", MIGRATION_CAPABILITY_BLOCK),
2796 DEFINE_PROP_MIG_CAP("x-return-path", MIGRATION_CAPABILITY_RETURN_PATH),
Juan Quintela30126bb2016-01-14 12:23:00 +01002797 DEFINE_PROP_MIG_CAP("x-multifd", MIGRATION_CAPABILITY_X_MULTIFD),
Peter Xu20814752017-07-18 11:39:03 +08002798
Peter Xu52722982017-06-27 12:10:14 +08002799 DEFINE_PROP_END_OF_LIST(),
2800};
2801
Peter Xue5cb7e72017-06-27 12:10:13 +08002802static void migration_class_init(ObjectClass *klass, void *data)
2803{
2804 DeviceClass *dc = DEVICE_CLASS(klass);
2805
2806 dc->user_creatable = false;
Peter Xu52722982017-06-27 12:10:14 +08002807 dc->props = migration_properties;
Peter Xue5cb7e72017-06-27 12:10:13 +08002808}
2809
Marc-André Lureaub91bf5e2017-08-01 17:04:18 +01002810static void migration_instance_finalize(Object *obj)
2811{
2812 MigrationState *ms = MIGRATION_OBJ(obj);
2813 MigrationParameters *params = &ms->parameters;
2814
Juan Quintela87db1a72017-09-05 12:50:22 +02002815 qemu_mutex_destroy(&ms->error_mutex);
Marc-André Lureaub91bf5e2017-08-01 17:04:18 +01002816 g_free(params->tls_hostname);
2817 g_free(params->tls_creds);
Dr. David Alan Gilberte91d8952017-10-20 10:05:52 +01002818 qemu_sem_destroy(&ms->pause_sem);
Peter Xub23c2ad2018-05-02 18:47:19 +08002819 qemu_sem_destroy(&ms->postcopy_pause_sem);
Peter Xu14b17422018-05-02 18:47:21 +08002820 qemu_sem_destroy(&ms->postcopy_pause_rp_sem);
Marc-André Lureauab105cc2018-03-06 18:09:59 +01002821 error_free(ms->error);
Marc-André Lureaub91bf5e2017-08-01 17:04:18 +01002822}
2823
Peter Xue5cb7e72017-06-27 12:10:13 +08002824static void migration_instance_init(Object *obj)
2825{
2826 MigrationState *ms = MIGRATION_OBJ(obj);
Peter Xu8b0b29d2017-07-18 11:39:06 +08002827 MigrationParameters *params = &ms->parameters;
Peter Xue5cb7e72017-06-27 12:10:13 +08002828
2829 ms->state = MIGRATION_STATUS_NONE;
Peter Xue5cb7e72017-06-27 12:10:13 +08002830 ms->mbps = -1;
Dr. David Alan Gilberte91d8952017-10-20 10:05:52 +01002831 qemu_sem_init(&ms->pause_sem, 0);
Juan Quintela87db1a72017-09-05 12:50:22 +02002832 qemu_mutex_init(&ms->error_mutex);
Peter Xu8b0b29d2017-07-18 11:39:06 +08002833
2834 params->tls_hostname = g_strdup("");
2835 params->tls_creds = g_strdup("");
2836
2837 /* Set has_* up only for parameter checks */
2838 params->has_compress_level = true;
2839 params->has_compress_threads = true;
2840 params->has_decompress_threads = true;
2841 params->has_cpu_throttle_initial = true;
2842 params->has_cpu_throttle_increment = true;
2843 params->has_max_bandwidth = true;
2844 params->has_downtime_limit = true;
2845 params->has_x_checkpoint_delay = true;
2846 params->has_block_incremental = true;
Juan Quintela4075fb12016-01-15 08:56:17 +01002847 params->has_x_multifd_channels = true;
Juan Quintela0fb86602017-04-27 10:48:25 +02002848 params->has_x_multifd_page_count = true;
Juan Quintela73af8dd2017-10-05 21:30:10 +02002849 params->has_xbzrle_cache_size = true;
Peter Xub23c2ad2018-05-02 18:47:19 +08002850
2851 qemu_sem_init(&ms->postcopy_pause_sem, 0);
Peter Xu14b17422018-05-02 18:47:21 +08002852 qemu_sem_init(&ms->postcopy_pause_rp_sem, 0);
Peter Xu8b0b29d2017-07-18 11:39:06 +08002853}
2854
2855/*
2856 * Return true if check pass, false otherwise. Error will be put
2857 * inside errp if provided.
2858 */
2859static bool migration_object_check(MigrationState *ms, Error **errp)
2860{
Peter Xu6b19a7d2017-07-18 11:39:10 +08002861 MigrationCapabilityStatusList *head = NULL;
2862 /* Assuming all off */
2863 bool cap_list[MIGRATION_CAPABILITY__MAX] = { 0 }, ret;
2864 int i;
2865
Peter Xu8b0b29d2017-07-18 11:39:06 +08002866 if (!migrate_params_check(&ms->parameters, errp)) {
2867 return false;
2868 }
2869
Peter Xu6b19a7d2017-07-18 11:39:10 +08002870 for (i = 0; i < MIGRATION_CAPABILITY__MAX; i++) {
2871 if (ms->enabled_capabilities[i]) {
2872 head = migrate_cap_add(head, i, true);
2873 }
2874 }
2875
2876 ret = migrate_caps_check(cap_list, head, errp);
2877
2878 /* It works with head == NULL */
2879 qapi_free_MigrationCapabilityStatusList(head);
2880
2881 return ret;
Peter Xue5cb7e72017-06-27 12:10:13 +08002882}
2883
2884static const TypeInfo migration_type = {
2885 .name = TYPE_MIGRATION,
Peter Xu01f6e142017-06-28 15:15:44 +08002886 /*
Peter Xuc8d3ff32017-07-05 16:21:23 +08002887 * NOTE: TYPE_MIGRATION is not really a device, as the object is
2888 * not created using qdev_create(), it is not attached to the qdev
2889 * device tree, and it is never realized.
2890 *
2891 * TODO: Make this TYPE_OBJECT once QOM provides something like
2892 * TYPE_DEVICE's "-global" properties.
Peter Xu01f6e142017-06-28 15:15:44 +08002893 */
Peter Xue5cb7e72017-06-27 12:10:13 +08002894 .parent = TYPE_DEVICE,
2895 .class_init = migration_class_init,
2896 .class_size = sizeof(MigrationClass),
2897 .instance_size = sizeof(MigrationState),
2898 .instance_init = migration_instance_init,
Marc-André Lureaub91bf5e2017-08-01 17:04:18 +01002899 .instance_finalize = migration_instance_finalize,
Peter Xue5cb7e72017-06-27 12:10:13 +08002900};
2901
2902static void register_migration_types(void)
2903{
2904 type_register_static(&migration_type);
2905}
2906
2907type_init(register_migration_types);