aliguori | 5bb7910 | 2008-10-13 03:12:02 +0000 | [diff] [blame] | 1 | /* |
| 2 | * QEMU live migration |
| 3 | * |
| 4 | * Copyright IBM, Corp. 2008 |
| 5 | * |
| 6 | * Authors: |
| 7 | * Anthony Liguori <aliguori@us.ibm.com> |
| 8 | * |
| 9 | * This work is licensed under the terms of the GNU GPL, version 2. See |
| 10 | * the COPYING file in the top-level directory. |
| 11 | * |
Paolo Bonzini | 6b620ca | 2012-01-13 17:44:23 +0100 | [diff] [blame] | 12 | * Contributions after 2012-01-13 are licensed under the terms of the |
| 13 | * GNU GPL, version 2 or (at your option) any later version. |
aliguori | 5bb7910 | 2008-10-13 03:12:02 +0000 | [diff] [blame] | 14 | */ |
| 15 | |
Peter Maydell | 1393a48 | 2016-01-26 18:16:54 +0000 | [diff] [blame] | 16 | #include "qemu/osdep.h" |
Veronia Bahaa | f348b6d | 2016-03-20 19:16:19 +0200 | [diff] [blame] | 17 | #include "qemu/cutils.h" |
Markus Armbruster | d49b683 | 2015-03-17 18:29:20 +0100 | [diff] [blame] | 18 | #include "qemu/error-report.h" |
Juan Quintela | 795c40b | 2017-04-06 12:00:28 +0200 | [diff] [blame] | 19 | #include "migration/blocker.h" |
Juan Quintela | f4dbe1b | 2017-04-05 15:54:10 +0200 | [diff] [blame] | 20 | #include "exec.h" |
Juan Quintela | 7fcac4a | 2017-04-05 15:58:29 +0200 | [diff] [blame] | 21 | #include "fd.h" |
Juan Quintela | 61e8b14 | 2017-04-05 17:40:11 +0200 | [diff] [blame] | 22 | #include "socket.h" |
Juan Quintela | e1a3ece | 2017-04-17 20:32:36 +0200 | [diff] [blame] | 23 | #include "rdma.h" |
Juan Quintela | 7b1e1a2 | 2017-04-17 20:26:27 +0200 | [diff] [blame] | 24 | #include "ram.h" |
Juan Quintela | 84a899d | 2017-04-24 18:53:30 +0200 | [diff] [blame] | 25 | #include "migration/global_state.h" |
Juan Quintela | c4b63b7 | 2017-04-24 19:02:44 +0200 | [diff] [blame] | 26 | #include "migration/misc.h" |
Juan Quintela | 6666c96 | 2017-04-24 20:07:27 +0200 | [diff] [blame] | 27 | #include "migration.h" |
Juan Quintela | 20a519a | 2017-04-20 14:48:46 +0200 | [diff] [blame] | 28 | #include "savevm.h" |
Juan Quintela | 40014d8 | 2017-04-17 19:34:36 +0200 | [diff] [blame] | 29 | #include "qemu-file-channel.h" |
Juan Quintela | 08a0aee | 2017-04-20 18:52:18 +0200 | [diff] [blame] | 30 | #include "qemu-file.h" |
Juan Quintela | 987772d | 2017-04-17 19:02:59 +0200 | [diff] [blame] | 31 | #include "migration/vmstate.h" |
Paolo Bonzini | 737e150 | 2012-12-17 18:19:44 +0100 | [diff] [blame] | 32 | #include "block/block.h" |
Markus Armbruster | e688df6 | 2018-02-01 12:18:31 +0100 | [diff] [blame] | 33 | #include "qapi/error.h" |
Markus Armbruster | 9af2398 | 2018-02-11 10:36:01 +0100 | [diff] [blame] | 34 | #include "qapi/qapi-commands-migration.h" |
| 35 | #include "qapi/qapi-events-migration.h" |
Markus Armbruster | cc7a8ea | 2015-03-17 17:22:46 +0100 | [diff] [blame] | 36 | #include "qapi/qmp/qerror.h" |
Markus Armbruster | 15280c3 | 2018-02-01 12:18:36 +0100 | [diff] [blame] | 37 | #include "qapi/qmp/qnull.h" |
Paolo Bonzini | ab28bd2 | 2015-07-09 08:55:38 +0200 | [diff] [blame] | 38 | #include "qemu/rcu.h" |
Juan Quintela | 2c9e6fe | 2017-04-21 14:31:22 +0200 | [diff] [blame] | 39 | #include "block.h" |
Juan Quintela | be07b0a | 2017-04-20 13:12:24 +0200 | [diff] [blame] | 40 | #include "postcopy-ram.h" |
Juan Quintela | 766bd17 | 2012-07-23 05:45:29 +0200 | [diff] [blame] | 41 | #include "qemu/thread.h" |
Kazuya Saito | c09e5bb | 2013-02-22 17:36:19 +0100 | [diff] [blame] | 42 | #include "trace.h" |
Juan Quintela | 5118042 | 2017-04-24 20:50:19 +0200 | [diff] [blame] | 43 | #include "exec/target_page.h" |
Daniel P. Berrange | 61b67d4 | 2016-04-27 11:05:01 +0100 | [diff] [blame] | 44 | #include "io/channel-buffer.h" |
zhanghailiang | 35a6ed4 | 2016-10-27 14:42:52 +0800 | [diff] [blame] | 45 | #include "migration/colo.h" |
Peter Xu | 4ffdb33 | 2017-06-27 12:10:18 +0800 | [diff] [blame] | 46 | #include "hw/boards.h" |
Peter Xu | 9d18af9 | 2017-06-27 12:10:19 +0800 | [diff] [blame] | 47 | #include "monitor/monitor.h" |
aliguori | 065e281 | 2008-11-11 16:46:33 +0000 | [diff] [blame] | 48 | |
/* Migration transfer speed throttling: 32 << 20 == 32 MiB */
#define MAX_THROTTLE  (32 << 20)

/*
 * Amount of time to allocate to each "chunk" of bandwidth-throttled
 * data.
 * NOTE(review): presumably milliseconds, since XFER_LIMIT_RATIO divides
 * 1000 by it -- confirm against the users of these macros.
 */
#define BUFFER_DELAY     100
#define XFER_LIMIT_RATIO (1000 / BUFFER_DELAY)

/*
 * Time in milliseconds we are allowed to stop the source
 * for sending the last part.
 */
#define DEFAULT_MIGRATE_SET_DOWNTIME 300

/*
 * Maximum migrate downtime: 2000 seconds, also expressed in
 * milliseconds as MAX_MIGRATE_DOWNTIME.
 */
#define MAX_MIGRATE_DOWNTIME_SECONDS 2000
#define MAX_MIGRATE_DOWNTIME (MAX_MIGRATE_DOWNTIME_SECONDS * 1000)

/* Default compression thread count */
#define DEFAULT_MIGRATE_COMPRESS_THREAD_COUNT 8
/*
 * Default decompression thread count; decompression is usually at
 * least 4 times as fast as compression.
 */
#define DEFAULT_MIGRATE_DECOMPRESS_THREAD_COUNT 2
/* 0: no compression, 1: best speed, ... 9: best compression ratio */
#define DEFAULT_MIGRATE_COMPRESS_LEVEL 1
/* Default auto-converge CPU throttle migration parameters */
#define DEFAULT_MIGRATE_CPU_THROTTLE_INITIAL 20
#define DEFAULT_MIGRATE_CPU_THROTTLE_INCREMENT 10
#define DEFAULT_MIGRATE_MAX_CPU_THROTTLE 99

/* Migration XBZRLE default cache size: 64 MiB */
#define DEFAULT_MIGRATE_XBZRLE_CACHE_SIZE (64 * 1024 * 1024)

/*
 * The delay time (in ms) between two COLO checkpoints.
 * Note: Please change this default value to 10000 when we support
 * hybrid mode.
 */
#define DEFAULT_MIGRATE_X_CHECKPOINT_DELAY 200
/* Defaults for the multifd channel count and page count */
#define DEFAULT_MIGRATE_MULTIFD_CHANNELS 2
#define DEFAULT_MIGRATE_MULTIFD_PAGE_COUNT 16

/*
 * Background transfer rate for postcopy; 0 means unlimited. Note
 * that page requests can still exceed this limit.
 */
#define DEFAULT_MIGRATE_MAX_POSTCOPY_BANDWIDTH 0

| 90 | |
/* Notifier list for migration state notifiers */
static NotifierList migration_state_notifiers =
    NOTIFIER_LIST_INITIALIZER(migration_state_notifiers);

/* Set once an incoming migration has been started with the "defer" uri */
static bool deferred_incoming;

/* Messages sent on the return path from destination to source */
enum mig_rp_message_type {
    MIG_RP_MSG_INVALID = 0,  /* Must be 0 */
    MIG_RP_MSG_SHUT,         /* sibling will not send any more RP messages */
    MIG_RP_MSG_PONG,         /* Response to a PING; data (seq: be32 ) */

    MIG_RP_MSG_REQ_PAGES_ID, /* data (start: be64, len: be32, id: string) */
    MIG_RP_MSG_REQ_PAGES,    /* data (start: be64, len: be32) */
    MIG_RP_MSG_RECV_BITMAP,  /* send recved_bitmap back to source */
    MIG_RP_MSG_RESUME_ACK,   /* tell source that we are ready to resume */

    MIG_RP_MSG_MAX           /* sentinel: keep last */
};

/*
 * When we add fault tolerance, we could have several migrations at
 * once. For now we don't need dynamic creation of migration state, so
 * a single outgoing and a single incoming state object are kept here.
 * Both are created by migration_object_init().
 */

static MigrationState *current_migration;
static MigrationIncomingState *current_incoming;

/* Forward declarations for helpers defined later in this file */
static bool migration_object_check(MigrationState *ms, Error **errp);
static int migration_maybe_pause(MigrationState *s,
                                 int *current_active_state,
                                 int new_state);

Peter Xu | 8b0b29d | 2017-07-18 11:39:06 +0800 | [diff] [blame] | 121 | |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 122 | void migration_object_init(void) |
| 123 | { |
Peter Xu | 4ffdb33 | 2017-06-27 12:10:18 +0800 | [diff] [blame] | 124 | MachineState *ms = MACHINE(qdev_get_machine()); |
Peter Xu | 8b0b29d | 2017-07-18 11:39:06 +0800 | [diff] [blame] | 125 | Error *err = NULL; |
Peter Xu | 4ffdb33 | 2017-06-27 12:10:18 +0800 | [diff] [blame] | 126 | |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 127 | /* This can only be called once. */ |
| 128 | assert(!current_migration); |
| 129 | current_migration = MIGRATION_OBJ(object_new(TYPE_MIGRATION)); |
Peter Xu | 4ffdb33 | 2017-06-27 12:10:18 +0800 | [diff] [blame] | 130 | |
Peter Xu | e1b1b1b | 2018-05-02 18:47:35 +0800 | [diff] [blame] | 131 | /* |
| 132 | * Init the migrate incoming object as well no matter whether |
| 133 | * we'll use it or not. |
| 134 | */ |
| 135 | assert(!current_incoming); |
| 136 | current_incoming = g_new0(MigrationIncomingState, 1); |
| 137 | current_incoming->state = MIGRATION_STATUS_NONE; |
| 138 | current_incoming->postcopy_remote_fds = |
| 139 | g_array_new(FALSE, TRUE, sizeof(struct PostCopyFD)); |
| 140 | qemu_mutex_init(¤t_incoming->rp_mutex); |
| 141 | qemu_event_init(¤t_incoming->main_thread_load_event, false); |
| 142 | qemu_sem_init(¤t_incoming->postcopy_pause_sem_dst, 0); |
| 143 | qemu_sem_init(¤t_incoming->postcopy_pause_sem_fault, 0); |
| 144 | |
| 145 | init_dirty_bitmap_incoming_migration(); |
| 146 | |
Peter Xu | 8b0b29d | 2017-07-18 11:39:06 +0800 | [diff] [blame] | 147 | if (!migration_object_check(current_migration, &err)) { |
| 148 | error_report_err(err); |
| 149 | exit(1); |
| 150 | } |
| 151 | |
Peter Xu | 4ffdb33 | 2017-06-27 12:10:18 +0800 | [diff] [blame] | 152 | /* |
| 153 | * We cannot really do this in migration_instance_init() since at |
| 154 | * that time global properties are not yet applied, then this |
| 155 | * value will be definitely replaced by something else. |
| 156 | */ |
| 157 | if (ms->enforce_config_section) { |
| 158 | current_migration->send_configuration = true; |
| 159 | } |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 160 | } |
| 161 | |
Vladimir Sementsov-Ogievskiy | 1f89560 | 2017-12-28 12:16:16 +0300 | [diff] [blame] | 162 | void migration_object_finalize(void) |
| 163 | { |
| 164 | object_unref(OBJECT(current_migration)); |
| 165 | } |
| 166 | |
Dr. David Alan Gilbert | bca7856 | 2015-05-21 13:24:14 +0100 | [diff] [blame] | 167 | /* For outgoing */ |
Juan Quintela | 859bc75 | 2012-08-13 09:42:49 +0200 | [diff] [blame] | 168 | MigrationState *migrate_get_current(void) |
Juan Quintela | 17549e8 | 2011-10-05 13:50:43 +0200 | [diff] [blame] | 169 | { |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 170 | /* This can only be called after the object created. */ |
| 171 | assert(current_migration); |
| 172 | return current_migration; |
Juan Quintela | 17549e8 | 2011-10-05 13:50:43 +0200 | [diff] [blame] | 173 | } |
| 174 | |
Dr. David Alan Gilbert | bca7856 | 2015-05-21 13:24:14 +0100 | [diff] [blame] | 175 | MigrationIncomingState *migration_incoming_get_current(void) |
| 176 | { |
Peter Xu | e1b1b1b | 2018-05-02 18:47:35 +0800 | [diff] [blame] | 177 | assert(current_incoming); |
| 178 | return current_incoming; |
Dr. David Alan Gilbert | bca7856 | 2015-05-21 13:24:14 +0100 | [diff] [blame] | 179 | } |
| 180 | |
| 181 | void migration_incoming_state_destroy(void) |
| 182 | { |
Juan Quintela | b4b076d | 2017-01-23 22:32:06 +0100 | [diff] [blame] | 183 | struct MigrationIncomingState *mis = migration_incoming_get_current(); |
| 184 | |
Peter Xu | 3482655 | 2017-05-19 14:43:29 +0800 | [diff] [blame] | 185 | if (mis->to_src_file) { |
Peter Xu | 660819b | 2017-05-19 14:43:30 +0800 | [diff] [blame] | 186 | /* Tell source that we are done */ |
| 187 | migrate_send_rp_shut(mis, qemu_file_get_error(mis->from_src_file) != 0); |
Peter Xu | 3482655 | 2017-05-19 14:43:29 +0800 | [diff] [blame] | 188 | qemu_fclose(mis->to_src_file); |
| 189 | mis->to_src_file = NULL; |
| 190 | } |
| 191 | |
Peter Xu | 660819b | 2017-05-19 14:43:30 +0800 | [diff] [blame] | 192 | if (mis->from_src_file) { |
| 193 | qemu_fclose(mis->from_src_file); |
| 194 | mis->from_src_file = NULL; |
| 195 | } |
Dr. David Alan Gilbert | 00fa4fc | 2018-03-12 17:21:04 +0000 | [diff] [blame] | 196 | if (mis->postcopy_remote_fds) { |
| 197 | g_array_free(mis->postcopy_remote_fds, TRUE); |
| 198 | mis->postcopy_remote_fds = NULL; |
| 199 | } |
Peter Xu | 660819b | 2017-05-19 14:43:30 +0800 | [diff] [blame] | 200 | |
Dr. David Alan Gilbert | 5089e18 | 2017-08-25 15:19:39 +0100 | [diff] [blame] | 201 | qemu_event_reset(&mis->main_thread_load_event); |
Dr. David Alan Gilbert | bca7856 | 2015-05-21 13:24:14 +0100 | [diff] [blame] | 202 | } |
| 203 | |
Juan Quintela | b05dc72 | 2015-07-07 14:44:05 +0200 | [diff] [blame] | 204 | static void migrate_generate_event(int new_state) |
| 205 | { |
| 206 | if (migrate_use_events()) { |
| 207 | qapi_event_send_migration(new_state, &error_abort); |
Juan Quintela | b05dc72 | 2015-07-07 14:44:05 +0200 | [diff] [blame] | 208 | } |
| 209 | } |
| 210 | |
Dr. David Alan Gilbert | 0f073f4 | 2018-04-16 18:09:30 +0100 | [diff] [blame] | 211 | static bool migrate_late_block_activate(void) |
| 212 | { |
| 213 | MigrationState *s; |
| 214 | |
| 215 | s = migrate_get_current(); |
| 216 | |
| 217 | return s->enabled_capabilities[ |
| 218 | MIGRATION_CAPABILITY_LATE_BLOCK_ACTIVATE]; |
| 219 | } |
| 220 | |
Dr. David Alan Gilbert | adde220 | 2015-02-19 11:40:27 +0000 | [diff] [blame] | 221 | /* |
| 222 | * Called on -incoming with a defer: uri. |
| 223 | * The migration can be started later after any parameters have been |
| 224 | * changed. |
| 225 | */ |
| 226 | static void deferred_incoming_migration(Error **errp) |
| 227 | { |
| 228 | if (deferred_incoming) { |
| 229 | error_setg(errp, "Incoming migration already deferred"); |
| 230 | } |
| 231 | deferred_incoming = true; |
| 232 | } |
| 233 | |
Juan Quintela | da6f179 | 2017-04-24 17:37:14 +0200 | [diff] [blame] | 234 | /* |
| 235 | * Send a message on the return channel back to the source |
| 236 | * of the migration. |
| 237 | */ |
Peter Xu | d6208e3 | 2018-02-08 18:31:12 +0800 | [diff] [blame] | 238 | static int migrate_send_rp_message(MigrationIncomingState *mis, |
| 239 | enum mig_rp_message_type message_type, |
| 240 | uint16_t len, void *data) |
Juan Quintela | da6f179 | 2017-04-24 17:37:14 +0200 | [diff] [blame] | 241 | { |
Peter Xu | d6208e3 | 2018-02-08 18:31:12 +0800 | [diff] [blame] | 242 | int ret = 0; |
| 243 | |
Juan Quintela | da6f179 | 2017-04-24 17:37:14 +0200 | [diff] [blame] | 244 | trace_migrate_send_rp_message((int)message_type, len); |
| 245 | qemu_mutex_lock(&mis->rp_mutex); |
Peter Xu | d6208e3 | 2018-02-08 18:31:12 +0800 | [diff] [blame] | 246 | |
| 247 | /* |
| 248 | * It's possible that the file handle got lost due to network |
| 249 | * failures. |
| 250 | */ |
| 251 | if (!mis->to_src_file) { |
| 252 | ret = -EIO; |
| 253 | goto error; |
| 254 | } |
| 255 | |
Juan Quintela | da6f179 | 2017-04-24 17:37:14 +0200 | [diff] [blame] | 256 | qemu_put_be16(mis->to_src_file, (unsigned int)message_type); |
| 257 | qemu_put_be16(mis->to_src_file, len); |
| 258 | qemu_put_buffer(mis->to_src_file, data, len); |
| 259 | qemu_fflush(mis->to_src_file); |
Peter Xu | d6208e3 | 2018-02-08 18:31:12 +0800 | [diff] [blame] | 260 | |
| 261 | /* It's possible that qemu file got error during sending */ |
| 262 | ret = qemu_file_get_error(mis->to_src_file); |
| 263 | |
| 264 | error: |
Juan Quintela | da6f179 | 2017-04-24 17:37:14 +0200 | [diff] [blame] | 265 | qemu_mutex_unlock(&mis->rp_mutex); |
Peter Xu | d6208e3 | 2018-02-08 18:31:12 +0800 | [diff] [blame] | 266 | return ret; |
Juan Quintela | da6f179 | 2017-04-24 17:37:14 +0200 | [diff] [blame] | 267 | } |
| 268 | |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 269 | /* Request a range of pages from the source VM at the given |
| 270 | * start address. |
| 271 | * rbname: Name of the RAMBlock to request the page in, if NULL it's the same |
| 272 | * as the last request (a name must have been given previously) |
| 273 | * Start: Address offset within the RB |
| 274 | * Len: Length in bytes required - must be a multiple of pagesize |
| 275 | */ |
Peter Xu | d6208e3 | 2018-02-08 18:31:12 +0800 | [diff] [blame] | 276 | int migrate_send_rp_req_pages(MigrationIncomingState *mis, const char *rbname, |
| 277 | ram_addr_t start, size_t len) |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 278 | { |
Stefan Weil | cb8d4c8 | 2016-03-23 15:59:57 +0100 | [diff] [blame] | 279 | uint8_t bufc[12 + 1 + 255]; /* start (8), len (4), rbname up to 256 */ |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 280 | size_t msglen = 12; /* start + len */ |
Peter Xu | d6208e3 | 2018-02-08 18:31:12 +0800 | [diff] [blame] | 281 | enum mig_rp_message_type msg_type; |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 282 | |
| 283 | *(uint64_t *)bufc = cpu_to_be64((uint64_t)start); |
| 284 | *(uint32_t *)(bufc + 8) = cpu_to_be32((uint32_t)len); |
| 285 | |
| 286 | if (rbname) { |
| 287 | int rbname_len = strlen(rbname); |
| 288 | assert(rbname_len < 256); |
| 289 | |
| 290 | bufc[msglen++] = rbname_len; |
| 291 | memcpy(bufc + msglen, rbname, rbname_len); |
| 292 | msglen += rbname_len; |
Peter Xu | d6208e3 | 2018-02-08 18:31:12 +0800 | [diff] [blame] | 293 | msg_type = MIG_RP_MSG_REQ_PAGES_ID; |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 294 | } else { |
Peter Xu | d6208e3 | 2018-02-08 18:31:12 +0800 | [diff] [blame] | 295 | msg_type = MIG_RP_MSG_REQ_PAGES; |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 296 | } |
Peter Xu | d6208e3 | 2018-02-08 18:31:12 +0800 | [diff] [blame] | 297 | |
| 298 | return migrate_send_rp_message(mis, msg_type, msglen, bufc); |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 299 | } |
| 300 | |
Paolo Bonzini | 43eaae2 | 2012-10-02 18:21:18 +0200 | [diff] [blame] | 301 | void qemu_start_incoming_migration(const char *uri, Error **errp) |
aliguori | 5bb7910 | 2008-10-13 03:12:02 +0000 | [diff] [blame] | 302 | { |
aliguori | 34c9dd8 | 2008-10-13 03:14:31 +0000 | [diff] [blame] | 303 | const char *p; |
| 304 | |
Juan Quintela | 7cf1fe6 | 2015-05-20 17:15:42 +0200 | [diff] [blame] | 305 | qapi_event_send_migration(MIGRATION_STATUS_SETUP, &error_abort); |
Dr. David Alan Gilbert | adde220 | 2015-02-19 11:40:27 +0000 | [diff] [blame] | 306 | if (!strcmp(uri, "defer")) { |
| 307 | deferred_incoming_migration(errp); |
| 308 | } else if (strstart(uri, "tcp:", &p)) { |
Paolo Bonzini | 43eaae2 | 2012-10-02 18:21:18 +0200 | [diff] [blame] | 309 | tcp_start_incoming_migration(p, errp); |
Michael R. Hines | 2da776d | 2013-07-22 10:01:54 -0400 | [diff] [blame] | 310 | #ifdef CONFIG_RDMA |
Dr. David Alan Gilbert | adde220 | 2015-02-19 11:40:27 +0000 | [diff] [blame] | 311 | } else if (strstart(uri, "rdma:", &p)) { |
Michael R. Hines | 2da776d | 2013-07-22 10:01:54 -0400 | [diff] [blame] | 312 | rdma_start_incoming_migration(p, errp); |
| 313 | #endif |
Dr. David Alan Gilbert | adde220 | 2015-02-19 11:40:27 +0000 | [diff] [blame] | 314 | } else if (strstart(uri, "exec:", &p)) { |
Paolo Bonzini | 43eaae2 | 2012-10-02 18:21:18 +0200 | [diff] [blame] | 315 | exec_start_incoming_migration(p, errp); |
Dr. David Alan Gilbert | adde220 | 2015-02-19 11:40:27 +0000 | [diff] [blame] | 316 | } else if (strstart(uri, "unix:", &p)) { |
Paolo Bonzini | 43eaae2 | 2012-10-02 18:21:18 +0200 | [diff] [blame] | 317 | unix_start_incoming_migration(p, errp); |
Dr. David Alan Gilbert | adde220 | 2015-02-19 11:40:27 +0000 | [diff] [blame] | 318 | } else if (strstart(uri, "fd:", &p)) { |
Paolo Bonzini | 43eaae2 | 2012-10-02 18:21:18 +0200 | [diff] [blame] | 319 | fd_start_incoming_migration(p, errp); |
Dr. David Alan Gilbert | adde220 | 2015-02-19 11:40:27 +0000 | [diff] [blame] | 320 | } else { |
Markus Armbruster | 312fd5f | 2013-02-08 21:22:16 +0100 | [diff] [blame] | 321 | error_setg(errp, "unknown migration protocol: %s", uri); |
Juan Quintela | 8ca5e80 | 2010-06-09 14:10:54 +0200 | [diff] [blame] | 322 | } |
aliguori | 5bb7910 | 2008-10-13 03:12:02 +0000 | [diff] [blame] | 323 | } |
| 324 | |
Denis V. Lunev | 0aa6aef | 2016-02-24 11:53:38 +0300 | [diff] [blame] | 325 | static void process_incoming_migration_bh(void *opaque) |
| 326 | { |
| 327 | Error *local_err = NULL; |
| 328 | MigrationIncomingState *mis = opaque; |
| 329 | |
Dr. David Alan Gilbert | 0f073f4 | 2018-04-16 18:09:30 +0100 | [diff] [blame] | 330 | /* If capability late_block_activate is set: |
| 331 | * Only fire up the block code now if we're going to restart the |
| 332 | * VM, else 'cont' will do it. |
| 333 | * This causes file locking to happen; so we don't want it to happen |
| 334 | * unless we really are starting the VM. |
| 335 | */ |
| 336 | if (!migrate_late_block_activate() || |
| 337 | (autostart && (!global_state_received() || |
| 338 | global_state_get_runstate() == RUN_STATE_RUNNING))) { |
| 339 | /* Make sure all file formats flush their mutable metadata. |
| 340 | * If we get an error here, just don't restart the VM yet. */ |
| 341 | bdrv_invalidate_cache_all(&local_err); |
| 342 | if (local_err) { |
| 343 | error_report_err(local_err); |
| 344 | local_err = NULL; |
| 345 | autostart = false; |
| 346 | } |
Kevin Wolf | d35ff5e | 2017-04-04 17:29:03 +0200 | [diff] [blame] | 347 | } |
| 348 | |
Denis V. Lunev | 0aa6aef | 2016-02-24 11:53:38 +0300 | [diff] [blame] | 349 | /* |
| 350 | * This must happen after all error conditions are dealt with and |
| 351 | * we're sure the VM is going to be running on this host. |
| 352 | */ |
| 353 | qemu_announce_self(); |
| 354 | |
Juan Quintela | f986c3d | 2016-01-14 16:52:55 +0100 | [diff] [blame] | 355 | if (multifd_load_cleanup(&local_err) != 0) { |
| 356 | error_report_err(local_err); |
| 357 | autostart = false; |
| 358 | } |
Denis V. Lunev | 0aa6aef | 2016-02-24 11:53:38 +0300 | [diff] [blame] | 359 | /* If global state section was not received or we are in running |
| 360 | state, we need to obey autostart. Any other state is set with |
| 361 | runstate_set. */ |
| 362 | |
Vladimir Sementsov-Ogievskiy | b35ebdf | 2018-03-13 15:34:01 -0400 | [diff] [blame] | 363 | dirty_bitmap_mig_before_vm_start(); |
| 364 | |
Denis V. Lunev | 0aa6aef | 2016-02-24 11:53:38 +0300 | [diff] [blame] | 365 | if (!global_state_received() || |
| 366 | global_state_get_runstate() == RUN_STATE_RUNNING) { |
| 367 | if (autostart) { |
| 368 | vm_start(); |
| 369 | } else { |
| 370 | runstate_set(RUN_STATE_PAUSED); |
| 371 | } |
| 372 | } else { |
| 373 | runstate_set(global_state_get_runstate()); |
| 374 | } |
Denis V. Lunev | 0aa6aef | 2016-02-24 11:53:38 +0300 | [diff] [blame] | 375 | /* |
| 376 | * This must happen after any state changes since as soon as an external |
| 377 | * observer sees this event they might start to prod at the VM assuming |
| 378 | * it's ready to use. |
| 379 | */ |
| 380 | migrate_set_state(&mis->state, MIGRATION_STATUS_ACTIVE, |
| 381 | MIGRATION_STATUS_COMPLETED); |
| 382 | qemu_bh_delete(mis->bh); |
| 383 | migration_incoming_state_destroy(); |
| 384 | } |
| 385 | |
Paolo Bonzini | 82a4da7 | 2012-08-07 10:57:43 +0200 | [diff] [blame] | 386 | static void process_incoming_migration_co(void *opaque) |
Juan Quintela | 511c023 | 2010-06-09 14:10:55 +0200 | [diff] [blame] | 387 | { |
Juan Quintela | b4b076d | 2017-01-23 22:32:06 +0100 | [diff] [blame] | 388 | MigrationIncomingState *mis = migration_incoming_get_current(); |
Dr. David Alan Gilbert | e9bef23 | 2015-11-05 18:11:21 +0000 | [diff] [blame] | 389 | PostcopyState ps; |
Paolo Bonzini | 1c12e1f | 2012-08-07 10:51:51 +0200 | [diff] [blame] | 390 | int ret; |
| 391 | |
Juan Quintela | 4f0fae7 | 2017-07-24 12:42:02 +0200 | [diff] [blame] | 392 | assert(mis->from_src_file); |
Dr. David Alan Gilbert | 67f11b5 | 2017-02-24 18:28:34 +0000 | [diff] [blame] | 393 | mis->largest_page_size = qemu_ram_pagesize_largest(); |
Dr. David Alan Gilbert | 093e3c4 | 2015-11-05 18:10:52 +0000 | [diff] [blame] | 394 | postcopy_state_set(POSTCOPY_INCOMING_NONE); |
zhanghailiang | 93d7af6 | 2015-12-16 11:47:34 +0000 | [diff] [blame] | 395 | migrate_set_state(&mis->state, MIGRATION_STATUS_NONE, |
| 396 | MIGRATION_STATUS_ACTIVE); |
Juan Quintela | 4f0fae7 | 2017-07-24 12:42:02 +0200 | [diff] [blame] | 397 | ret = qemu_loadvm_state(mis->from_src_file); |
Dr. David Alan Gilbert | bca7856 | 2015-05-21 13:24:14 +0100 | [diff] [blame] | 398 | |
Dr. David Alan Gilbert | e9bef23 | 2015-11-05 18:11:21 +0000 | [diff] [blame] | 399 | ps = postcopy_state_get(); |
| 400 | trace_process_incoming_migration_co_end(ret, ps); |
| 401 | if (ps != POSTCOPY_INCOMING_NONE) { |
| 402 | if (ps == POSTCOPY_INCOMING_ADVISE) { |
| 403 | /* |
| 404 | * Where a migration had postcopy enabled (and thus went to advise) |
| 405 | * but managed to complete within the precopy period, we can use |
| 406 | * the normal exit. |
| 407 | */ |
| 408 | postcopy_ram_incoming_cleanup(mis); |
| 409 | } else if (ret >= 0) { |
| 410 | /* |
| 411 | * Postcopy was started, cleanup should happen at the end of the |
| 412 | * postcopy thread. |
| 413 | */ |
| 414 | trace_process_incoming_migration_co_postcopy_end_main(); |
| 415 | return; |
| 416 | } |
| 417 | /* Else if something went wrong then just fall out of the normal exit */ |
| 418 | } |
| 419 | |
zhanghailiang | 25d0c16 | 2016-10-27 14:42:55 +0800 | [diff] [blame] | 420 | /* we get COLO info, and know if we are in COLO mode */ |
| 421 | if (!ret && migration_incoming_enable_colo()) { |
| 422 | mis->migration_incoming_co = qemu_coroutine_self(); |
| 423 | qemu_thread_create(&mis->colo_incoming_thread, "COLO incoming", |
| 424 | colo_process_incoming_thread, mis, QEMU_THREAD_JOINABLE); |
| 425 | mis->have_colo_incoming_thread = true; |
| 426 | qemu_coroutine_yield(); |
| 427 | |
| 428 | /* Wait checkpoint incoming thread exit before free resource */ |
| 429 | qemu_thread_join(&mis->colo_incoming_thread); |
| 430 | } |
| 431 | |
Paolo Bonzini | 1c12e1f | 2012-08-07 10:51:51 +0200 | [diff] [blame] | 432 | if (ret < 0) { |
Juan Quintela | f986c3d | 2016-01-14 16:52:55 +0100 | [diff] [blame] | 433 | Error *local_err = NULL; |
| 434 | |
zhanghailiang | 93d7af6 | 2015-12-16 11:47:34 +0000 | [diff] [blame] | 435 | migrate_set_state(&mis->state, MIGRATION_STATUS_ACTIVE, |
| 436 | MIGRATION_STATUS_FAILED); |
Peter Lieven | db80fac | 2014-06-10 11:29:16 +0200 | [diff] [blame] | 437 | error_report("load of migration failed: %s", strerror(-ret)); |
Dr. David Alan Gilbert | 3a0f2ce | 2017-07-17 12:09:32 +0100 | [diff] [blame] | 438 | qemu_fclose(mis->from_src_file); |
Juan Quintela | f986c3d | 2016-01-14 16:52:55 +0100 | [diff] [blame] | 439 | if (multifd_load_cleanup(&local_err) != 0) { |
| 440 | error_report_err(local_err); |
| 441 | } |
Eric Blake | 4aead69 | 2013-04-16 15:50:41 -0600 | [diff] [blame] | 442 | exit(EXIT_FAILURE); |
Juan Quintela | 511c023 | 2010-06-09 14:10:55 +0200 | [diff] [blame] | 443 | } |
Denis V. Lunev | 0aa6aef | 2016-02-24 11:53:38 +0300 | [diff] [blame] | 444 | mis->bh = qemu_bh_new(process_incoming_migration_bh, mis); |
| 445 | qemu_bh_schedule(mis->bh); |
Juan Quintela | 511c023 | 2010-06-09 14:10:55 +0200 | [diff] [blame] | 446 | } |
| 447 | |
Juan Quintela | e595a01 | 2017-07-17 12:30:25 +0200 | [diff] [blame] | 448 | static void migration_incoming_setup(QEMUFile *f) |
Paolo Bonzini | 82a4da7 | 2012-08-07 10:57:43 +0200 | [diff] [blame] | 449 | { |
Juan Quintela | 4f0fae7 | 2017-07-24 12:42:02 +0200 | [diff] [blame] | 450 | MigrationIncomingState *mis = migration_incoming_get_current(); |
Paolo Bonzini | 82a4da7 | 2012-08-07 10:57:43 +0200 | [diff] [blame] | 451 | |
Juan Quintela | f986c3d | 2016-01-14 16:52:55 +0100 | [diff] [blame] | 452 | if (multifd_load_setup() != 0) { |
| 453 | /* We haven't been able to create multifd threads |
| 454 | nothing better to do */ |
| 455 | exit(EXIT_FAILURE); |
| 456 | } |
| 457 | |
Juan Quintela | 4f0fae7 | 2017-07-24 12:42:02 +0200 | [diff] [blame] | 458 | if (!mis->from_src_file) { |
| 459 | mis->from_src_file = f; |
| 460 | } |
Daniel P. Berrange | 06ad513 | 2016-04-27 11:04:56 +0100 | [diff] [blame] | 461 | qemu_file_set_blocking(f, false); |
Juan Quintela | e595a01 | 2017-07-17 12:30:25 +0200 | [diff] [blame] | 462 | } |
| 463 | |
Juan Quintela | 36c2f8b | 2018-03-07 08:40:52 +0100 | [diff] [blame] | 464 | void migration_incoming_process(void) |
Juan Quintela | e595a01 | 2017-07-17 12:30:25 +0200 | [diff] [blame] | 465 | { |
| 466 | Coroutine *co = qemu_coroutine_create(process_incoming_migration_co, NULL); |
Paolo Bonzini | 0b8b875 | 2016-07-04 19:10:01 +0200 | [diff] [blame] | 467 | qemu_coroutine_enter(co); |
Paolo Bonzini | 82a4da7 | 2012-08-07 10:57:43 +0200 | [diff] [blame] | 468 | } |
| 469 | |
Peter Xu | 884835f | 2018-06-27 21:22:45 +0800 | [diff] [blame] | 470 | /* Returns true if recovered from a paused migration, otherwise false */ |
| 471 | static bool postcopy_try_recover(QEMUFile *f) |
Juan Quintela | e595a01 | 2017-07-17 12:30:25 +0200 | [diff] [blame] | 472 | { |
Peter Xu | d96c9e8 | 2018-05-02 18:47:26 +0800 | [diff] [blame] | 473 | MigrationIncomingState *mis = migration_incoming_get_current(); |
| 474 | |
| 475 | if (mis->state == MIGRATION_STATUS_POSTCOPY_PAUSED) { |
| 476 | /* Resumed from a paused postcopy migration */ |
| 477 | |
| 478 | mis->from_src_file = f; |
| 479 | /* Postcopy has standalone thread to do vm load */ |
| 480 | qemu_file_set_blocking(f, true); |
| 481 | |
| 482 | /* Re-configure the return path */ |
| 483 | mis->to_src_file = qemu_file_get_return_path(f); |
| 484 | |
| 485 | migrate_set_state(&mis->state, MIGRATION_STATUS_POSTCOPY_PAUSED, |
| 486 | MIGRATION_STATUS_POSTCOPY_RECOVER); |
| 487 | |
| 488 | /* |
| 489 | * Here, we only wake up the main loading thread (while the |
| 490 | * fault thread will still be waiting), so that we can receive |
| 491 | * commands from source now, and answer it if needed. The |
| 492 | * fault thread will be woken up afterwards until we are sure |
| 493 | * that source is ready to reply to page requests. |
| 494 | */ |
| 495 | qemu_sem_post(&mis->postcopy_pause_sem_dst); |
Peter Xu | 884835f | 2018-06-27 21:22:45 +0800 | [diff] [blame] | 496 | return true; |
Peter Xu | d96c9e8 | 2018-05-02 18:47:26 +0800 | [diff] [blame] | 497 | } |
Peter Xu | 884835f | 2018-06-27 21:22:45 +0800 | [diff] [blame] | 498 | |
| 499 | return false; |
| 500 | } |
| 501 | |
| 502 | void migration_fd_process_incoming(QEMUFile *f) |
| 503 | { |
| 504 | if (postcopy_try_recover(f)) { |
| 505 | return; |
| 506 | } |
| 507 | |
| 508 | migration_incoming_setup(f); |
| 509 | migration_incoming_process(); |
Juan Quintela | e595a01 | 2017-07-17 12:30:25 +0200 | [diff] [blame] | 510 | } |
| 511 | |
Juan Quintela | 4f0fae7 | 2017-07-24 12:42:02 +0200 | [diff] [blame] | 512 | void migration_ioc_process_incoming(QIOChannel *ioc) |
| 513 | { |
| 514 | MigrationIncomingState *mis = migration_incoming_get_current(); |
Peter Xu | a429e7f | 2018-06-27 21:22:46 +0800 | [diff] [blame] | 515 | bool start_migration; |
Juan Quintela | 4f0fae7 | 2017-07-24 12:42:02 +0200 | [diff] [blame] | 516 | |
| 517 | if (!mis->from_src_file) { |
Peter Xu | a429e7f | 2018-06-27 21:22:46 +0800 | [diff] [blame] | 518 | /* The first connection (multifd may have multiple) */ |
Juan Quintela | 4f0fae7 | 2017-07-24 12:42:02 +0200 | [diff] [blame] | 519 | QEMUFile *f = qemu_fopen_channel_input(ioc); |
Peter Xu | a429e7f | 2018-06-27 21:22:46 +0800 | [diff] [blame] | 520 | |
| 521 | /* If it's a recovery, we're done */ |
Peter Xu | 884835f | 2018-06-27 21:22:45 +0800 | [diff] [blame] | 522 | if (postcopy_try_recover(f)) { |
| 523 | return; |
| 524 | } |
Peter Xu | a429e7f | 2018-06-27 21:22:46 +0800 | [diff] [blame] | 525 | |
Juan Quintela | 36c2f8b | 2018-03-07 08:40:52 +0100 | [diff] [blame] | 526 | migration_incoming_setup(f); |
Peter Xu | a429e7f | 2018-06-27 21:22:46 +0800 | [diff] [blame] | 527 | |
| 528 | /* |
| 529 | * Common migration only needs one channel, so we can start |
| 530 | * right now. Multifd needs more than one channel, we wait. |
| 531 | */ |
| 532 | start_migration = !migrate_use_multifd(); |
| 533 | } else { |
| 534 | /* Multiple connections */ |
| 535 | assert(migrate_use_multifd()); |
| 536 | start_migration = multifd_recv_new_channel(ioc); |
Juan Quintela | 4f0fae7 | 2017-07-24 12:42:02 +0200 | [diff] [blame] | 537 | } |
Peter Xu | 81e6205 | 2018-06-27 21:22:44 +0800 | [diff] [blame] | 538 | |
Peter Xu | a429e7f | 2018-06-27 21:22:46 +0800 | [diff] [blame] | 539 | if (start_migration) { |
Peter Xu | 81e6205 | 2018-06-27 21:22:44 +0800 | [diff] [blame] | 540 | migration_incoming_process(); |
| 541 | } |
Juan Quintela | 4f0fae7 | 2017-07-24 12:42:02 +0200 | [diff] [blame] | 542 | } |
| 543 | |
Juan Quintela | 428d890 | 2017-07-24 13:06:25 +0200 | [diff] [blame] | 544 | /** |
| 545 | * @migration_has_all_channels: We have received all channels that we need |
| 546 | * |
| 547 | * Returns true when we have got connections to all the channels that |
| 548 | * we need for migration. |
| 549 | */ |
| 550 | bool migration_has_all_channels(void) |
| 551 | { |
Daniel P. Berrangé | ca273df | 2018-06-19 17:35:52 +0100 | [diff] [blame] | 552 | MigrationIncomingState *mis = migration_incoming_get_current(); |
Juan Quintela | 62c1e0c | 2018-02-19 18:59:02 +0100 | [diff] [blame] | 553 | bool all_channels; |
| 554 | |
| 555 | all_channels = multifd_recv_all_channels_created(); |
| 556 | |
Daniel P. Berrangé | ca273df | 2018-06-19 17:35:52 +0100 | [diff] [blame] | 557 | return all_channels && mis->from_src_file != NULL; |
Juan Quintela | 428d890 | 2017-07-24 13:06:25 +0200 | [diff] [blame] | 558 | } |
| 559 | |
Dr. David Alan Gilbert | 6decec9 | 2015-11-05 18:10:47 +0000 | [diff] [blame] | 560 | /* |
Dr. David Alan Gilbert | 6decec9 | 2015-11-05 18:10:47 +0000 | [diff] [blame] | 561 | * Send a 'SHUT' message on the return channel with the given value |
| 562 | * to indicate that we've finished with the RP. Non-0 value indicates |
| 563 | * error. |
| 564 | */ |
| 565 | void migrate_send_rp_shut(MigrationIncomingState *mis, |
| 566 | uint32_t value) |
| 567 | { |
| 568 | uint32_t buf; |
| 569 | |
| 570 | buf = cpu_to_be32(value); |
| 571 | migrate_send_rp_message(mis, MIG_RP_MSG_SHUT, sizeof(buf), &buf); |
| 572 | } |
| 573 | |
| 574 | /* |
| 575 | * Send a 'PONG' message on the return channel with the given value |
| 576 | * (normally in response to a 'PING') |
| 577 | */ |
| 578 | void migrate_send_rp_pong(MigrationIncomingState *mis, |
| 579 | uint32_t value) |
| 580 | { |
| 581 | uint32_t buf; |
| 582 | |
| 583 | buf = cpu_to_be32(value); |
| 584 | migrate_send_rp_message(mis, MIG_RP_MSG_PONG, sizeof(buf), &buf); |
| 585 | } |
| 586 | |
Peter Xu | a335deb | 2018-05-02 18:47:28 +0800 | [diff] [blame] | 587 | void migrate_send_rp_recv_bitmap(MigrationIncomingState *mis, |
| 588 | char *block_name) |
| 589 | { |
| 590 | char buf[512]; |
| 591 | int len; |
| 592 | int64_t res; |
| 593 | |
| 594 | /* |
| 595 | * First, we send the header part. It contains only the len of |
| 596 | * idstr, and the idstr itself. |
| 597 | */ |
| 598 | len = strlen(block_name); |
| 599 | buf[0] = len; |
| 600 | memcpy(buf + 1, block_name, len); |
| 601 | |
| 602 | if (mis->state != MIGRATION_STATUS_POSTCOPY_RECOVER) { |
| 603 | error_report("%s: MSG_RP_RECV_BITMAP only used for recovery", |
| 604 | __func__); |
| 605 | return; |
| 606 | } |
| 607 | |
| 608 | migrate_send_rp_message(mis, MIG_RP_MSG_RECV_BITMAP, len + 1, buf); |
| 609 | |
| 610 | /* |
| 611 | * Next, we dump the received bitmap to the stream. |
| 612 | * |
| 613 | * TODO: currently we are safe since we are the only one that is |
| 614 | * using the to_src_file handle (fault thread is still paused), |
| 615 | * and it's ok even not taking the mutex. However the best way is |
| 616 | * to take the lock before sending the message header, and release |
| 617 | * the lock after sending the bitmap. |
| 618 | */ |
| 619 | qemu_mutex_lock(&mis->rp_mutex); |
| 620 | res = ramblock_recv_bitmap_send(mis->to_src_file, block_name); |
| 621 | qemu_mutex_unlock(&mis->rp_mutex); |
| 622 | |
| 623 | trace_migrate_send_rp_recv_bitmap(block_name, res); |
| 624 | } |
| 625 | |
Peter Xu | 13955b8 | 2018-05-02 18:47:30 +0800 | [diff] [blame] | 626 | void migrate_send_rp_resume_ack(MigrationIncomingState *mis, uint32_t value) |
| 627 | { |
| 628 | uint32_t buf; |
| 629 | |
| 630 | buf = cpu_to_be32(value); |
| 631 | migrate_send_rp_message(mis, MIG_RP_MSG_RESUME_ACK, sizeof(buf), &buf); |
| 632 | } |
| 633 | |
Orit Wasserman | bbf6da3 | 2012-08-06 21:42:47 +0300 | [diff] [blame] | 634 | MigrationCapabilityStatusList *qmp_query_migrate_capabilities(Error **errp) |
| 635 | { |
| 636 | MigrationCapabilityStatusList *head = NULL; |
| 637 | MigrationCapabilityStatusList *caps; |
| 638 | MigrationState *s = migrate_get_current(); |
| 639 | int i; |
| 640 | |
Michael Tokarev | 387eede | 2013-10-05 13:18:28 +0400 | [diff] [blame] | 641 | caps = NULL; /* silence compiler warning */ |
Eric Blake | 7fb1cf1 | 2015-11-18 01:52:57 -0700 | [diff] [blame] | 642 | for (i = 0; i < MIGRATION_CAPABILITY__MAX; i++) { |
Dr. David Alan Gilbert | ed1701c | 2017-05-15 15:05:29 +0100 | [diff] [blame] | 643 | #ifndef CONFIG_LIVE_BLOCK_MIGRATION |
| 644 | if (i == MIGRATION_CAPABILITY_BLOCK) { |
| 645 | continue; |
| 646 | } |
| 647 | #endif |
Orit Wasserman | bbf6da3 | 2012-08-06 21:42:47 +0300 | [diff] [blame] | 648 | if (head == NULL) { |
| 649 | head = g_malloc0(sizeof(*caps)); |
| 650 | caps = head; |
| 651 | } else { |
| 652 | caps->next = g_malloc0(sizeof(*caps)); |
| 653 | caps = caps->next; |
| 654 | } |
| 655 | caps->value = |
| 656 | g_malloc(sizeof(*caps->value)); |
| 657 | caps->value->capability = i; |
| 658 | caps->value->state = s->enabled_capabilities[i]; |
| 659 | } |
| 660 | |
| 661 | return head; |
| 662 | } |
| 663 | |
Liang Li | 85de832 | 2015-03-23 16:32:28 +0800 | [diff] [blame] | 664 | MigrationParameters *qmp_query_migrate_parameters(Error **errp) |
| 665 | { |
| 666 | MigrationParameters *params; |
| 667 | MigrationState *s = migrate_get_current(); |
| 668 | |
Markus Armbruster | e87fae4 | 2017-07-18 12:57:38 +0200 | [diff] [blame] | 669 | /* TODO use QAPI_CLONE() instead of duplicating it inline */ |
Liang Li | 85de832 | 2015-03-23 16:32:28 +0800 | [diff] [blame] | 670 | params = g_malloc0(sizeof(*params)); |
Eric Blake | de63ab6 | 2016-09-08 22:14:15 -0500 | [diff] [blame] | 671 | params->has_compress_level = true; |
Daniel P. Berrange | 2594f56 | 2016-04-27 11:05:14 +0100 | [diff] [blame] | 672 | params->compress_level = s->parameters.compress_level; |
Eric Blake | de63ab6 | 2016-09-08 22:14:15 -0500 | [diff] [blame] | 673 | params->has_compress_threads = true; |
Daniel P. Berrange | 2594f56 | 2016-04-27 11:05:14 +0100 | [diff] [blame] | 674 | params->compress_threads = s->parameters.compress_threads; |
Eric Blake | de63ab6 | 2016-09-08 22:14:15 -0500 | [diff] [blame] | 675 | params->has_decompress_threads = true; |
Daniel P. Berrange | 2594f56 | 2016-04-27 11:05:14 +0100 | [diff] [blame] | 676 | params->decompress_threads = s->parameters.decompress_threads; |
Eric Blake | de63ab6 | 2016-09-08 22:14:15 -0500 | [diff] [blame] | 677 | params->has_cpu_throttle_initial = true; |
Daniel P. Berrange | 2594f56 | 2016-04-27 11:05:14 +0100 | [diff] [blame] | 678 | params->cpu_throttle_initial = s->parameters.cpu_throttle_initial; |
Eric Blake | de63ab6 | 2016-09-08 22:14:15 -0500 | [diff] [blame] | 679 | params->has_cpu_throttle_increment = true; |
Daniel P. Berrange | 2594f56 | 2016-04-27 11:05:14 +0100 | [diff] [blame] | 680 | params->cpu_throttle_increment = s->parameters.cpu_throttle_increment; |
Markus Armbruster | 8cc99dc | 2017-07-18 12:04:54 +0200 | [diff] [blame] | 681 | params->has_tls_creds = true; |
Daniel P. Berrange | 69ef1f3 | 2016-04-27 11:05:15 +0100 | [diff] [blame] | 682 | params->tls_creds = g_strdup(s->parameters.tls_creds); |
Markus Armbruster | 8cc99dc | 2017-07-18 12:04:54 +0200 | [diff] [blame] | 683 | params->has_tls_hostname = true; |
Daniel P. Berrange | 69ef1f3 | 2016-04-27 11:05:15 +0100 | [diff] [blame] | 684 | params->tls_hostname = g_strdup(s->parameters.tls_hostname); |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 685 | params->has_max_bandwidth = true; |
| 686 | params->max_bandwidth = s->parameters.max_bandwidth; |
| 687 | params->has_downtime_limit = true; |
| 688 | params->downtime_limit = s->parameters.downtime_limit; |
zhanghailiang | fe39a4d | 2016-11-02 15:42:09 +0800 | [diff] [blame] | 689 | params->has_x_checkpoint_delay = true; |
zhanghailiang | 68b5359 | 2016-10-27 14:43:01 +0800 | [diff] [blame] | 690 | params->x_checkpoint_delay = s->parameters.x_checkpoint_delay; |
Juan Quintela | 2833c59 | 2017-04-05 18:32:37 +0200 | [diff] [blame] | 691 | params->has_block_incremental = true; |
| 692 | params->block_incremental = s->parameters.block_incremental; |
Juan Quintela | 4075fb1 | 2016-01-15 08:56:17 +0100 | [diff] [blame] | 693 | params->has_x_multifd_channels = true; |
| 694 | params->x_multifd_channels = s->parameters.x_multifd_channels; |
Juan Quintela | 0fb8660 | 2017-04-27 10:48:25 +0200 | [diff] [blame] | 695 | params->has_x_multifd_page_count = true; |
| 696 | params->x_multifd_page_count = s->parameters.x_multifd_page_count; |
Juan Quintela | 73af8dd | 2017-10-05 21:30:10 +0200 | [diff] [blame] | 697 | params->has_xbzrle_cache_size = true; |
| 698 | params->xbzrle_cache_size = s->parameters.xbzrle_cache_size; |
Dr. David Alan Gilbert | 7e555c6 | 2018-06-13 11:26:40 +0100 | [diff] [blame] | 699 | params->has_max_postcopy_bandwidth = true; |
| 700 | params->max_postcopy_bandwidth = s->parameters.max_postcopy_bandwidth; |
Li Qiang | 4cbc9c7 | 2018-08-01 06:00:20 -0700 | [diff] [blame] | 701 | params->has_max_cpu_throttle = true; |
| 702 | params->max_cpu_throttle = s->parameters.max_cpu_throttle; |
Liang Li | 85de832 | 2015-03-23 16:32:28 +0800 | [diff] [blame] | 703 | |
| 704 | return params; |
| 705 | } |
| 706 | |
Dr. David Alan Gilbert | f6844b9 | 2015-11-05 18:10:48 +0000 | [diff] [blame] | 707 | /* |
| 708 | * Return true if we're already in the middle of a migration |
| 709 | * (i.e. any of the active or setup states) |
| 710 | */ |
| 711 | static bool migration_is_setup_or_active(int state) |
| 712 | { |
| 713 | switch (state) { |
| 714 | case MIGRATION_STATUS_ACTIVE: |
Dr. David Alan Gilbert | 9ec055a | 2015-11-05 18:10:58 +0000 | [diff] [blame] | 715 | case MIGRATION_STATUS_POSTCOPY_ACTIVE: |
Peter Xu | a688d2c | 2018-05-02 18:47:18 +0800 | [diff] [blame] | 716 | case MIGRATION_STATUS_POSTCOPY_PAUSED: |
Peter Xu | 135b87b | 2018-05-02 18:47:25 +0800 | [diff] [blame] | 717 | case MIGRATION_STATUS_POSTCOPY_RECOVER: |
Dr. David Alan Gilbert | f6844b9 | 2015-11-05 18:10:48 +0000 | [diff] [blame] | 718 | case MIGRATION_STATUS_SETUP: |
Dr. David Alan Gilbert | 31e0607 | 2017-10-20 10:05:51 +0100 | [diff] [blame] | 719 | case MIGRATION_STATUS_PRE_SWITCHOVER: |
| 720 | case MIGRATION_STATUS_DEVICE: |
Dr. David Alan Gilbert | f6844b9 | 2015-11-05 18:10:48 +0000 | [diff] [blame] | 721 | return true; |
| 722 | |
| 723 | default: |
| 724 | return false; |
| 725 | |
| 726 | } |
| 727 | } |
| 728 | |
Dr. David Alan Gilbert | a22463a | 2016-06-13 12:16:41 +0100 | [diff] [blame] | 729 | static void populate_ram_info(MigrationInfo *info, MigrationState *s) |
| 730 | { |
| 731 | info->has_ram = true; |
| 732 | info->ram = g_malloc0(sizeof(*info->ram)); |
Juan Quintela | 9360447 | 2017-06-06 19:49:03 +0200 | [diff] [blame] | 733 | info->ram->transferred = ram_counters.transferred; |
Dr. David Alan Gilbert | a22463a | 2016-06-13 12:16:41 +0100 | [diff] [blame] | 734 | info->ram->total = ram_bytes_total(); |
Juan Quintela | 9360447 | 2017-06-06 19:49:03 +0200 | [diff] [blame] | 735 | info->ram->duplicate = ram_counters.duplicate; |
Juan Quintela | bedf53c | 2017-03-13 20:35:54 +0100 | [diff] [blame] | 736 | /* legacy value. It is not used anymore */ |
| 737 | info->ram->skipped = 0; |
Juan Quintela | 9360447 | 2017-06-06 19:49:03 +0200 | [diff] [blame] | 738 | info->ram->normal = ram_counters.normal; |
| 739 | info->ram->normal_bytes = ram_counters.normal * |
Juan Quintela | 20afaed | 2017-03-21 09:09:14 +0100 | [diff] [blame] | 740 | qemu_target_page_size(); |
Dr. David Alan Gilbert | a22463a | 2016-06-13 12:16:41 +0100 | [diff] [blame] | 741 | info->ram->mbps = s->mbps; |
Juan Quintela | 9360447 | 2017-06-06 19:49:03 +0200 | [diff] [blame] | 742 | info->ram->dirty_sync_count = ram_counters.dirty_sync_count; |
| 743 | info->ram->postcopy_requests = ram_counters.postcopy_requests; |
Chao Fan | 030ce1f | 2017-03-21 10:22:43 +0800 | [diff] [blame] | 744 | info->ram->page_size = qemu_target_page_size(); |
Juan Quintela | a61c45b | 2018-06-26 15:20:11 +0200 | [diff] [blame] | 745 | info->ram->multifd_bytes = ram_counters.multifd_bytes; |
Dr. David Alan Gilbert | a22463a | 2016-06-13 12:16:41 +0100 | [diff] [blame] | 746 | |
Juan Quintela | 114f5ae | 2017-05-04 10:09:21 +0200 | [diff] [blame] | 747 | if (migrate_use_xbzrle()) { |
| 748 | info->has_xbzrle_cache = true; |
| 749 | info->xbzrle_cache = g_malloc0(sizeof(*info->xbzrle_cache)); |
| 750 | info->xbzrle_cache->cache_size = migrate_xbzrle_cache_size(); |
Juan Quintela | 9360447 | 2017-06-06 19:49:03 +0200 | [diff] [blame] | 751 | info->xbzrle_cache->bytes = xbzrle_counters.bytes; |
| 752 | info->xbzrle_cache->pages = xbzrle_counters.pages; |
| 753 | info->xbzrle_cache->cache_miss = xbzrle_counters.cache_miss; |
| 754 | info->xbzrle_cache->cache_miss_rate = xbzrle_counters.cache_miss_rate; |
| 755 | info->xbzrle_cache->overflow = xbzrle_counters.overflow; |
Juan Quintela | 114f5ae | 2017-05-04 10:09:21 +0200 | [diff] [blame] | 756 | } |
| 757 | |
Juan Quintela | 338182c | 2017-05-03 13:16:38 +0200 | [diff] [blame] | 758 | if (cpu_throttle_active()) { |
| 759 | info->has_cpu_throttle_percentage = true; |
| 760 | info->cpu_throttle_percentage = cpu_throttle_get_percentage(); |
| 761 | } |
| 762 | |
Dr. David Alan Gilbert | a22463a | 2016-06-13 12:16:41 +0100 | [diff] [blame] | 763 | if (s->state != MIGRATION_STATUS_COMPLETED) { |
| 764 | info->ram->remaining = ram_bytes_remaining(); |
Juan Quintela | 9360447 | 2017-06-06 19:49:03 +0200 | [diff] [blame] | 765 | info->ram->dirty_pages_rate = ram_counters.dirty_pages_rate; |
Dr. David Alan Gilbert | a22463a | 2016-06-13 12:16:41 +0100 | [diff] [blame] | 766 | } |
| 767 | } |
| 768 | |
Juan Quintela | 930ac04 | 2017-05-04 10:21:46 +0200 | [diff] [blame] | 769 | static void populate_disk_info(MigrationInfo *info) |
| 770 | { |
| 771 | if (blk_mig_active()) { |
| 772 | info->has_disk = true; |
| 773 | info->disk = g_malloc0(sizeof(*info->disk)); |
| 774 | info->disk->transferred = blk_mig_bytes_transferred(); |
| 775 | info->disk->remaining = blk_mig_bytes_remaining(); |
| 776 | info->disk->total = blk_mig_bytes_total(); |
| 777 | } |
| 778 | } |
| 779 | |
Alexey Perevalov | 65ace06 | 2018-03-22 21:17:27 +0300 | [diff] [blame] | 780 | static void fill_source_migration_info(MigrationInfo *info) |
aliguori | 5bb7910 | 2008-10-13 03:12:02 +0000 | [diff] [blame] | 781 | { |
Juan Quintela | 17549e8 | 2011-10-05 13:50:43 +0200 | [diff] [blame] | 782 | MigrationState *s = migrate_get_current(); |
aliguori | 376253e | 2009-03-05 23:01:23 +0000 | [diff] [blame] | 783 | |
Juan Quintela | 17549e8 | 2011-10-05 13:50:43 +0200 | [diff] [blame] | 784 | switch (s->state) { |
zhanghailiang | 3119473 | 2015-03-13 16:08:38 +0800 | [diff] [blame] | 785 | case MIGRATION_STATUS_NONE: |
Juan Quintela | 17549e8 | 2011-10-05 13:50:43 +0200 | [diff] [blame] | 786 | /* no migration has happened ever */ |
Alexey Perevalov | 65ace06 | 2018-03-22 21:17:27 +0300 | [diff] [blame] | 787 | /* do not overwrite destination migration status */ |
| 788 | return; |
Juan Quintela | 17549e8 | 2011-10-05 13:50:43 +0200 | [diff] [blame] | 789 | break; |
zhanghailiang | 3119473 | 2015-03-13 16:08:38 +0800 | [diff] [blame] | 790 | case MIGRATION_STATUS_SETUP: |
Michael R. Hines | 29ae8a4 | 2013-07-22 10:01:57 -0400 | [diff] [blame] | 791 | info->has_status = true; |
Michael R. Hines | ed4fbd1 | 2013-07-22 10:01:58 -0400 | [diff] [blame] | 792 | info->has_total_time = false; |
Michael R. Hines | 29ae8a4 | 2013-07-22 10:01:57 -0400 | [diff] [blame] | 793 | break; |
zhanghailiang | 3119473 | 2015-03-13 16:08:38 +0800 | [diff] [blame] | 794 | case MIGRATION_STATUS_ACTIVE: |
| 795 | case MIGRATION_STATUS_CANCELLING: |
Dr. David Alan Gilbert | 9ec055a | 2015-11-05 18:10:58 +0000 | [diff] [blame] | 796 | case MIGRATION_STATUS_POSTCOPY_ACTIVE: |
Dr. David Alan Gilbert | 31e0607 | 2017-10-20 10:05:51 +0100 | [diff] [blame] | 797 | case MIGRATION_STATUS_PRE_SWITCHOVER: |
| 798 | case MIGRATION_STATUS_DEVICE: |
Peter Xu | a688d2c | 2018-05-02 18:47:18 +0800 | [diff] [blame] | 799 | case MIGRATION_STATUS_POSTCOPY_PAUSED: |
Peter Xu | 135b87b | 2018-05-02 18:47:25 +0800 | [diff] [blame] | 800 | case MIGRATION_STATUS_POSTCOPY_RECOVER: |
Juan Quintela | c8f9f4f | 2017-06-06 19:21:29 +0200 | [diff] [blame] | 801 | /* TODO add some postcopy stats */ |
Dr. David Alan Gilbert | 9ec055a | 2015-11-05 18:10:58 +0000 | [diff] [blame] | 802 | info->has_status = true; |
| 803 | info->has_total_time = true; |
| 804 | info->total_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME) |
Peter Xu | 4af246a | 2018-01-03 20:20:08 +0800 | [diff] [blame] | 805 | - s->start_time; |
Dr. David Alan Gilbert | 9ec055a | 2015-11-05 18:10:58 +0000 | [diff] [blame] | 806 | info->has_expected_downtime = true; |
| 807 | info->expected_downtime = s->expected_downtime; |
| 808 | info->has_setup_time = true; |
| 809 | info->setup_time = s->setup_time; |
| 810 | |
Dr. David Alan Gilbert | a22463a | 2016-06-13 12:16:41 +0100 | [diff] [blame] | 811 | populate_ram_info(info, s); |
Juan Quintela | 930ac04 | 2017-05-04 10:21:46 +0200 | [diff] [blame] | 812 | populate_disk_info(info); |
Dr. David Alan Gilbert | 9ec055a | 2015-11-05 18:10:58 +0000 | [diff] [blame] | 813 | break; |
zhanghailiang | 0b827d5 | 2016-10-27 14:42:54 +0800 | [diff] [blame] | 814 | case MIGRATION_STATUS_COLO: |
| 815 | info->has_status = true; |
| 816 | /* TODO: display COLO specific information (checkpoint info etc.) */ |
| 817 | break; |
zhanghailiang | 3119473 | 2015-03-13 16:08:38 +0800 | [diff] [blame] | 818 | case MIGRATION_STATUS_COMPLETED: |
Luiz Capitulino | 791e7c8 | 2011-09-13 17:37:16 -0300 | [diff] [blame] | 819 | info->has_status = true; |
Pawit Pornkitprasan | 00c1499 | 2013-07-19 11:23:45 +0900 | [diff] [blame] | 820 | info->has_total_time = true; |
Juan Quintela | 7aa939a | 2012-08-18 13:17:10 +0200 | [diff] [blame] | 821 | info->total_time = s->total_time; |
Juan Quintela | 9c5a9fc | 2012-08-13 09:35:16 +0200 | [diff] [blame] | 822 | info->has_downtime = true; |
| 823 | info->downtime = s->downtime; |
Michael R. Hines | ed4fbd1 | 2013-07-22 10:01:58 -0400 | [diff] [blame] | 824 | info->has_setup_time = true; |
| 825 | info->setup_time = s->setup_time; |
Juan Quintela | d5f8a57 | 2012-05-21 22:01:07 +0200 | [diff] [blame] | 826 | |
Dr. David Alan Gilbert | a22463a | 2016-06-13 12:16:41 +0100 | [diff] [blame] | 827 | populate_ram_info(info, s); |
Juan Quintela | 17549e8 | 2011-10-05 13:50:43 +0200 | [diff] [blame] | 828 | break; |
zhanghailiang | 3119473 | 2015-03-13 16:08:38 +0800 | [diff] [blame] | 829 | case MIGRATION_STATUS_FAILED: |
Luiz Capitulino | 791e7c8 | 2011-09-13 17:37:16 -0300 | [diff] [blame] | 830 | info->has_status = true; |
Daniel P. Berrange | d59ce6f | 2016-04-27 11:05:00 +0100 | [diff] [blame] | 831 | if (s->error) { |
| 832 | info->has_error_desc = true; |
| 833 | info->error_desc = g_strdup(error_get_pretty(s->error)); |
| 834 | } |
Juan Quintela | 17549e8 | 2011-10-05 13:50:43 +0200 | [diff] [blame] | 835 | break; |
zhanghailiang | 3119473 | 2015-03-13 16:08:38 +0800 | [diff] [blame] | 836 | case MIGRATION_STATUS_CANCELLED: |
Luiz Capitulino | 791e7c8 | 2011-09-13 17:37:16 -0300 | [diff] [blame] | 837 | info->has_status = true; |
Juan Quintela | 17549e8 | 2011-10-05 13:50:43 +0200 | [diff] [blame] | 838 | break; |
aliguori | 5bb7910 | 2008-10-13 03:12:02 +0000 | [diff] [blame] | 839 | } |
zhanghailiang | cde63fb | 2015-03-13 16:08:41 +0800 | [diff] [blame] | 840 | info->status = s->state; |
aliguori | 5bb7910 | 2008-10-13 03:12:02 +0000 | [diff] [blame] | 841 | } |
| 842 | |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 843 | /** |
| 844 | * @migration_caps_check - check capability validity |
| 845 | * |
| 846 | * @cap_list: old capability list, array of bool |
| 847 | * @params: new capabilities to be applied soon |
| 848 | * @errp: set *errp if the check failed, with reason |
| 849 | * |
| 850 | * Returns true if check passed, otherwise false. |
| 851 | */ |
| 852 | static bool migrate_caps_check(bool *cap_list, |
| 853 | MigrationCapabilityStatusList *params, |
| 854 | Error **errp) |
Orit Wasserman | 0045843 | 2012-08-06 21:42:48 +0300 | [diff] [blame] | 855 | { |
Orit Wasserman | 0045843 | 2012-08-06 21:42:48 +0300 | [diff] [blame] | 856 | MigrationCapabilityStatusList *cap; |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 857 | bool old_postcopy_cap; |
Alexey Perevalov | d7651f1 | 2017-09-19 19:47:56 +0300 | [diff] [blame] | 858 | MigrationIncomingState *mis = migration_incoming_get_current(); |
Orit Wasserman | 0045843 | 2012-08-06 21:42:48 +0300 | [diff] [blame] | 859 | |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 860 | old_postcopy_cap = cap_list[MIGRATION_CAPABILITY_POSTCOPY_RAM]; |
Orit Wasserman | 0045843 | 2012-08-06 21:42:48 +0300 | [diff] [blame] | 861 | |
| 862 | for (cap = params; cap; cap = cap->next) { |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 863 | cap_list[cap->value->capability] = cap->value->state; |
Orit Wasserman | 0045843 | 2012-08-06 21:42:48 +0300 | [diff] [blame] | 864 | } |
Dr. David Alan Gilbert | 53dd370 | 2015-11-05 18:10:51 +0000 | [diff] [blame] | 865 | |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 866 | #ifndef CONFIG_LIVE_BLOCK_MIGRATION |
| 867 | if (cap_list[MIGRATION_CAPABILITY_BLOCK]) { |
| 868 | error_setg(errp, "QEMU compiled without old-style (blk/-b, inc/-i) " |
| 869 | "block migration"); |
| 870 | error_append_hint(errp, "Use drive_mirror+NBD instead.\n"); |
| 871 | return false; |
| 872 | } |
| 873 | #endif |
| 874 | |
| 875 | if (cap_list[MIGRATION_CAPABILITY_POSTCOPY_RAM]) { |
| 876 | if (cap_list[MIGRATION_CAPABILITY_COMPRESS]) { |
Dr. David Alan Gilbert | 53dd370 | 2015-11-05 18:10:51 +0000 | [diff] [blame] | 877 | /* The decompression threads asynchronously write into RAM |
| 878 | * rather than use the atomic copies needed to avoid |
| 879 | * userfaulting. It should be possible to fix the decompression |
| 880 | * threads for compatibility in future. |
| 881 | */ |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 882 | error_setg(errp, "Postcopy is not currently compatible " |
| 883 | "with compression"); |
| 884 | return false; |
Dr. David Alan Gilbert | 53dd370 | 2015-11-05 18:10:51 +0000 | [diff] [blame] | 885 | } |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 886 | |
Dr. David Alan Gilbert | 096631b | 2016-06-13 12:16:45 +0100 | [diff] [blame] | 887 | /* This check is reasonably expensive, so only when it's being |
| 888 | * set the first time, also it's only the destination that needs |
| 889 | * special support. |
| 890 | */ |
| 891 | if (!old_postcopy_cap && runstate_check(RUN_STATE_INMIGRATE) && |
Alexey Perevalov | d7651f1 | 2017-09-19 19:47:56 +0300 | [diff] [blame] | 892 | !postcopy_ram_supported_by_host(mis)) { |
Dr. David Alan Gilbert | 096631b | 2016-06-13 12:16:45 +0100 | [diff] [blame] | 893 | /* postcopy_ram_supported_by_host will have emitted a more |
| 894 | * detailed message |
| 895 | */ |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 896 | error_setg(errp, "Postcopy is not supported"); |
| 897 | return false; |
Dr. David Alan Gilbert | 096631b | 2016-06-13 12:16:45 +0100 | [diff] [blame] | 898 | } |
Dr. David Alan Gilbert | 53dd370 | 2015-11-05 18:10:51 +0000 | [diff] [blame] | 899 | } |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 900 | |
| 901 | return true; |
| 902 | } |
| 903 | |
Alexey Perevalov | 65ace06 | 2018-03-22 21:17:27 +0300 | [diff] [blame] | 904 | static void fill_destination_migration_info(MigrationInfo *info) |
| 905 | { |
| 906 | MigrationIncomingState *mis = migration_incoming_get_current(); |
| 907 | |
| 908 | switch (mis->state) { |
| 909 | case MIGRATION_STATUS_NONE: |
| 910 | return; |
| 911 | break; |
| 912 | case MIGRATION_STATUS_SETUP: |
| 913 | case MIGRATION_STATUS_CANCELLING: |
| 914 | case MIGRATION_STATUS_CANCELLED: |
| 915 | case MIGRATION_STATUS_ACTIVE: |
| 916 | case MIGRATION_STATUS_POSTCOPY_ACTIVE: |
Peter Xu | 3c9928d | 2018-07-10 17:18:56 +0800 | [diff] [blame] | 917 | case MIGRATION_STATUS_POSTCOPY_PAUSED: |
| 918 | case MIGRATION_STATUS_POSTCOPY_RECOVER: |
Alexey Perevalov | 65ace06 | 2018-03-22 21:17:27 +0300 | [diff] [blame] | 919 | case MIGRATION_STATUS_FAILED: |
| 920 | case MIGRATION_STATUS_COLO: |
| 921 | info->has_status = true; |
| 922 | break; |
| 923 | case MIGRATION_STATUS_COMPLETED: |
| 924 | info->has_status = true; |
| 925 | fill_destination_postcopy_migration_info(info); |
| 926 | break; |
| 927 | } |
| 928 | info->status = mis->state; |
| 929 | } |
| 930 | |
| 931 | MigrationInfo *qmp_query_migrate(Error **errp) |
| 932 | { |
| 933 | MigrationInfo *info = g_malloc0(sizeof(*info)); |
| 934 | |
| 935 | fill_destination_migration_info(info); |
| 936 | fill_source_migration_info(info); |
| 937 | |
| 938 | return info; |
| 939 | } |
| 940 | |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 941 | void qmp_migrate_set_capabilities(MigrationCapabilityStatusList *params, |
| 942 | Error **errp) |
| 943 | { |
| 944 | MigrationState *s = migrate_get_current(); |
| 945 | MigrationCapabilityStatusList *cap; |
Peter Xu | dd0ee30 | 2018-03-05 17:49:38 +0800 | [diff] [blame] | 946 | bool cap_list[MIGRATION_CAPABILITY__MAX]; |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 947 | |
| 948 | if (migration_is_setup_or_active(s->state)) { |
| 949 | error_setg(errp, QERR_MIGRATION_ACTIVE); |
| 950 | return; |
| 951 | } |
| 952 | |
Peter Xu | dd0ee30 | 2018-03-05 17:49:38 +0800 | [diff] [blame] | 953 | memcpy(cap_list, s->enabled_capabilities, sizeof(cap_list)); |
| 954 | if (!migrate_caps_check(cap_list, params, errp)) { |
Peter Xu | 4a84214 | 2017-07-18 11:39:08 +0800 | [diff] [blame] | 955 | return; |
| 956 | } |
| 957 | |
| 958 | for (cap = params; cap; cap = cap->next) { |
| 959 | s->enabled_capabilities[cap->value->capability] = cap->value->state; |
| 960 | } |
Orit Wasserman | 0045843 | 2012-08-06 21:42:48 +0300 | [diff] [blame] | 961 | } |
| 962 | |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 963 | /* |
| 964 | * Check whether the parameters are valid. Error will be put into errp |
| 965 | * (if provided). Return true if valid, otherwise false. |
| 966 | */ |
| 967 | static bool migrate_params_check(MigrationParameters *params, Error **errp) |
Liang Li | 85de832 | 2015-03-23 16:32:28 +0800 | [diff] [blame] | 968 | { |
Eric Blake | 7f375e0 | 2016-09-08 22:14:16 -0500 | [diff] [blame] | 969 | if (params->has_compress_level && |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 970 | (params->compress_level > 9)) { |
Markus Armbruster | c6bd8c7 | 2015-03-17 11:54:50 +0100 | [diff] [blame] | 971 | error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "compress_level", |
| 972 | "is invalid, it should be in the range of 0 to 9"); |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 973 | return false; |
Liang Li | 85de832 | 2015-03-23 16:32:28 +0800 | [diff] [blame] | 974 | } |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 975 | |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 976 | if (params->has_compress_threads && (params->compress_threads < 1)) { |
Markus Armbruster | c6bd8c7 | 2015-03-17 11:54:50 +0100 | [diff] [blame] | 977 | error_setg(errp, QERR_INVALID_PARAMETER_VALUE, |
| 978 | "compress_threads", |
| 979 | "is invalid, it should be in the range of 1 to 255"); |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 980 | return false; |
Liang Li | 85de832 | 2015-03-23 16:32:28 +0800 | [diff] [blame] | 981 | } |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 982 | |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 983 | if (params->has_decompress_threads && (params->decompress_threads < 1)) { |
Markus Armbruster | c6bd8c7 | 2015-03-17 11:54:50 +0100 | [diff] [blame] | 984 | error_setg(errp, QERR_INVALID_PARAMETER_VALUE, |
| 985 | "decompress_threads", |
| 986 | "is invalid, it should be in the range of 1 to 255"); |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 987 | return false; |
Liang Li | 85de832 | 2015-03-23 16:32:28 +0800 | [diff] [blame] | 988 | } |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 989 | |
Eric Blake | 7f375e0 | 2016-09-08 22:14:16 -0500 | [diff] [blame] | 990 | if (params->has_cpu_throttle_initial && |
| 991 | (params->cpu_throttle_initial < 1 || |
| 992 | params->cpu_throttle_initial > 99)) { |
Jason J. Herne | 1626fee | 2015-09-08 13:12:34 -0400 | [diff] [blame] | 993 | error_setg(errp, QERR_INVALID_PARAMETER_VALUE, |
Jason J. Herne | d85a31d | 2016-04-21 14:07:18 -0400 | [diff] [blame] | 994 | "cpu_throttle_initial", |
Jason J. Herne | 1626fee | 2015-09-08 13:12:34 -0400 | [diff] [blame] | 995 | "an integer in the range of 1 to 99"); |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 996 | return false; |
Jason J. Herne | 1626fee | 2015-09-08 13:12:34 -0400 | [diff] [blame] | 997 | } |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 998 | |
Eric Blake | 7f375e0 | 2016-09-08 22:14:16 -0500 | [diff] [blame] | 999 | if (params->has_cpu_throttle_increment && |
| 1000 | (params->cpu_throttle_increment < 1 || |
| 1001 | params->cpu_throttle_increment > 99)) { |
Jason J. Herne | 1626fee | 2015-09-08 13:12:34 -0400 | [diff] [blame] | 1002 | error_setg(errp, QERR_INVALID_PARAMETER_VALUE, |
Jason J. Herne | d85a31d | 2016-04-21 14:07:18 -0400 | [diff] [blame] | 1003 | "cpu_throttle_increment", |
Jason J. Herne | 1626fee | 2015-09-08 13:12:34 -0400 | [diff] [blame] | 1004 | "an integer in the range of 1 to 99"); |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 1005 | return false; |
Jason J. Herne | 1626fee | 2015-09-08 13:12:34 -0400 | [diff] [blame] | 1006 | } |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 1007 | |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 1008 | if (params->has_max_bandwidth && (params->max_bandwidth > SIZE_MAX)) { |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 1009 | error_setg(errp, "Parameter 'max_bandwidth' expects an integer in the" |
| 1010 | " range of 0 to %zu bytes/second", SIZE_MAX); |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 1011 | return false; |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 1012 | } |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 1013 | |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 1014 | if (params->has_downtime_limit && |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 1015 | (params->downtime_limit > MAX_MIGRATE_DOWNTIME)) { |
Daniel Henrique Barboza | 87c9cc1 | 2017-02-22 12:17:29 -0300 | [diff] [blame] | 1016 | error_setg(errp, "Parameter 'downtime_limit' expects an integer in " |
| 1017 | "the range of 0 to %d milliseconds", |
| 1018 | MAX_MIGRATE_DOWNTIME); |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 1019 | return false; |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 1020 | } |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 1021 | |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 1022 | /* x_checkpoint_delay is now always positive */ |
| 1023 | |
| 1024 | if (params->has_x_multifd_channels && (params->x_multifd_channels < 1)) { |
Juan Quintela | 4075fb1 | 2016-01-15 08:56:17 +0100 | [diff] [blame] | 1025 | error_setg(errp, QERR_INVALID_PARAMETER_VALUE, |
| 1026 | "multifd_channels", |
| 1027 | "is invalid, it should be in the range of 1 to 255"); |
| 1028 | return false; |
| 1029 | } |
Juan Quintela | 0fb8660 | 2017-04-27 10:48:25 +0200 | [diff] [blame] | 1030 | if (params->has_x_multifd_page_count && |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 1031 | (params->x_multifd_page_count < 1 || |
| 1032 | params->x_multifd_page_count > 10000)) { |
Juan Quintela | 0fb8660 | 2017-04-27 10:48:25 +0200 | [diff] [blame] | 1033 | error_setg(errp, QERR_INVALID_PARAMETER_VALUE, |
| 1034 | "multifd_page_count", |
| 1035 | "is invalid, it should be in the range of 1 to 10000"); |
| 1036 | return false; |
| 1037 | } |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 1038 | |
Juan Quintela | 73af8dd | 2017-10-05 21:30:10 +0200 | [diff] [blame] | 1039 | if (params->has_xbzrle_cache_size && |
| 1040 | (params->xbzrle_cache_size < qemu_target_page_size() || |
| 1041 | !is_power_of_2(params->xbzrle_cache_size))) { |
| 1042 | error_setg(errp, QERR_INVALID_PARAMETER_VALUE, |
| 1043 | "xbzrle_cache_size", |
| 1044 | "is invalid, it should be bigger than target page size" |
| 1045 | " and a power of two"); |
| 1046 | return false; |
| 1047 | } |
| 1048 | |
Li Qiang | 4cbc9c7 | 2018-08-01 06:00:20 -0700 | [diff] [blame] | 1049 | if (params->has_max_cpu_throttle && |
| 1050 | (params->max_cpu_throttle < params->cpu_throttle_initial || |
| 1051 | params->max_cpu_throttle > 99)) { |
| 1052 | error_setg(errp, QERR_INVALID_PARAMETER_VALUE, |
| 1053 | "max_cpu_throttle", |
| 1054 | "an integer in the range of cpu_throttle_initial to 99"); |
| 1055 | return false; |
| 1056 | } |
| 1057 | |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 1058 | return true; |
| 1059 | } |
| 1060 | |
Markus Armbruster | 1bda8b3 | 2017-07-18 13:42:11 +0200 | [diff] [blame] | 1061 | static void migrate_params_test_apply(MigrateSetParameters *params, |
| 1062 | MigrationParameters *dest) |
| 1063 | { |
| 1064 | *dest = migrate_get_current()->parameters; |
| 1065 | |
| 1066 | /* TODO use QAPI_CLONE() instead of duplicating it inline */ |
| 1067 | |
| 1068 | if (params->has_compress_level) { |
| 1069 | dest->compress_level = params->compress_level; |
| 1070 | } |
| 1071 | |
| 1072 | if (params->has_compress_threads) { |
| 1073 | dest->compress_threads = params->compress_threads; |
| 1074 | } |
| 1075 | |
| 1076 | if (params->has_decompress_threads) { |
| 1077 | dest->decompress_threads = params->decompress_threads; |
| 1078 | } |
| 1079 | |
| 1080 | if (params->has_cpu_throttle_initial) { |
| 1081 | dest->cpu_throttle_initial = params->cpu_throttle_initial; |
| 1082 | } |
| 1083 | |
| 1084 | if (params->has_cpu_throttle_increment) { |
| 1085 | dest->cpu_throttle_increment = params->cpu_throttle_increment; |
| 1086 | } |
| 1087 | |
| 1088 | if (params->has_tls_creds) { |
Markus Armbruster | 01fa559 | 2017-07-18 14:42:04 +0200 | [diff] [blame] | 1089 | assert(params->tls_creds->type == QTYPE_QSTRING); |
| 1090 | dest->tls_creds = g_strdup(params->tls_creds->u.s); |
Markus Armbruster | 1bda8b3 | 2017-07-18 13:42:11 +0200 | [diff] [blame] | 1091 | } |
| 1092 | |
| 1093 | if (params->has_tls_hostname) { |
Markus Armbruster | 01fa559 | 2017-07-18 14:42:04 +0200 | [diff] [blame] | 1094 | assert(params->tls_hostname->type == QTYPE_QSTRING); |
| 1095 | dest->tls_hostname = g_strdup(params->tls_hostname->u.s); |
Markus Armbruster | 1bda8b3 | 2017-07-18 13:42:11 +0200 | [diff] [blame] | 1096 | } |
| 1097 | |
| 1098 | if (params->has_max_bandwidth) { |
| 1099 | dest->max_bandwidth = params->max_bandwidth; |
| 1100 | } |
| 1101 | |
| 1102 | if (params->has_downtime_limit) { |
| 1103 | dest->downtime_limit = params->downtime_limit; |
| 1104 | } |
| 1105 | |
| 1106 | if (params->has_x_checkpoint_delay) { |
| 1107 | dest->x_checkpoint_delay = params->x_checkpoint_delay; |
| 1108 | } |
| 1109 | |
| 1110 | if (params->has_block_incremental) { |
| 1111 | dest->block_incremental = params->block_incremental; |
| 1112 | } |
Juan Quintela | 5e7577a | 2017-10-09 18:07:56 +0200 | [diff] [blame] | 1113 | if (params->has_x_multifd_channels) { |
| 1114 | dest->x_multifd_channels = params->x_multifd_channels; |
| 1115 | } |
| 1116 | if (params->has_x_multifd_page_count) { |
| 1117 | dest->x_multifd_page_count = params->x_multifd_page_count; |
| 1118 | } |
Juan Quintela | 73af8dd | 2017-10-05 21:30:10 +0200 | [diff] [blame] | 1119 | if (params->has_xbzrle_cache_size) { |
| 1120 | dest->xbzrle_cache_size = params->xbzrle_cache_size; |
| 1121 | } |
Dr. David Alan Gilbert | 7e555c6 | 2018-06-13 11:26:40 +0100 | [diff] [blame] | 1122 | if (params->has_max_postcopy_bandwidth) { |
| 1123 | dest->max_postcopy_bandwidth = params->max_postcopy_bandwidth; |
| 1124 | } |
Li Qiang | 4cbc9c7 | 2018-08-01 06:00:20 -0700 | [diff] [blame] | 1125 | if (params->has_max_cpu_throttle) { |
| 1126 | dest->max_cpu_throttle = params->max_cpu_throttle; |
| 1127 | } |
Markus Armbruster | 1bda8b3 | 2017-07-18 13:42:11 +0200 | [diff] [blame] | 1128 | } |
| 1129 | |
Juan Quintela | 73af8dd | 2017-10-05 21:30:10 +0200 | [diff] [blame] | 1130 | static void migrate_params_apply(MigrateSetParameters *params, Error **errp) |
Peter Xu | 16d063b | 2017-07-18 11:39:04 +0800 | [diff] [blame] | 1131 | { |
| 1132 | MigrationState *s = migrate_get_current(); |
| 1133 | |
Markus Armbruster | e87fae4 | 2017-07-18 12:57:38 +0200 | [diff] [blame] | 1134 | /* TODO use QAPI_CLONE() instead of duplicating it inline */ |
| 1135 | |
Eric Blake | 7f375e0 | 2016-09-08 22:14:16 -0500 | [diff] [blame] | 1136 | if (params->has_compress_level) { |
| 1137 | s->parameters.compress_level = params->compress_level; |
Liang Li | 85de832 | 2015-03-23 16:32:28 +0800 | [diff] [blame] | 1138 | } |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1139 | |
Eric Blake | 7f375e0 | 2016-09-08 22:14:16 -0500 | [diff] [blame] | 1140 | if (params->has_compress_threads) { |
| 1141 | s->parameters.compress_threads = params->compress_threads; |
Liang Li | 85de832 | 2015-03-23 16:32:28 +0800 | [diff] [blame] | 1142 | } |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1143 | |
Eric Blake | 7f375e0 | 2016-09-08 22:14:16 -0500 | [diff] [blame] | 1144 | if (params->has_decompress_threads) { |
| 1145 | s->parameters.decompress_threads = params->decompress_threads; |
Liang Li | 85de832 | 2015-03-23 16:32:28 +0800 | [diff] [blame] | 1146 | } |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1147 | |
Eric Blake | 7f375e0 | 2016-09-08 22:14:16 -0500 | [diff] [blame] | 1148 | if (params->has_cpu_throttle_initial) { |
| 1149 | s->parameters.cpu_throttle_initial = params->cpu_throttle_initial; |
Jason J. Herne | 1626fee | 2015-09-08 13:12:34 -0400 | [diff] [blame] | 1150 | } |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1151 | |
Eric Blake | 7f375e0 | 2016-09-08 22:14:16 -0500 | [diff] [blame] | 1152 | if (params->has_cpu_throttle_increment) { |
| 1153 | s->parameters.cpu_throttle_increment = params->cpu_throttle_increment; |
Jason J. Herne | 1626fee | 2015-09-08 13:12:34 -0400 | [diff] [blame] | 1154 | } |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1155 | |
Eric Blake | 7f375e0 | 2016-09-08 22:14:16 -0500 | [diff] [blame] | 1156 | if (params->has_tls_creds) { |
Daniel P. Berrange | 69ef1f3 | 2016-04-27 11:05:15 +0100 | [diff] [blame] | 1157 | g_free(s->parameters.tls_creds); |
Markus Armbruster | 01fa559 | 2017-07-18 14:42:04 +0200 | [diff] [blame] | 1158 | assert(params->tls_creds->type == QTYPE_QSTRING); |
| 1159 | s->parameters.tls_creds = g_strdup(params->tls_creds->u.s); |
Daniel P. Berrange | 69ef1f3 | 2016-04-27 11:05:15 +0100 | [diff] [blame] | 1160 | } |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1161 | |
Eric Blake | 7f375e0 | 2016-09-08 22:14:16 -0500 | [diff] [blame] | 1162 | if (params->has_tls_hostname) { |
Daniel P. Berrange | 69ef1f3 | 2016-04-27 11:05:15 +0100 | [diff] [blame] | 1163 | g_free(s->parameters.tls_hostname); |
Markus Armbruster | 01fa559 | 2017-07-18 14:42:04 +0200 | [diff] [blame] | 1164 | assert(params->tls_hostname->type == QTYPE_QSTRING); |
| 1165 | s->parameters.tls_hostname = g_strdup(params->tls_hostname->u.s); |
Daniel P. Berrange | 69ef1f3 | 2016-04-27 11:05:15 +0100 | [diff] [blame] | 1166 | } |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1167 | |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 1168 | if (params->has_max_bandwidth) { |
| 1169 | s->parameters.max_bandwidth = params->max_bandwidth; |
| 1170 | if (s->to_dst_file) { |
| 1171 | qemu_file_set_rate_limit(s->to_dst_file, |
| 1172 | s->parameters.max_bandwidth / XFER_LIMIT_RATIO); |
| 1173 | } |
| 1174 | } |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1175 | |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 1176 | if (params->has_downtime_limit) { |
| 1177 | s->parameters.downtime_limit = params->downtime_limit; |
| 1178 | } |
zhanghailiang | 68b5359 | 2016-10-27 14:43:01 +0800 | [diff] [blame] | 1179 | |
| 1180 | if (params->has_x_checkpoint_delay) { |
| 1181 | s->parameters.x_checkpoint_delay = params->x_checkpoint_delay; |
zhanghailiang | 479125d | 2017-01-17 20:57:42 +0800 | [diff] [blame] | 1182 | if (migration_in_colo_state()) { |
| 1183 | colo_checkpoint_notify(s); |
| 1184 | } |
zhanghailiang | 68b5359 | 2016-10-27 14:43:01 +0800 | [diff] [blame] | 1185 | } |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1186 | |
Juan Quintela | 2833c59 | 2017-04-05 18:32:37 +0200 | [diff] [blame] | 1187 | if (params->has_block_incremental) { |
| 1188 | s->parameters.block_incremental = params->block_incremental; |
| 1189 | } |
Juan Quintela | 4075fb1 | 2016-01-15 08:56:17 +0100 | [diff] [blame] | 1190 | if (params->has_x_multifd_channels) { |
| 1191 | s->parameters.x_multifd_channels = params->x_multifd_channels; |
| 1192 | } |
Juan Quintela | 0fb8660 | 2017-04-27 10:48:25 +0200 | [diff] [blame] | 1193 | if (params->has_x_multifd_page_count) { |
| 1194 | s->parameters.x_multifd_page_count = params->x_multifd_page_count; |
| 1195 | } |
Juan Quintela | 73af8dd | 2017-10-05 21:30:10 +0200 | [diff] [blame] | 1196 | if (params->has_xbzrle_cache_size) { |
| 1197 | s->parameters.xbzrle_cache_size = params->xbzrle_cache_size; |
| 1198 | xbzrle_cache_resize(params->xbzrle_cache_size, errp); |
| 1199 | } |
Dr. David Alan Gilbert | 7e555c6 | 2018-06-13 11:26:40 +0100 | [diff] [blame] | 1200 | if (params->has_max_postcopy_bandwidth) { |
| 1201 | s->parameters.max_postcopy_bandwidth = params->max_postcopy_bandwidth; |
| 1202 | } |
Li Qiang | 4cbc9c7 | 2018-08-01 06:00:20 -0700 | [diff] [blame] | 1203 | if (params->has_max_cpu_throttle) { |
| 1204 | s->parameters.max_cpu_throttle = params->max_cpu_throttle; |
| 1205 | } |
Liang Li | 85de832 | 2015-03-23 16:32:28 +0800 | [diff] [blame] | 1206 | } |
| 1207 | |
Markus Armbruster | 1bda8b3 | 2017-07-18 13:42:11 +0200 | [diff] [blame] | 1208 | void qmp_migrate_set_parameters(MigrateSetParameters *params, Error **errp) |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1209 | { |
Markus Armbruster | 1bda8b3 | 2017-07-18 13:42:11 +0200 | [diff] [blame] | 1210 | MigrationParameters tmp; |
| 1211 | |
Markus Armbruster | 01fa559 | 2017-07-18 14:42:04 +0200 | [diff] [blame] | 1212 | /* TODO Rewrite "" to null instead */ |
| 1213 | if (params->has_tls_creds |
| 1214 | && params->tls_creds->type == QTYPE_QNULL) { |
Marc-André Lureau | cb3e7f0 | 2018-04-19 17:01:43 +0200 | [diff] [blame] | 1215 | qobject_unref(params->tls_creds->u.n); |
Markus Armbruster | 01fa559 | 2017-07-18 14:42:04 +0200 | [diff] [blame] | 1216 | params->tls_creds->type = QTYPE_QSTRING; |
| 1217 | params->tls_creds->u.s = strdup(""); |
| 1218 | } |
| 1219 | /* TODO Rewrite "" to null instead */ |
| 1220 | if (params->has_tls_hostname |
| 1221 | && params->tls_hostname->type == QTYPE_QNULL) { |
Marc-André Lureau | cb3e7f0 | 2018-04-19 17:01:43 +0200 | [diff] [blame] | 1222 | qobject_unref(params->tls_hostname->u.n); |
Markus Armbruster | 01fa559 | 2017-07-18 14:42:04 +0200 | [diff] [blame] | 1223 | params->tls_hostname->type = QTYPE_QSTRING; |
| 1224 | params->tls_hostname->u.s = strdup(""); |
| 1225 | } |
| 1226 | |
Markus Armbruster | 1bda8b3 | 2017-07-18 13:42:11 +0200 | [diff] [blame] | 1227 | migrate_params_test_apply(params, &tmp); |
| 1228 | |
| 1229 | if (!migrate_params_check(&tmp, errp)) { |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1230 | /* Invalid parameter */ |
| 1231 | return; |
| 1232 | } |
| 1233 | |
Juan Quintela | 73af8dd | 2017-10-05 21:30:10 +0200 | [diff] [blame] | 1234 | migrate_params_apply(params, errp); |
Peter Xu | 476c72a | 2017-07-18 11:39:05 +0800 | [diff] [blame] | 1235 | } |
| 1236 | |
Daniel P. Berrange | 2594f56 | 2016-04-27 11:05:14 +0100 | [diff] [blame] | 1237 | |
Dr. David Alan Gilbert | 4886a1b | 2015-11-05 18:10:56 +0000 | [diff] [blame] | 1238 | void qmp_migrate_start_postcopy(Error **errp) |
| 1239 | { |
| 1240 | MigrationState *s = migrate_get_current(); |
| 1241 | |
Vladimir Sementsov-Ogievskiy | 16b0fd3 | 2018-03-13 15:34:01 -0400 | [diff] [blame] | 1242 | if (!migrate_postcopy()) { |
Dr. David Alan Gilbert | a54d340 | 2015-11-12 11:34:44 +0000 | [diff] [blame] | 1243 | error_setg(errp, "Enable postcopy with migrate_set_capability before" |
Dr. David Alan Gilbert | 4886a1b | 2015-11-05 18:10:56 +0000 | [diff] [blame] | 1244 | " the start of migration"); |
| 1245 | return; |
| 1246 | } |
| 1247 | |
| 1248 | if (s->state == MIGRATION_STATUS_NONE) { |
| 1249 | error_setg(errp, "Postcopy must be started after migration has been" |
| 1250 | " started"); |
| 1251 | return; |
| 1252 | } |
| 1253 | /* |
| 1254 | * we don't error if migration has finished since that would be racy |
| 1255 | * with issuing this command. |
| 1256 | */ |
| 1257 | atomic_set(&s->start_postcopy, true); |
| 1258 | } |
| 1259 | |
aliguori | 065e281 | 2008-11-11 16:46:33 +0000 | [diff] [blame] | 1260 | /* shared migration helpers */ |
| 1261 | |
zhanghailiang | 48781e5 | 2015-12-16 11:47:33 +0000 | [diff] [blame] | 1262 | void migrate_set_state(int *state, int old_state, int new_state) |
Zhanghaoyu (A) | 51cf4c1 | 2013-11-07 11:01:15 +0000 | [diff] [blame] | 1263 | { |
Peter Xu | a31fede | 2017-08-30 16:32:01 +0800 | [diff] [blame] | 1264 | assert(new_state < MIGRATION_STATUS__MAX); |
zhanghailiang | 48781e5 | 2015-12-16 11:47:33 +0000 | [diff] [blame] | 1265 | if (atomic_cmpxchg(state, old_state, new_state) == old_state) { |
Peter Xu | a31fede | 2017-08-30 16:32:01 +0800 | [diff] [blame] | 1266 | trace_migrate_set_state(MigrationStatus_str(new_state)); |
Juan Quintela | b05dc72 | 2015-07-07 14:44:05 +0200 | [diff] [blame] | 1267 | migrate_generate_event(new_state); |
Zhanghaoyu (A) | 51cf4c1 | 2013-11-07 11:01:15 +0000 | [diff] [blame] | 1268 | } |
| 1269 | } |
| 1270 | |
Peter Xu | 4e4a3d3 | 2017-07-18 11:39:09 +0800 | [diff] [blame] | 1271 | static MigrationCapabilityStatusList *migrate_cap_add( |
| 1272 | MigrationCapabilityStatusList *list, |
| 1273 | MigrationCapability index, |
| 1274 | bool state) |
Juan Quintela | 2833c59 | 2017-04-05 18:32:37 +0200 | [diff] [blame] | 1275 | { |
| 1276 | MigrationCapabilityStatusList *cap; |
| 1277 | |
| 1278 | cap = g_new0(MigrationCapabilityStatusList, 1); |
| 1279 | cap->value = g_new0(MigrationCapabilityStatus, 1); |
Peter Xu | 4e4a3d3 | 2017-07-18 11:39:09 +0800 | [diff] [blame] | 1280 | cap->value->capability = index; |
| 1281 | cap->value->state = state; |
| 1282 | cap->next = list; |
| 1283 | |
| 1284 | return cap; |
| 1285 | } |
| 1286 | |
| 1287 | void migrate_set_block_enabled(bool value, Error **errp) |
| 1288 | { |
| 1289 | MigrationCapabilityStatusList *cap; |
| 1290 | |
| 1291 | cap = migrate_cap_add(NULL, MIGRATION_CAPABILITY_BLOCK, value); |
Juan Quintela | 2833c59 | 2017-04-05 18:32:37 +0200 | [diff] [blame] | 1292 | qmp_migrate_set_capabilities(cap, errp); |
| 1293 | qapi_free_MigrationCapabilityStatusList(cap); |
| 1294 | } |
| 1295 | |
| 1296 | static void migrate_set_block_incremental(MigrationState *s, bool value) |
| 1297 | { |
| 1298 | s->parameters.block_incremental = value; |
| 1299 | } |
| 1300 | |
| 1301 | static void block_cleanup_parameters(MigrationState *s) |
| 1302 | { |
| 1303 | if (s->must_remove_block_options) { |
| 1304 | /* setting to false can never fail */ |
| 1305 | migrate_set_block_enabled(false, &error_abort); |
| 1306 | migrate_set_block_incremental(s, false); |
| 1307 | s->must_remove_block_options = false; |
| 1308 | } |
| 1309 | } |
| 1310 | |
Paolo Bonzini | bb1fadc | 2013-02-22 17:36:21 +0100 | [diff] [blame] | 1311 | static void migrate_fd_cleanup(void *opaque) |
aliguori | 065e281 | 2008-11-11 16:46:33 +0000 | [diff] [blame] | 1312 | { |
Paolo Bonzini | bb1fadc | 2013-02-22 17:36:21 +0100 | [diff] [blame] | 1313 | MigrationState *s = opaque; |
| 1314 | |
| 1315 | qemu_bh_delete(s->cleanup_bh); |
| 1316 | s->cleanup_bh = NULL; |
| 1317 | |
Peter Xu | 0ceccd8 | 2018-01-03 20:20:06 +0800 | [diff] [blame] | 1318 | qemu_savevm_state_cleanup(); |
| 1319 | |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 1320 | if (s->to_dst_file) { |
Juan Quintela | f986c3d | 2016-01-14 16:52:55 +0100 | [diff] [blame] | 1321 | Error *local_err = NULL; |
Peter Xu | 62df066 | 2018-05-02 18:47:38 +0800 | [diff] [blame] | 1322 | QEMUFile *tmp; |
Juan Quintela | f986c3d | 2016-01-14 16:52:55 +0100 | [diff] [blame] | 1323 | |
Alexey Kardashevskiy | 9013dca | 2014-03-11 10:42:29 +1100 | [diff] [blame] | 1324 | trace_migrate_fd_cleanup(); |
Paolo Bonzini | 404a7c0 | 2013-02-22 17:36:46 +0100 | [diff] [blame] | 1325 | qemu_mutex_unlock_iothread(); |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 1326 | if (s->migration_thread_running) { |
| 1327 | qemu_thread_join(&s->thread); |
| 1328 | s->migration_thread_running = false; |
| 1329 | } |
Paolo Bonzini | 404a7c0 | 2013-02-22 17:36:46 +0100 | [diff] [blame] | 1330 | qemu_mutex_lock_iothread(); |
| 1331 | |
Juan Quintela | f986c3d | 2016-01-14 16:52:55 +0100 | [diff] [blame] | 1332 | if (multifd_save_cleanup(&local_err) != 0) { |
| 1333 | error_report_err(local_err); |
| 1334 | } |
Peter Xu | 62df066 | 2018-05-02 18:47:38 +0800 | [diff] [blame] | 1335 | qemu_mutex_lock(&s->qemu_file_lock); |
| 1336 | tmp = s->to_dst_file; |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 1337 | s->to_dst_file = NULL; |
Peter Xu | 62df066 | 2018-05-02 18:47:38 +0800 | [diff] [blame] | 1338 | qemu_mutex_unlock(&s->qemu_file_lock); |
| 1339 | /* |
| 1340 | * Close the file handle without the lock to make sure the |
| 1341 | * critical section won't block for long. |
| 1342 | */ |
| 1343 | qemu_fclose(tmp); |
aliguori | 065e281 | 2008-11-11 16:46:33 +0000 | [diff] [blame] | 1344 | } |
| 1345 | |
Dr. David Alan Gilbert | 9ec055a | 2015-11-05 18:10:58 +0000 | [diff] [blame] | 1346 | assert((s->state != MIGRATION_STATUS_ACTIVE) && |
| 1347 | (s->state != MIGRATION_STATUS_POSTCOPY_ACTIVE)); |
Paolo Bonzini | 7a2c172 | 2013-02-22 17:36:09 +0100 | [diff] [blame] | 1348 | |
Liang Li | 94f5a43 | 2015-11-02 15:37:00 +0800 | [diff] [blame] | 1349 | if (s->state == MIGRATION_STATUS_CANCELLING) { |
zhanghailiang | 48781e5 | 2015-12-16 11:47:33 +0000 | [diff] [blame] | 1350 | migrate_set_state(&s->state, MIGRATION_STATUS_CANCELLING, |
Liang Li | 94f5a43 | 2015-11-02 15:37:00 +0800 | [diff] [blame] | 1351 | MIGRATION_STATUS_CANCELLED); |
Paolo Bonzini | 7a2c172 | 2013-02-22 17:36:09 +0100 | [diff] [blame] | 1352 | } |
Paolo Bonzini | a3fa1d7 | 2013-02-22 17:36:18 +0100 | [diff] [blame] | 1353 | |
Juan Quintela | 87db1a7 | 2017-09-05 12:50:22 +0200 | [diff] [blame] | 1354 | if (s->error) { |
| 1355 | /* It is used on info migrate. We can't free it */ |
| 1356 | error_report_err(error_copy(s->error)); |
| 1357 | } |
Paolo Bonzini | a3fa1d7 | 2013-02-22 17:36:18 +0100 | [diff] [blame] | 1358 | notifier_list_notify(&migration_state_notifiers, s); |
Juan Quintela | 2833c59 | 2017-04-05 18:32:37 +0200 | [diff] [blame] | 1359 | block_cleanup_parameters(s); |
aliguori | 065e281 | 2008-11-11 16:46:33 +0000 | [diff] [blame] | 1360 | } |
| 1361 | |
Juan Quintela | 87db1a7 | 2017-09-05 12:50:22 +0200 | [diff] [blame] | 1362 | void migrate_set_error(MigrationState *s, const Error *error) |
| 1363 | { |
| 1364 | qemu_mutex_lock(&s->error_mutex); |
| 1365 | if (!s->error) { |
| 1366 | s->error = error_copy(error); |
| 1367 | } |
| 1368 | qemu_mutex_unlock(&s->error_mutex); |
| 1369 | } |
| 1370 | |
Daniel P. Berrange | d59ce6f | 2016-04-27 11:05:00 +0100 | [diff] [blame] | 1371 | void migrate_fd_error(MigrationState *s, const Error *error) |
aliguori | 065e281 | 2008-11-11 16:46:33 +0000 | [diff] [blame] | 1372 | { |
Peter Maydell | 2517405 | 2016-10-21 18:41:45 +0100 | [diff] [blame] | 1373 | trace_migrate_fd_error(error_get_pretty(error)); |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 1374 | assert(s->to_dst_file == NULL); |
zhanghailiang | 48781e5 | 2015-12-16 11:47:33 +0000 | [diff] [blame] | 1375 | migrate_set_state(&s->state, MIGRATION_STATUS_SETUP, |
| 1376 | MIGRATION_STATUS_FAILED); |
Juan Quintela | 87db1a7 | 2017-09-05 12:50:22 +0200 | [diff] [blame] | 1377 | migrate_set_error(s, error); |
Juan Quintela | 458cf28 | 2011-02-22 23:32:54 +0100 | [diff] [blame] | 1378 | } |
| 1379 | |
Juan Quintela | 0edda1c | 2010-05-11 16:28:39 +0200 | [diff] [blame] | 1380 | static void migrate_fd_cancel(MigrationState *s) |
aliguori | 065e281 | 2008-11-11 16:46:33 +0000 | [diff] [blame] | 1381 | { |
Zhanghaoyu (A) | 6f2b811 | 2013-11-07 08:21:23 +0000 | [diff] [blame] | 1382 | int old_state ; |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 1383 | QEMUFile *f = migrate_get_current()->to_dst_file; |
Alexey Kardashevskiy | 9013dca | 2014-03-11 10:42:29 +1100 | [diff] [blame] | 1384 | trace_migrate_fd_cancel(); |
aliguori | 065e281 | 2008-11-11 16:46:33 +0000 | [diff] [blame] | 1385 | |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 1386 | if (s->rp_state.from_dst_file) { |
| 1387 | /* shutdown the rp socket, so causing the rp thread to shutdown */ |
| 1388 | qemu_file_shutdown(s->rp_state.from_dst_file); |
| 1389 | } |
| 1390 | |
Zhanghaoyu (A) | 6f2b811 | 2013-11-07 08:21:23 +0000 | [diff] [blame] | 1391 | do { |
| 1392 | old_state = s->state; |
Dr. David Alan Gilbert | f6844b9 | 2015-11-05 18:10:48 +0000 | [diff] [blame] | 1393 | if (!migration_is_setup_or_active(old_state)) { |
Zhanghaoyu (A) | 6f2b811 | 2013-11-07 08:21:23 +0000 | [diff] [blame] | 1394 | break; |
| 1395 | } |
Dr. David Alan Gilbert | a7b36b4 | 2017-10-20 10:05:55 +0100 | [diff] [blame] | 1396 | /* If the migration is paused, kick it out of the pause */ |
| 1397 | if (old_state == MIGRATION_STATUS_PRE_SWITCHOVER) { |
| 1398 | qemu_sem_post(&s->pause_sem); |
| 1399 | } |
zhanghailiang | 48781e5 | 2015-12-16 11:47:33 +0000 | [diff] [blame] | 1400 | migrate_set_state(&s->state, old_state, MIGRATION_STATUS_CANCELLING); |
zhanghailiang | 3119473 | 2015-03-13 16:08:38 +0800 | [diff] [blame] | 1401 | } while (s->state != MIGRATION_STATUS_CANCELLING); |
Dr. David Alan Gilbert | a26ba26 | 2015-01-08 11:11:32 +0000 | [diff] [blame] | 1402 | |
| 1403 | /* |
| 1404 | * If we're unlucky the migration code might be stuck somewhere in a |
| 1405 | * send/write while the network has failed and is waiting to timeout; |
| 1406 | * if we've got shutdown(2) available then we can force it to quit. |
| 1407 | * The outgoing qemu file gets closed in migrate_fd_cleanup that is |
| 1408 | * called in a bh, so there is no race against this cancel. |
| 1409 | */ |
zhanghailiang | 3119473 | 2015-03-13 16:08:38 +0800 | [diff] [blame] | 1410 | if (s->state == MIGRATION_STATUS_CANCELLING && f) { |
Dr. David Alan Gilbert | a26ba26 | 2015-01-08 11:11:32 +0000 | [diff] [blame] | 1411 | qemu_file_shutdown(f); |
| 1412 | } |
zhanghailiang | 1d2acc3 | 2017-01-24 15:59:52 +0800 | [diff] [blame] | 1413 | if (s->state == MIGRATION_STATUS_CANCELLING && s->block_inactive) { |
| 1414 | Error *local_err = NULL; |
| 1415 | |
| 1416 | bdrv_invalidate_cache_all(&local_err); |
| 1417 | if (local_err) { |
| 1418 | error_report_err(local_err); |
| 1419 | } else { |
| 1420 | s->block_inactive = false; |
| 1421 | } |
| 1422 | } |
aliguori | 065e281 | 2008-11-11 16:46:33 +0000 | [diff] [blame] | 1423 | } |
| 1424 | |
Gerd Hoffmann | 99a0db9 | 2010-12-13 17:30:12 +0100 | [diff] [blame] | 1425 | void add_migration_state_change_notifier(Notifier *notify) |
| 1426 | { |
| 1427 | notifier_list_add(&migration_state_notifiers, notify); |
| 1428 | } |
| 1429 | |
| 1430 | void remove_migration_state_change_notifier(Notifier *notify) |
| 1431 | { |
Paolo Bonzini | 3155252 | 2012-01-13 17:34:01 +0100 | [diff] [blame] | 1432 | notifier_remove(notify); |
Gerd Hoffmann | 99a0db9 | 2010-12-13 17:30:12 +0100 | [diff] [blame] | 1433 | } |
| 1434 | |
Stefan Hajnoczi | 02edd2e | 2013-07-29 15:01:58 +0200 | [diff] [blame] | 1435 | bool migration_in_setup(MigrationState *s) |
Gerd Hoffmann | afe2df6 | 2011-10-25 13:50:11 +0200 | [diff] [blame] | 1436 | { |
zhanghailiang | 3119473 | 2015-03-13 16:08:38 +0800 | [diff] [blame] | 1437 | return s->state == MIGRATION_STATUS_SETUP; |
Gerd Hoffmann | afe2df6 | 2011-10-25 13:50:11 +0200 | [diff] [blame] | 1438 | } |
| 1439 | |
Juan Quintela | 7073693 | 2011-02-23 00:43:59 +0100 | [diff] [blame] | 1440 | bool migration_has_finished(MigrationState *s) |
Gerd Hoffmann | 99a0db9 | 2010-12-13 17:30:12 +0100 | [diff] [blame] | 1441 | { |
zhanghailiang | 3119473 | 2015-03-13 16:08:38 +0800 | [diff] [blame] | 1442 | return s->state == MIGRATION_STATUS_COMPLETED; |
Gerd Hoffmann | 99a0db9 | 2010-12-13 17:30:12 +0100 | [diff] [blame] | 1443 | } |
Juan Quintela | 0edda1c | 2010-05-11 16:28:39 +0200 | [diff] [blame] | 1444 | |
Gerd Hoffmann | afe2df6 | 2011-10-25 13:50:11 +0200 | [diff] [blame] | 1445 | bool migration_has_failed(MigrationState *s) |
| 1446 | { |
zhanghailiang | 3119473 | 2015-03-13 16:08:38 +0800 | [diff] [blame] | 1447 | return (s->state == MIGRATION_STATUS_CANCELLED || |
| 1448 | s->state == MIGRATION_STATUS_FAILED); |
Gerd Hoffmann | afe2df6 | 2011-10-25 13:50:11 +0200 | [diff] [blame] | 1449 | } |
| 1450 | |
Juan Quintela | 5727309 | 2017-03-20 22:25:28 +0100 | [diff] [blame] | 1451 | bool migration_in_postcopy(void) |
Dr. David Alan Gilbert | 9ec055a | 2015-11-05 18:10:58 +0000 | [diff] [blame] | 1452 | { |
Juan Quintela | 5727309 | 2017-03-20 22:25:28 +0100 | [diff] [blame] | 1453 | MigrationState *s = migrate_get_current(); |
| 1454 | |
Dr. David Alan Gilbert | 9ec055a | 2015-11-05 18:10:58 +0000 | [diff] [blame] | 1455 | return (s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE); |
| 1456 | } |
| 1457 | |
Dr. David Alan Gilbert | b82fc32 | 2016-02-22 17:17:32 +0000 | [diff] [blame] | 1458 | bool migration_in_postcopy_after_devices(MigrationState *s) |
| 1459 | { |
Juan Quintela | 5727309 | 2017-03-20 22:25:28 +0100 | [diff] [blame] | 1460 | return migration_in_postcopy() && s->postcopy_after_devices; |
Dr. David Alan Gilbert | b82fc32 | 2016-02-22 17:17:32 +0000 | [diff] [blame] | 1461 | } |
| 1462 | |
Juan Quintela | fab3500 | 2017-03-22 17:36:57 +0100 | [diff] [blame] | 1463 | bool migration_is_idle(void) |
Ashijeet Acharya | fe44dc9 | 2017-01-16 17:01:53 +0530 | [diff] [blame] | 1464 | { |
Juan Quintela | fab3500 | 2017-03-22 17:36:57 +0100 | [diff] [blame] | 1465 | MigrationState *s = migrate_get_current(); |
Ashijeet Acharya | fe44dc9 | 2017-01-16 17:01:53 +0530 | [diff] [blame] | 1466 | |
| 1467 | switch (s->state) { |
| 1468 | case MIGRATION_STATUS_NONE: |
| 1469 | case MIGRATION_STATUS_CANCELLED: |
| 1470 | case MIGRATION_STATUS_COMPLETED: |
| 1471 | case MIGRATION_STATUS_FAILED: |
| 1472 | return true; |
| 1473 | case MIGRATION_STATUS_SETUP: |
| 1474 | case MIGRATION_STATUS_CANCELLING: |
| 1475 | case MIGRATION_STATUS_ACTIVE: |
| 1476 | case MIGRATION_STATUS_POSTCOPY_ACTIVE: |
| 1477 | case MIGRATION_STATUS_COLO: |
Dr. David Alan Gilbert | 31e0607 | 2017-10-20 10:05:51 +0100 | [diff] [blame] | 1478 | case MIGRATION_STATUS_PRE_SWITCHOVER: |
| 1479 | case MIGRATION_STATUS_DEVICE: |
Ashijeet Acharya | fe44dc9 | 2017-01-16 17:01:53 +0530 | [diff] [blame] | 1480 | return false; |
| 1481 | case MIGRATION_STATUS__MAX: |
| 1482 | g_assert_not_reached(); |
| 1483 | } |
| 1484 | |
| 1485 | return false; |
| 1486 | } |
| 1487 | |
Peter Xu | 3e0c805 | 2018-02-08 18:31:15 +0800 | [diff] [blame] | 1488 | void migrate_init(MigrationState *s) |
Juan Quintela | 0edda1c | 2010-05-11 16:28:39 +0200 | [diff] [blame] | 1489 | { |
Dr. David Alan Gilbert | 389775d | 2015-11-12 15:38:27 +0000 | [diff] [blame] | 1490 | /* |
| 1491 | * Reinitialise all migration state, except |
| 1492 | * parameters/capabilities that the user set, and |
| 1493 | * locks. |
| 1494 | */ |
| 1495 | s->bytes_xfer = 0; |
| 1496 | s->xfer_limit = 0; |
| 1497 | s->cleanup_bh = 0; |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 1498 | s->to_dst_file = NULL; |
Dr. David Alan Gilbert | 389775d | 2015-11-12 15:38:27 +0000 | [diff] [blame] | 1499 | s->state = MIGRATION_STATUS_NONE; |
Dr. David Alan Gilbert | 389775d | 2015-11-12 15:38:27 +0000 | [diff] [blame] | 1500 | s->rp_state.from_dst_file = NULL; |
| 1501 | s->rp_state.error = false; |
| 1502 | s->mbps = 0.0; |
| 1503 | s->downtime = 0; |
| 1504 | s->expected_downtime = 0; |
Dr. David Alan Gilbert | 389775d | 2015-11-12 15:38:27 +0000 | [diff] [blame] | 1505 | s->setup_time = 0; |
Dr. David Alan Gilbert | 389775d | 2015-11-12 15:38:27 +0000 | [diff] [blame] | 1506 | s->start_postcopy = false; |
Dr. David Alan Gilbert | b82fc32 | 2016-02-22 17:17:32 +0000 | [diff] [blame] | 1507 | s->postcopy_after_devices = false; |
Dr. David Alan Gilbert | 389775d | 2015-11-12 15:38:27 +0000 | [diff] [blame] | 1508 | s->migration_thread_running = false; |
Daniel P. Berrange | d59ce6f | 2016-04-27 11:05:00 +0100 | [diff] [blame] | 1509 | error_free(s->error); |
| 1510 | s->error = NULL; |
Juan Quintela | 1299c63 | 2011-11-09 21:29:01 +0100 | [diff] [blame] | 1511 | |
zhanghailiang | 48781e5 | 2015-12-16 11:47:33 +0000 | [diff] [blame] | 1512 | migrate_set_state(&s->state, MIGRATION_STATUS_NONE, MIGRATION_STATUS_SETUP); |
Juan Quintela | 0edda1c | 2010-05-11 16:28:39 +0200 | [diff] [blame] | 1513 | |
Peter Xu | 4af246a | 2018-01-03 20:20:08 +0800 | [diff] [blame] | 1514 | s->start_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME); |
| 1515 | s->total_time = 0; |
Peter Xu | 7287cbd | 2018-01-03 20:20:09 +0800 | [diff] [blame] | 1516 | s->vm_was_running = false; |
Peter Xu | b15df1a | 2018-01-03 20:20:13 +0800 | [diff] [blame] | 1517 | s->iteration_initial_bytes = 0; |
| 1518 | s->threshold_size = 0; |
Juan Quintela | 0edda1c | 2010-05-11 16:28:39 +0200 | [diff] [blame] | 1519 | } |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1520 | |
Anthony Liguori | fa2756b | 2011-11-14 15:09:43 -0600 | [diff] [blame] | 1521 | static GSList *migration_blockers; |
| 1522 | |
Ashijeet Acharya | fe44dc9 | 2017-01-16 17:01:53 +0530 | [diff] [blame] | 1523 | int migrate_add_blocker(Error *reason, Error **errp) |
Anthony Liguori | fa2756b | 2011-11-14 15:09:43 -0600 | [diff] [blame] | 1524 | { |
Peter Xu | 3df663e | 2017-06-27 12:10:15 +0800 | [diff] [blame] | 1525 | if (migrate_get_current()->only_migratable) { |
Ashijeet Acharya | b67b8c3 | 2017-01-16 17:01:54 +0530 | [diff] [blame] | 1526 | error_propagate(errp, error_copy(reason)); |
| 1527 | error_prepend(errp, "disallowing migration blocker " |
| 1528 | "(--only_migratable) for: "); |
| 1529 | return -EACCES; |
| 1530 | } |
| 1531 | |
Juan Quintela | fab3500 | 2017-03-22 17:36:57 +0100 | [diff] [blame] | 1532 | if (migration_is_idle()) { |
Ashijeet Acharya | fe44dc9 | 2017-01-16 17:01:53 +0530 | [diff] [blame] | 1533 | migration_blockers = g_slist_prepend(migration_blockers, reason); |
| 1534 | return 0; |
| 1535 | } |
| 1536 | |
| 1537 | error_propagate(errp, error_copy(reason)); |
| 1538 | error_prepend(errp, "disallowing migration blocker (migration in " |
| 1539 | "progress) for: "); |
| 1540 | return -EBUSY; |
Anthony Liguori | fa2756b | 2011-11-14 15:09:43 -0600 | [diff] [blame] | 1541 | } |
| 1542 | |
| 1543 | void migrate_del_blocker(Error *reason) |
| 1544 | { |
| 1545 | migration_blockers = g_slist_remove(migration_blockers, reason); |
| 1546 | } |
| 1547 | |
Dr. David Alan Gilbert | bf1ae1f | 2015-02-19 11:40:28 +0000 | [diff] [blame] | 1548 | void qmp_migrate_incoming(const char *uri, Error **errp) |
| 1549 | { |
| 1550 | Error *local_err = NULL; |
Dr. David Alan Gilbert | 4debb5f | 2015-02-26 14:54:41 +0000 | [diff] [blame] | 1551 | static bool once = true; |
Dr. David Alan Gilbert | bf1ae1f | 2015-02-19 11:40:28 +0000 | [diff] [blame] | 1552 | |
| 1553 | if (!deferred_incoming) { |
Dr. David Alan Gilbert | 4debb5f | 2015-02-26 14:54:41 +0000 | [diff] [blame] | 1554 | error_setg(errp, "For use with '-incoming defer'"); |
Dr. David Alan Gilbert | bf1ae1f | 2015-02-19 11:40:28 +0000 | [diff] [blame] | 1555 | return; |
| 1556 | } |
Dr. David Alan Gilbert | 4debb5f | 2015-02-26 14:54:41 +0000 | [diff] [blame] | 1557 | if (!once) { |
| 1558 | error_setg(errp, "The incoming migration has already been started"); |
| 1559 | } |
Dr. David Alan Gilbert | bf1ae1f | 2015-02-19 11:40:28 +0000 | [diff] [blame] | 1560 | |
| 1561 | qemu_start_incoming_migration(uri, &local_err); |
| 1562 | |
| 1563 | if (local_err) { |
| 1564 | error_propagate(errp, local_err); |
| 1565 | return; |
| 1566 | } |
| 1567 | |
Dr. David Alan Gilbert | 4debb5f | 2015-02-26 14:54:41 +0000 | [diff] [blame] | 1568 | once = false; |
Dr. David Alan Gilbert | bf1ae1f | 2015-02-19 11:40:28 +0000 | [diff] [blame] | 1569 | } |
| 1570 | |
Peter Xu | 02affd4 | 2018-05-02 18:47:36 +0800 | [diff] [blame] | 1571 | void qmp_migrate_recover(const char *uri, Error **errp) |
| 1572 | { |
| 1573 | MigrationIncomingState *mis = migration_incoming_get_current(); |
| 1574 | |
| 1575 | if (mis->state != MIGRATION_STATUS_POSTCOPY_PAUSED) { |
| 1576 | error_setg(errp, "Migrate recover can only be run " |
| 1577 | "when postcopy is paused."); |
| 1578 | return; |
| 1579 | } |
| 1580 | |
| 1581 | if (atomic_cmpxchg(&mis->postcopy_recover_triggered, |
| 1582 | false, true) == true) { |
| 1583 | error_setg(errp, "Migrate recovery is triggered already"); |
| 1584 | return; |
| 1585 | } |
| 1586 | |
| 1587 | /* |
| 1588 | * Note that this call will never start a real migration; it will |
| 1589 | * only re-setup the migration stream and poke existing migration |
| 1590 | * to continue using that newly established channel. |
| 1591 | */ |
| 1592 | qemu_start_incoming_migration(uri, errp); |
| 1593 | } |
| 1594 | |
Peter Xu | bfbf89c | 2018-05-02 18:47:39 +0800 | [diff] [blame] | 1595 | void qmp_migrate_pause(Error **errp) |
| 1596 | { |
| 1597 | MigrationState *ms = migrate_get_current(); |
| 1598 | MigrationIncomingState *mis = migration_incoming_get_current(); |
| 1599 | int ret; |
| 1600 | |
| 1601 | if (ms->state == MIGRATION_STATUS_POSTCOPY_ACTIVE) { |
| 1602 | /* Source side, during postcopy */ |
| 1603 | qemu_mutex_lock(&ms->qemu_file_lock); |
| 1604 | ret = qemu_file_shutdown(ms->to_dst_file); |
| 1605 | qemu_mutex_unlock(&ms->qemu_file_lock); |
| 1606 | if (ret) { |
| 1607 | error_setg(errp, "Failed to pause source migration"); |
| 1608 | } |
| 1609 | return; |
| 1610 | } |
| 1611 | |
| 1612 | if (mis->state == MIGRATION_STATUS_POSTCOPY_ACTIVE) { |
| 1613 | ret = qemu_file_shutdown(mis->from_src_file); |
| 1614 | if (ret) { |
| 1615 | error_setg(errp, "Failed to pause destination migration"); |
| 1616 | } |
| 1617 | return; |
| 1618 | } |
| 1619 | |
| 1620 | error_setg(errp, "migrate-pause is currently only supported " |
| 1621 | "during postcopy-active state"); |
| 1622 | } |
| 1623 | |
Greg Kurz | 24f3902 | 2016-05-04 21:44:19 +0200 | [diff] [blame] | 1624 | bool migration_is_blocked(Error **errp) |
| 1625 | { |
| 1626 | if (qemu_savevm_state_blocked(errp)) { |
| 1627 | return true; |
| 1628 | } |
| 1629 | |
| 1630 | if (migration_blockers) { |
Eduardo Habkost | 250561e | 2017-06-08 10:39:05 -0300 | [diff] [blame] | 1631 | error_propagate(errp, error_copy(migration_blockers->data)); |
Greg Kurz | 24f3902 | 2016-05-04 21:44:19 +0200 | [diff] [blame] | 1632 | return true; |
| 1633 | } |
| 1634 | |
| 1635 | return false; |
| 1636 | } |
| 1637 | |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 1638 | /* Returns true if continue to migrate, or false if error detected */ |
| 1639 | static bool migrate_prepare(MigrationState *s, bool blk, bool blk_inc, |
| 1640 | bool resume, Error **errp) |
| 1641 | { |
| 1642 | Error *local_err = NULL; |
| 1643 | |
| 1644 | if (resume) { |
| 1645 | if (s->state != MIGRATION_STATUS_POSTCOPY_PAUSED) { |
| 1646 | error_setg(errp, "Cannot resume if there is no " |
| 1647 | "paused migration"); |
| 1648 | return false; |
| 1649 | } |
Peter Xu | 97ca211 | 2018-07-23 20:33:03 +0800 | [diff] [blame] | 1650 | |
| 1651 | /* |
| 1652 | * Postcopy recovery won't work well with release-ram |
| 1653 | * capability since release-ram will drop the page buffer as |
| 1654 | * long as the page is put into the send buffer. So if there |
| 1655 | * is a network failure happened, any page buffers that have |
| 1656 | * not yet reached the destination VM but have already been |
| 1657 | * sent from the source VM will be lost forever. Let's refuse |
| 1658 | * the client from resuming such a postcopy migration. |
| 1659 | * Luckily release-ram was designed to only be used when src |
| 1660 | * and destination VMs are on the same host, so it should be |
| 1661 | * fine. |
| 1662 | */ |
| 1663 | if (migrate_release_ram()) { |
| 1664 | error_setg(errp, "Postcopy recovery cannot work " |
| 1665 | "when release-ram capability is set"); |
| 1666 | return false; |
| 1667 | } |
| 1668 | |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 1669 | /* This is a resume, skip init status */ |
| 1670 | return true; |
| 1671 | } |
| 1672 | |
| 1673 | if (migration_is_setup_or_active(s->state) || |
| 1674 | s->state == MIGRATION_STATUS_CANCELLING || |
| 1675 | s->state == MIGRATION_STATUS_COLO) { |
| 1676 | error_setg(errp, QERR_MIGRATION_ACTIVE); |
| 1677 | return false; |
| 1678 | } |
| 1679 | |
| 1680 | if (runstate_check(RUN_STATE_INMIGRATE)) { |
| 1681 | error_setg(errp, "Guest is waiting for an incoming migration"); |
| 1682 | return false; |
| 1683 | } |
| 1684 | |
| 1685 | if (migration_is_blocked(errp)) { |
| 1686 | return false; |
| 1687 | } |
| 1688 | |
| 1689 | if (blk || blk_inc) { |
| 1690 | if (migrate_use_block() || migrate_use_block_incremental()) { |
| 1691 | error_setg(errp, "Command options are incompatible with " |
| 1692 | "current migration capabilities"); |
| 1693 | return false; |
| 1694 | } |
| 1695 | migrate_set_block_enabled(true, &local_err); |
| 1696 | if (local_err) { |
| 1697 | error_propagate(errp, local_err); |
| 1698 | return false; |
| 1699 | } |
| 1700 | s->must_remove_block_options = true; |
| 1701 | } |
| 1702 | |
| 1703 | if (blk_inc) { |
| 1704 | migrate_set_block_incremental(s, true); |
| 1705 | } |
| 1706 | |
| 1707 | migrate_init(s); |
| 1708 | |
| 1709 | return true; |
| 1710 | } |
| 1711 | |
Luiz Capitulino | e1c37d0 | 2011-12-05 14:48:01 -0200 | [diff] [blame] | 1712 | void qmp_migrate(const char *uri, bool has_blk, bool blk, |
| 1713 | bool has_inc, bool inc, bool has_detach, bool detach, |
Peter Xu | 7a4da28 | 2018-05-02 18:47:23 +0800 | [diff] [blame] | 1714 | bool has_resume, bool resume, Error **errp) |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1715 | { |
Paolo Bonzini | be7059c | 2012-10-03 14:34:33 +0200 | [diff] [blame] | 1716 | Error *local_err = NULL; |
Juan Quintela | 17549e8 | 2011-10-05 13:50:43 +0200 | [diff] [blame] | 1717 | MigrationState *s = migrate_get_current(); |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1718 | const char *p; |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1719 | |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 1720 | if (!migrate_prepare(s, has_blk && blk, has_inc && inc, |
| 1721 | has_resume && resume, errp)) { |
| 1722 | /* Error detected, put into errp */ |
Luiz Capitulino | e1c37d0 | 2011-12-05 14:48:01 -0200 | [diff] [blame] | 1723 | return; |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1724 | } |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1725 | |
| 1726 | if (strstart(uri, "tcp:", &p)) { |
Paolo Bonzini | f37afb5 | 2012-10-02 10:02:46 +0200 | [diff] [blame] | 1727 | tcp_start_outgoing_migration(s, p, &local_err); |
Michael R. Hines | 2da776d | 2013-07-22 10:01:54 -0400 | [diff] [blame] | 1728 | #ifdef CONFIG_RDMA |
Michael R. Hines | 41310c6 | 2013-12-19 04:52:01 +0800 | [diff] [blame] | 1729 | } else if (strstart(uri, "rdma:", &p)) { |
Michael R. Hines | 2da776d | 2013-07-22 10:01:54 -0400 | [diff] [blame] | 1730 | rdma_start_outgoing_migration(s, p, &local_err); |
| 1731 | #endif |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1732 | } else if (strstart(uri, "exec:", &p)) { |
Paolo Bonzini | f37afb5 | 2012-10-02 10:02:46 +0200 | [diff] [blame] | 1733 | exec_start_outgoing_migration(s, p, &local_err); |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1734 | } else if (strstart(uri, "unix:", &p)) { |
Paolo Bonzini | f37afb5 | 2012-10-02 10:02:46 +0200 | [diff] [blame] | 1735 | unix_start_outgoing_migration(s, p, &local_err); |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1736 | } else if (strstart(uri, "fd:", &p)) { |
Paolo Bonzini | f37afb5 | 2012-10-02 10:02:46 +0200 | [diff] [blame] | 1737 | fd_start_outgoing_migration(s, p, &local_err); |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1738 | } else { |
Markus Armbruster | c6bd8c7 | 2015-03-17 11:54:50 +0100 | [diff] [blame] | 1739 | error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "uri", |
| 1740 | "a valid migration protocol"); |
zhanghailiang | 48781e5 | 2015-12-16 11:47:33 +0000 | [diff] [blame] | 1741 | migrate_set_state(&s->state, MIGRATION_STATUS_SETUP, |
| 1742 | MIGRATION_STATUS_FAILED); |
Dr. David Alan Gilbert | 09576e7 | 2018-03-16 20:21:14 +0000 | [diff] [blame] | 1743 | block_cleanup_parameters(s); |
Luiz Capitulino | e1c37d0 | 2011-12-05 14:48:01 -0200 | [diff] [blame] | 1744 | return; |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1745 | } |
| 1746 | |
Paolo Bonzini | f37afb5 | 2012-10-02 10:02:46 +0200 | [diff] [blame] | 1747 | if (local_err) { |
Daniel P. Berrange | d59ce6f | 2016-04-27 11:05:00 +0100 | [diff] [blame] | 1748 | migrate_fd_error(s, local_err); |
Paolo Bonzini | f37afb5 | 2012-10-02 10:02:46 +0200 | [diff] [blame] | 1749 | error_propagate(errp, local_err); |
Luiz Capitulino | e1c37d0 | 2011-12-05 14:48:01 -0200 | [diff] [blame] | 1750 | return; |
Juan Quintela | 1299c63 | 2011-11-09 21:29:01 +0100 | [diff] [blame] | 1751 | } |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1752 | } |
| 1753 | |
Luiz Capitulino | 6cdedb0 | 2011-11-27 22:54:09 -0200 | [diff] [blame] | 1754 | void qmp_migrate_cancel(Error **errp) |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1755 | { |
Juan Quintela | 17549e8 | 2011-10-05 13:50:43 +0200 | [diff] [blame] | 1756 | migrate_fd_cancel(migrate_get_current()); |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1757 | } |
| 1758 | |
Dr. David Alan Gilbert | 89cfc02 | 2017-10-20 10:05:53 +0100 | [diff] [blame] | 1759 | void qmp_migrate_continue(MigrationStatus state, Error **errp) |
| 1760 | { |
| 1761 | MigrationState *s = migrate_get_current(); |
| 1762 | if (s->state != state) { |
| 1763 | error_setg(errp, "Migration not in expected state: %s", |
| 1764 | MigrationStatus_str(s->state)); |
| 1765 | return; |
| 1766 | } |
| 1767 | qemu_sem_post(&s->pause_sem); |
| 1768 | } |
| 1769 | |
Orit Wasserman | 9e1ba4c | 2012-08-06 21:42:54 +0300 | [diff] [blame] | 1770 | void qmp_migrate_set_cache_size(int64_t value, Error **errp) |
| 1771 | { |
Juan Quintela | 73af8dd | 2017-10-05 21:30:10 +0200 | [diff] [blame] | 1772 | MigrateSetParameters p = { |
| 1773 | .has_xbzrle_cache_size = true, |
| 1774 | .xbzrle_cache_size = value, |
| 1775 | }; |
Orit Wasserman | 9e1ba4c | 2012-08-06 21:42:54 +0300 | [diff] [blame] | 1776 | |
Juan Quintela | 73af8dd | 2017-10-05 21:30:10 +0200 | [diff] [blame] | 1777 | qmp_migrate_set_parameters(&p, errp); |
Orit Wasserman | 9e1ba4c | 2012-08-06 21:42:54 +0300 | [diff] [blame] | 1778 | } |
| 1779 | |
| 1780 | int64_t qmp_query_migrate_cache_size(Error **errp) |
| 1781 | { |
| 1782 | return migrate_xbzrle_cache_size(); |
| 1783 | } |
| 1784 | |
Luiz Capitulino | 3dc8538 | 2011-11-28 11:59:37 -0200 | [diff] [blame] | 1785 | void qmp_migrate_set_speed(int64_t value, Error **errp) |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1786 | { |
Markus Armbruster | 1bda8b3 | 2017-07-18 13:42:11 +0200 | [diff] [blame] | 1787 | MigrateSetParameters p = { |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 1788 | .has_max_bandwidth = true, |
| 1789 | .max_bandwidth = value, |
| 1790 | }; |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1791 | |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 1792 | qmp_migrate_set_parameters(&p, errp); |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1793 | } |
| 1794 | |
Luiz Capitulino | 4f0a993 | 2011-11-27 23:18:01 -0200 | [diff] [blame] | 1795 | void qmp_migrate_set_downtime(double value, Error **errp) |
Juan Quintela | cab3014 | 2011-02-22 23:54:21 +0100 | [diff] [blame] | 1796 | { |
Daniel Henrique Barboza | 87c9cc1 | 2017-02-22 12:17:29 -0300 | [diff] [blame] | 1797 | if (value < 0 || value > MAX_MIGRATE_DOWNTIME_SECONDS) { |
| 1798 | error_setg(errp, "Parameter 'downtime_limit' expects an integer in " |
| 1799 | "the range of 0 to %d seconds", |
| 1800 | MAX_MIGRATE_DOWNTIME_SECONDS); |
| 1801 | return; |
| 1802 | } |
| 1803 | |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 1804 | value *= 1000; /* Convert to milliseconds */ |
| 1805 | value = MAX(0, MIN(INT64_MAX, value)); |
| 1806 | |
Markus Armbruster | 1bda8b3 | 2017-07-18 13:42:11 +0200 | [diff] [blame] | 1807 | MigrateSetParameters p = { |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 1808 | .has_downtime_limit = true, |
| 1809 | .downtime_limit = value, |
| 1810 | }; |
| 1811 | |
| 1812 | qmp_migrate_set_parameters(&p, errp); |
aliguori | 5bb7910 | 2008-10-13 03:12:02 +0000 | [diff] [blame] | 1813 | } |
Orit Wasserman | 17ad9b3 | 2012-08-06 21:42:53 +0300 | [diff] [blame] | 1814 | |
Pavel Butsykin | 53f09a1 | 2017-02-03 18:23:20 +0300 | [diff] [blame] | 1815 | bool migrate_release_ram(void) |
| 1816 | { |
| 1817 | MigrationState *s; |
| 1818 | |
| 1819 | s = migrate_get_current(); |
| 1820 | |
| 1821 | return s->enabled_capabilities[MIGRATION_CAPABILITY_RELEASE_RAM]; |
| 1822 | } |
| 1823 | |
Dr. David Alan Gilbert | 53dd370 | 2015-11-05 18:10:51 +0000 | [diff] [blame] | 1824 | bool migrate_postcopy_ram(void) |
| 1825 | { |
| 1826 | MigrationState *s; |
| 1827 | |
| 1828 | s = migrate_get_current(); |
| 1829 | |
Dr. David Alan Gilbert | 32c3db5 | 2016-03-11 09:53:36 +0000 | [diff] [blame] | 1830 | return s->enabled_capabilities[MIGRATION_CAPABILITY_POSTCOPY_RAM]; |
Dr. David Alan Gilbert | 53dd370 | 2015-11-05 18:10:51 +0000 | [diff] [blame] | 1831 | } |
| 1832 | |
Vladimir Sementsov-Ogievskiy | 58110f0 | 2017-07-10 19:30:16 +0300 | [diff] [blame] | 1833 | bool migrate_postcopy(void) |
| 1834 | { |
Vladimir Sementsov-Ogievskiy | dd6bb91 | 2018-03-13 15:34:00 -0400 | [diff] [blame] | 1835 | return migrate_postcopy_ram() || migrate_dirty_bitmaps(); |
Vladimir Sementsov-Ogievskiy | 58110f0 | 2017-07-10 19:30:16 +0300 | [diff] [blame] | 1836 | } |
| 1837 | |
Chegu Vinod | bde1e2e | 2013-06-24 03:49:42 -0600 | [diff] [blame] | 1838 | bool migrate_auto_converge(void) |
| 1839 | { |
| 1840 | MigrationState *s; |
| 1841 | |
| 1842 | s = migrate_get_current(); |
| 1843 | |
| 1844 | return s->enabled_capabilities[MIGRATION_CAPABILITY_AUTO_CONVERGE]; |
| 1845 | } |
| 1846 | |
Peter Lieven | 323004a | 2013-07-18 09:48:50 +0200 | [diff] [blame] | 1847 | bool migrate_zero_blocks(void) |
| 1848 | { |
| 1849 | MigrationState *s; |
| 1850 | |
| 1851 | s = migrate_get_current(); |
| 1852 | |
| 1853 | return s->enabled_capabilities[MIGRATION_CAPABILITY_ZERO_BLOCKS]; |
| 1854 | } |
| 1855 | |
Alexey Perevalov | f22f928 | 2018-03-22 21:17:22 +0300 | [diff] [blame] | 1856 | bool migrate_postcopy_blocktime(void) |
| 1857 | { |
| 1858 | MigrationState *s; |
| 1859 | |
| 1860 | s = migrate_get_current(); |
| 1861 | |
| 1862 | return s->enabled_capabilities[MIGRATION_CAPABILITY_POSTCOPY_BLOCKTIME]; |
| 1863 | } |
| 1864 | |
Liang Li | 8706d2d | 2015-03-23 16:32:17 +0800 | [diff] [blame] | 1865 | bool migrate_use_compression(void) |
| 1866 | { |
Liang Li | dde4e69 | 2015-03-23 16:32:26 +0800 | [diff] [blame] | 1867 | MigrationState *s; |
| 1868 | |
| 1869 | s = migrate_get_current(); |
| 1870 | |
| 1871 | return s->enabled_capabilities[MIGRATION_CAPABILITY_COMPRESS]; |
Liang Li | 8706d2d | 2015-03-23 16:32:17 +0800 | [diff] [blame] | 1872 | } |
| 1873 | |
| 1874 | int migrate_compress_level(void) |
| 1875 | { |
| 1876 | MigrationState *s; |
| 1877 | |
| 1878 | s = migrate_get_current(); |
| 1879 | |
Daniel P. Berrange | 2594f56 | 2016-04-27 11:05:14 +0100 | [diff] [blame] | 1880 | return s->parameters.compress_level; |
Liang Li | 8706d2d | 2015-03-23 16:32:17 +0800 | [diff] [blame] | 1881 | } |
| 1882 | |
| 1883 | int migrate_compress_threads(void) |
| 1884 | { |
| 1885 | MigrationState *s; |
| 1886 | |
| 1887 | s = migrate_get_current(); |
| 1888 | |
Daniel P. Berrange | 2594f56 | 2016-04-27 11:05:14 +0100 | [diff] [blame] | 1889 | return s->parameters.compress_threads; |
Liang Li | 8706d2d | 2015-03-23 16:32:17 +0800 | [diff] [blame] | 1890 | } |
| 1891 | |
Liang Li | 3fcb38c | 2015-03-23 16:32:18 +0800 | [diff] [blame] | 1892 | int migrate_decompress_threads(void) |
| 1893 | { |
| 1894 | MigrationState *s; |
| 1895 | |
| 1896 | s = migrate_get_current(); |
| 1897 | |
Daniel P. Berrange | 2594f56 | 2016-04-27 11:05:14 +0100 | [diff] [blame] | 1898 | return s->parameters.decompress_threads; |
Liang Li | 3fcb38c | 2015-03-23 16:32:18 +0800 | [diff] [blame] | 1899 | } |
| 1900 | |
Vladimir Sementsov-Ogievskiy | 55efc8c | 2018-03-13 15:34:00 -0400 | [diff] [blame] | 1901 | bool migrate_dirty_bitmaps(void) |
| 1902 | { |
| 1903 | MigrationState *s; |
| 1904 | |
| 1905 | s = migrate_get_current(); |
| 1906 | |
| 1907 | return s->enabled_capabilities[MIGRATION_CAPABILITY_DIRTY_BITMAPS]; |
| 1908 | } |
| 1909 | |
Juan Quintela | b05dc72 | 2015-07-07 14:44:05 +0200 | [diff] [blame] | 1910 | bool migrate_use_events(void) |
| 1911 | { |
| 1912 | MigrationState *s; |
| 1913 | |
| 1914 | s = migrate_get_current(); |
| 1915 | |
| 1916 | return s->enabled_capabilities[MIGRATION_CAPABILITY_EVENTS]; |
| 1917 | } |
| 1918 | |
Juan Quintela | 30126bb | 2016-01-14 12:23:00 +0100 | [diff] [blame] | 1919 | bool migrate_use_multifd(void) |
| 1920 | { |
| 1921 | MigrationState *s; |
| 1922 | |
| 1923 | s = migrate_get_current(); |
| 1924 | |
| 1925 | return s->enabled_capabilities[MIGRATION_CAPABILITY_X_MULTIFD]; |
| 1926 | } |
| 1927 | |
Dr. David Alan Gilbert | 93fbd03 | 2017-10-20 10:05:50 +0100 | [diff] [blame] | 1928 | bool migrate_pause_before_switchover(void) |
| 1929 | { |
| 1930 | MigrationState *s; |
| 1931 | |
| 1932 | s = migrate_get_current(); |
| 1933 | |
| 1934 | return s->enabled_capabilities[ |
| 1935 | MIGRATION_CAPABILITY_PAUSE_BEFORE_SWITCHOVER]; |
| 1936 | } |
| 1937 | |
Juan Quintela | 4075fb1 | 2016-01-15 08:56:17 +0100 | [diff] [blame] | 1938 | int migrate_multifd_channels(void) |
| 1939 | { |
| 1940 | MigrationState *s; |
| 1941 | |
| 1942 | s = migrate_get_current(); |
| 1943 | |
| 1944 | return s->parameters.x_multifd_channels; |
| 1945 | } |
| 1946 | |
Juan Quintela | 0fb8660 | 2017-04-27 10:48:25 +0200 | [diff] [blame] | 1947 | int migrate_multifd_page_count(void) |
| 1948 | { |
| 1949 | MigrationState *s; |
| 1950 | |
| 1951 | s = migrate_get_current(); |
| 1952 | |
| 1953 | return s->parameters.x_multifd_page_count; |
| 1954 | } |
| 1955 | |
Orit Wasserman | 17ad9b3 | 2012-08-06 21:42:53 +0300 | [diff] [blame] | 1956 | int migrate_use_xbzrle(void) |
| 1957 | { |
| 1958 | MigrationState *s; |
| 1959 | |
| 1960 | s = migrate_get_current(); |
| 1961 | |
| 1962 | return s->enabled_capabilities[MIGRATION_CAPABILITY_XBZRLE]; |
| 1963 | } |
| 1964 | |
| 1965 | int64_t migrate_xbzrle_cache_size(void) |
| 1966 | { |
| 1967 | MigrationState *s; |
| 1968 | |
| 1969 | s = migrate_get_current(); |
| 1970 | |
Juan Quintela | 73af8dd | 2017-10-05 21:30:10 +0200 | [diff] [blame] | 1971 | return s->parameters.xbzrle_cache_size; |
Orit Wasserman | 17ad9b3 | 2012-08-06 21:42:53 +0300 | [diff] [blame] | 1972 | } |
Juan Quintela | 0d82d0e | 2012-10-03 14:18:33 +0200 | [diff] [blame] | 1973 | |
Dr. David Alan Gilbert | 7e555c6 | 2018-06-13 11:26:40 +0100 | [diff] [blame] | 1974 | static int64_t migrate_max_postcopy_bandwidth(void) |
| 1975 | { |
| 1976 | MigrationState *s; |
| 1977 | |
| 1978 | s = migrate_get_current(); |
| 1979 | |
| 1980 | return s->parameters.max_postcopy_bandwidth; |
| 1981 | } |
| 1982 | |
Juan Quintela | 2833c59 | 2017-04-05 18:32:37 +0200 | [diff] [blame] | 1983 | bool migrate_use_block(void) |
| 1984 | { |
| 1985 | MigrationState *s; |
| 1986 | |
| 1987 | s = migrate_get_current(); |
| 1988 | |
| 1989 | return s->enabled_capabilities[MIGRATION_CAPABILITY_BLOCK]; |
| 1990 | } |
| 1991 | |
Peter Xu | c788ada | 2017-06-26 18:28:55 +0800 | [diff] [blame] | 1992 | bool migrate_use_return_path(void) |
| 1993 | { |
| 1994 | MigrationState *s; |
| 1995 | |
| 1996 | s = migrate_get_current(); |
| 1997 | |
| 1998 | return s->enabled_capabilities[MIGRATION_CAPABILITY_RETURN_PATH]; |
| 1999 | } |
| 2000 | |
Juan Quintela | 2833c59 | 2017-04-05 18:32:37 +0200 | [diff] [blame] | 2001 | bool migrate_use_block_incremental(void) |
| 2002 | { |
| 2003 | MigrationState *s; |
| 2004 | |
| 2005 | s = migrate_get_current(); |
| 2006 | |
| 2007 | return s->parameters.block_incremental; |
| 2008 | } |
| 2009 | |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2010 | /* migration thread support */ |
| 2011 | /* |
| 2012 | * Something bad happened to the RP stream, mark an error |
| 2013 | * The caller shall print or trace something to indicate why |
| 2014 | */ |
| 2015 | static void mark_source_rp_bad(MigrationState *s) |
| 2016 | { |
| 2017 | s->rp_state.error = true; |
| 2018 | } |
| 2019 | |
| 2020 | static struct rp_cmd_args { |
| 2021 | ssize_t len; /* -1 = variable */ |
| 2022 | const char *name; |
| 2023 | } rp_cmd_args[] = { |
| 2024 | [MIG_RP_MSG_INVALID] = { .len = -1, .name = "INVALID" }, |
| 2025 | [MIG_RP_MSG_SHUT] = { .len = 4, .name = "SHUT" }, |
| 2026 | [MIG_RP_MSG_PONG] = { .len = 4, .name = "PONG" }, |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 2027 | [MIG_RP_MSG_REQ_PAGES] = { .len = 12, .name = "REQ_PAGES" }, |
| 2028 | [MIG_RP_MSG_REQ_PAGES_ID] = { .len = -1, .name = "REQ_PAGES_ID" }, |
Peter Xu | a335deb | 2018-05-02 18:47:28 +0800 | [diff] [blame] | 2029 | [MIG_RP_MSG_RECV_BITMAP] = { .len = -1, .name = "RECV_BITMAP" }, |
Peter Xu | 13955b8 | 2018-05-02 18:47:30 +0800 | [diff] [blame] | 2030 | [MIG_RP_MSG_RESUME_ACK] = { .len = 4, .name = "RESUME_ACK" }, |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2031 | [MIG_RP_MSG_MAX] = { .len = -1, .name = "MAX" }, |
| 2032 | }; |
| 2033 | |
| 2034 | /* |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 2035 | * Process a request for pages received on the return path, |
| 2036 | * We're allowed to send more than requested (e.g. to round to our page size) |
| 2037 | * and we don't need to send pages that have already been sent. |
| 2038 | */ |
| 2039 | static void migrate_handle_rp_req_pages(MigrationState *ms, const char* rbname, |
| 2040 | ram_addr_t start, size_t len) |
| 2041 | { |
Dr. David Alan Gilbert | 6c595cd | 2015-11-05 18:11:08 +0000 | [diff] [blame] | 2042 | long our_host_ps = getpagesize(); |
| 2043 | |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 2044 | trace_migrate_handle_rp_req_pages(rbname, start, len); |
Dr. David Alan Gilbert | 6c595cd | 2015-11-05 18:11:08 +0000 | [diff] [blame] | 2045 | |
| 2046 | /* |
| 2047 | * Since we currently insist on matching page sizes, just sanity check |
| 2048 | * we're being asked for whole host pages. |
| 2049 | */ |
| 2050 | if (start & (our_host_ps-1) || |
| 2051 | (len & (our_host_ps-1))) { |
| 2052 | error_report("%s: Misaligned page request, start: " RAM_ADDR_FMT |
| 2053 | " len: %zd", __func__, start, len); |
| 2054 | mark_source_rp_bad(ms); |
| 2055 | return; |
| 2056 | } |
| 2057 | |
Juan Quintela | 9650689 | 2017-03-14 18:41:03 +0100 | [diff] [blame] | 2058 | if (ram_save_queue_pages(rbname, start, len)) { |
Dr. David Alan Gilbert | 6c595cd | 2015-11-05 18:11:08 +0000 | [diff] [blame] | 2059 | mark_source_rp_bad(ms); |
| 2060 | } |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 2061 | } |
| 2062 | |
Peter Xu | 14b1742 | 2018-05-02 18:47:21 +0800 | [diff] [blame] | 2063 | /* Return true to retry, false to quit */ |
| 2064 | static bool postcopy_pause_return_path_thread(MigrationState *s) |
| 2065 | { |
| 2066 | trace_postcopy_pause_return_path(); |
| 2067 | |
| 2068 | qemu_sem_wait(&s->postcopy_pause_rp_sem); |
| 2069 | |
| 2070 | trace_postcopy_pause_return_path_continued(); |
| 2071 | |
| 2072 | return true; |
| 2073 | } |
| 2074 | |
Peter Xu | a335deb | 2018-05-02 18:47:28 +0800 | [diff] [blame] | 2075 | static int migrate_handle_rp_recv_bitmap(MigrationState *s, char *block_name) |
| 2076 | { |
| 2077 | RAMBlock *block = qemu_ram_block_by_name(block_name); |
| 2078 | |
| 2079 | if (!block) { |
| 2080 | error_report("%s: invalid block name '%s'", __func__, block_name); |
| 2081 | return -EINVAL; |
| 2082 | } |
| 2083 | |
| 2084 | /* Fetch the received bitmap and refresh the dirty bitmap */ |
| 2085 | return ram_dirty_bitmap_reload(s, block); |
| 2086 | } |
| 2087 | |
Peter Xu | 13955b8 | 2018-05-02 18:47:30 +0800 | [diff] [blame] | 2088 | static int migrate_handle_rp_resume_ack(MigrationState *s, uint32_t value) |
| 2089 | { |
| 2090 | trace_source_return_path_thread_resume_ack(value); |
| 2091 | |
| 2092 | if (value != MIGRATION_RESUME_ACK_VALUE) { |
| 2093 | error_report("%s: illegal resume_ack value %"PRIu32, |
| 2094 | __func__, value); |
| 2095 | return -1; |
| 2096 | } |
| 2097 | |
| 2098 | /* Now both sides are active. */ |
| 2099 | migrate_set_state(&s->state, MIGRATION_STATUS_POSTCOPY_RECOVER, |
| 2100 | MIGRATION_STATUS_POSTCOPY_ACTIVE); |
| 2101 | |
Peter Xu | 9419069 | 2018-05-02 18:47:34 +0800 | [diff] [blame] | 2102 | /* Notify send thread that time to continue send pages */ |
| 2103 | qemu_sem_post(&s->rp_state.rp_sem); |
Peter Xu | 13955b8 | 2018-05-02 18:47:30 +0800 | [diff] [blame] | 2104 | |
| 2105 | return 0; |
| 2106 | } |
| 2107 | |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 2108 | /* |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2109 | * Handles messages sent on the return path towards the source VM |
| 2110 | * |
| 2111 | */ |
| 2112 | static void *source_return_path_thread(void *opaque) |
| 2113 | { |
| 2114 | MigrationState *ms = opaque; |
| 2115 | QEMUFile *rp = ms->rp_state.from_dst_file; |
| 2116 | uint16_t header_len, header_type; |
Peter Xu | 568b01c | 2016-03-09 14:12:12 +0800 | [diff] [blame] | 2117 | uint8_t buf[512]; |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2118 | uint32_t tmp32, sibling_error; |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 2119 | ram_addr_t start = 0; /* =0 to silence warning */ |
| 2120 | size_t len = 0, expected_len; |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2121 | int res; |
| 2122 | |
| 2123 | trace_source_return_path_thread_entry(); |
Lidong Chen | 74637e6 | 2018-08-06 21:29:29 +0800 | [diff] [blame^] | 2124 | rcu_register_thread(); |
Peter Xu | 14b1742 | 2018-05-02 18:47:21 +0800 | [diff] [blame] | 2125 | |
| 2126 | retry: |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2127 | while (!ms->rp_state.error && !qemu_file_get_error(rp) && |
| 2128 | migration_is_setup_or_active(ms->state)) { |
| 2129 | trace_source_return_path_thread_loop_top(); |
| 2130 | header_type = qemu_get_be16(rp); |
| 2131 | header_len = qemu_get_be16(rp); |
| 2132 | |
Peter Xu | 7a9ddfb | 2018-02-08 18:31:05 +0800 | [diff] [blame] | 2133 | if (qemu_file_get_error(rp)) { |
| 2134 | mark_source_rp_bad(ms); |
| 2135 | goto out; |
| 2136 | } |
| 2137 | |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2138 | if (header_type >= MIG_RP_MSG_MAX || |
| 2139 | header_type == MIG_RP_MSG_INVALID) { |
| 2140 | error_report("RP: Received invalid message 0x%04x length 0x%04x", |
| 2141 | header_type, header_len); |
| 2142 | mark_source_rp_bad(ms); |
| 2143 | goto out; |
| 2144 | } |
| 2145 | |
| 2146 | if ((rp_cmd_args[header_type].len != -1 && |
| 2147 | header_len != rp_cmd_args[header_type].len) || |
Peter Xu | 568b01c | 2016-03-09 14:12:12 +0800 | [diff] [blame] | 2148 | header_len > sizeof(buf)) { |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2149 | error_report("RP: Received '%s' message (0x%04x) with" |
| 2150 | "incorrect length %d expecting %zu", |
| 2151 | rp_cmd_args[header_type].name, header_type, header_len, |
| 2152 | (size_t)rp_cmd_args[header_type].len); |
| 2153 | mark_source_rp_bad(ms); |
| 2154 | goto out; |
| 2155 | } |
| 2156 | |
| 2157 | /* We know we've got a valid header by this point */ |
| 2158 | res = qemu_get_buffer(rp, buf, header_len); |
| 2159 | if (res != header_len) { |
| 2160 | error_report("RP: Failed reading data for message 0x%04x" |
| 2161 | " read %d expected %d", |
| 2162 | header_type, res, header_len); |
| 2163 | mark_source_rp_bad(ms); |
| 2164 | goto out; |
| 2165 | } |
| 2166 | |
| 2167 | /* OK, we have the message and the data */ |
| 2168 | switch (header_type) { |
| 2169 | case MIG_RP_MSG_SHUT: |
Peter Maydell | 4d88513 | 2016-06-10 17:09:22 +0100 | [diff] [blame] | 2170 | sibling_error = ldl_be_p(buf); |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2171 | trace_source_return_path_thread_shut(sibling_error); |
| 2172 | if (sibling_error) { |
| 2173 | error_report("RP: Sibling indicated error %d", sibling_error); |
| 2174 | mark_source_rp_bad(ms); |
| 2175 | } |
| 2176 | /* |
| 2177 | * We'll let the main thread deal with closing the RP |
| 2178 | * we could do a shutdown(2) on it, but we're the only user |
| 2179 | * anyway, so there's nothing gained. |
| 2180 | */ |
| 2181 | goto out; |
| 2182 | |
| 2183 | case MIG_RP_MSG_PONG: |
Peter Maydell | 4d88513 | 2016-06-10 17:09:22 +0100 | [diff] [blame] | 2184 | tmp32 = ldl_be_p(buf); |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2185 | trace_source_return_path_thread_pong(tmp32); |
| 2186 | break; |
| 2187 | |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 2188 | case MIG_RP_MSG_REQ_PAGES: |
Peter Maydell | 4d88513 | 2016-06-10 17:09:22 +0100 | [diff] [blame] | 2189 | start = ldq_be_p(buf); |
| 2190 | len = ldl_be_p(buf + 8); |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 2191 | migrate_handle_rp_req_pages(ms, NULL, start, len); |
| 2192 | break; |
| 2193 | |
| 2194 | case MIG_RP_MSG_REQ_PAGES_ID: |
| 2195 | expected_len = 12 + 1; /* header + termination */ |
| 2196 | |
| 2197 | if (header_len >= expected_len) { |
Peter Maydell | 4d88513 | 2016-06-10 17:09:22 +0100 | [diff] [blame] | 2198 | start = ldq_be_p(buf); |
| 2199 | len = ldl_be_p(buf + 8); |
Dr. David Alan Gilbert | 1e2d90e | 2015-11-05 18:11:07 +0000 | [diff] [blame] | 2200 | /* Now we expect an idstr */ |
| 2201 | tmp32 = buf[12]; /* Length of the following idstr */ |
| 2202 | buf[13 + tmp32] = '\0'; |
| 2203 | expected_len += tmp32; |
| 2204 | } |
| 2205 | if (header_len != expected_len) { |
| 2206 | error_report("RP: Req_Page_id with length %d expecting %zd", |
| 2207 | header_len, expected_len); |
| 2208 | mark_source_rp_bad(ms); |
| 2209 | goto out; |
| 2210 | } |
| 2211 | migrate_handle_rp_req_pages(ms, (char *)&buf[13], start, len); |
| 2212 | break; |
| 2213 | |
Peter Xu | a335deb | 2018-05-02 18:47:28 +0800 | [diff] [blame] | 2214 | case MIG_RP_MSG_RECV_BITMAP: |
| 2215 | if (header_len < 1) { |
| 2216 | error_report("%s: missing block name", __func__); |
| 2217 | mark_source_rp_bad(ms); |
| 2218 | goto out; |
| 2219 | } |
| 2220 | /* Format: len (1B) + idstr (<255B). This ends the idstr. */ |
| 2221 | buf[buf[0] + 1] = '\0'; |
| 2222 | if (migrate_handle_rp_recv_bitmap(ms, (char *)(buf + 1))) { |
| 2223 | mark_source_rp_bad(ms); |
| 2224 | goto out; |
| 2225 | } |
| 2226 | break; |
| 2227 | |
Peter Xu | 13955b8 | 2018-05-02 18:47:30 +0800 | [diff] [blame] | 2228 | case MIG_RP_MSG_RESUME_ACK: |
| 2229 | tmp32 = ldl_be_p(buf); |
| 2230 | if (migrate_handle_rp_resume_ack(ms, tmp32)) { |
| 2231 | mark_source_rp_bad(ms); |
| 2232 | goto out; |
| 2233 | } |
| 2234 | break; |
| 2235 | |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2236 | default: |
| 2237 | break; |
| 2238 | } |
| 2239 | } |
Peter Xu | 14b1742 | 2018-05-02 18:47:21 +0800 | [diff] [blame] | 2240 | |
| 2241 | out: |
| 2242 | res = qemu_file_get_error(rp); |
| 2243 | if (res) { |
| 2244 | if (res == -EIO) { |
| 2245 | /* |
| 2246 | * Maybe there is something we can do: it looks like a |
| 2247 | * network down issue, and we pause for a recovery. |
| 2248 | */ |
| 2249 | if (postcopy_pause_return_path_thread(ms)) { |
| 2250 | /* Reload rp, reset the rest */ |
| 2251 | rp = ms->rp_state.from_dst_file; |
| 2252 | ms->rp_state.error = false; |
| 2253 | goto retry; |
| 2254 | } |
| 2255 | } |
| 2256 | |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2257 | trace_source_return_path_thread_bad_end(); |
| 2258 | mark_source_rp_bad(ms); |
| 2259 | } |
| 2260 | |
| 2261 | trace_source_return_path_thread_end(); |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2262 | ms->rp_state.from_dst_file = NULL; |
| 2263 | qemu_fclose(rp); |
Lidong Chen | 74637e6 | 2018-08-06 21:29:29 +0800 | [diff] [blame^] | 2264 | rcu_unregister_thread(); |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2265 | return NULL; |
| 2266 | } |
| 2267 | |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 2268 | static int open_return_path_on_source(MigrationState *ms, |
| 2269 | bool create_thread) |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2270 | { |
| 2271 | |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 2272 | ms->rp_state.from_dst_file = qemu_file_get_return_path(ms->to_dst_file); |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2273 | if (!ms->rp_state.from_dst_file) { |
| 2274 | return -1; |
| 2275 | } |
| 2276 | |
| 2277 | trace_open_return_path_on_source(); |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 2278 | |
| 2279 | if (!create_thread) { |
| 2280 | /* We're done */ |
| 2281 | return 0; |
| 2282 | } |
| 2283 | |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2284 | qemu_thread_create(&ms->rp_state.rp_thread, "return path", |
| 2285 | source_return_path_thread, ms, QEMU_THREAD_JOINABLE); |
| 2286 | |
| 2287 | trace_open_return_path_on_source_continue(); |
| 2288 | |
| 2289 | return 0; |
| 2290 | } |
| 2291 | |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2292 | /* Returns 0 if the RP was ok, otherwise there was an error on the RP */ |
| 2293 | static int await_return_path_close_on_source(MigrationState *ms) |
| 2294 | { |
| 2295 | /* |
| 2296 | * If this is a normal exit then the destination will send a SHUT and the |
| 2297 | * rp_thread will exit, however if there's an error we need to cause |
| 2298 | * it to exit. |
| 2299 | */ |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 2300 | if (qemu_file_get_error(ms->to_dst_file) && ms->rp_state.from_dst_file) { |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2301 | /* |
| 2302 | * shutdown(2), if we have it, will cause it to unblock if it's stuck |
| 2303 | * waiting for the destination. |
| 2304 | */ |
| 2305 | qemu_file_shutdown(ms->rp_state.from_dst_file); |
| 2306 | mark_source_rp_bad(ms); |
| 2307 | } |
| 2308 | trace_await_return_path_close_on_source_joining(); |
| 2309 | qemu_thread_join(&ms->rp_state.rp_thread); |
| 2310 | trace_await_return_path_close_on_source_close(); |
| 2311 | return ms->rp_state.error; |
| 2312 | } |
| 2313 | |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2314 | /* |
| 2315 | * Switch from normal iteration to postcopy |
| 2316 | * Returns non-0 on error |
| 2317 | */ |
Peter Xu | 7287cbd | 2018-01-03 20:20:09 +0800 | [diff] [blame] | 2318 | static int postcopy_start(MigrationState *ms) |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2319 | { |
| 2320 | int ret; |
Daniel P. Berrange | 61b67d4 | 2016-04-27 11:05:01 +0100 | [diff] [blame] | 2321 | QIOChannelBuffer *bioc; |
| 2322 | QEMUFile *fb; |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2323 | int64_t time_at_stop = qemu_clock_get_ms(QEMU_CLOCK_REALTIME); |
Dr. David Alan Gilbert | 7e555c6 | 2018-06-13 11:26:40 +0100 | [diff] [blame] | 2324 | int64_t bandwidth = migrate_max_postcopy_bandwidth(); |
Dr. David Alan Gilbert | ef8d648 | 2017-02-02 15:59:09 +0000 | [diff] [blame] | 2325 | bool restart_block = false; |
Dr. David Alan Gilbert | 0331c8c | 2017-10-20 10:05:56 +0100 | [diff] [blame] | 2326 | int cur_state = MIGRATION_STATUS_ACTIVE; |
| 2327 | if (!migrate_pause_before_switchover()) { |
| 2328 | migrate_set_state(&ms->state, MIGRATION_STATUS_ACTIVE, |
| 2329 | MIGRATION_STATUS_POSTCOPY_ACTIVE); |
| 2330 | } |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2331 | |
| 2332 | trace_postcopy_start(); |
| 2333 | qemu_mutex_lock_iothread(); |
| 2334 | trace_postcopy_start_set_run(); |
| 2335 | |
| 2336 | qemu_system_wakeup_request(QEMU_WAKEUP_REASON_OTHER); |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2337 | global_state_store(); |
| 2338 | ret = vm_stop_force_state(RUN_STATE_FINISH_MIGRATE); |
Kevin Wolf | 76b1c7f | 2015-12-22 14:07:08 +0100 | [diff] [blame] | 2339 | if (ret < 0) { |
| 2340 | goto fail; |
| 2341 | } |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2342 | |
Dr. David Alan Gilbert | 0331c8c | 2017-10-20 10:05:56 +0100 | [diff] [blame] | 2343 | ret = migration_maybe_pause(ms, &cur_state, |
| 2344 | MIGRATION_STATUS_POSTCOPY_ACTIVE); |
| 2345 | if (ret < 0) { |
| 2346 | goto fail; |
| 2347 | } |
| 2348 | |
Kevin Wolf | 76b1c7f | 2015-12-22 14:07:08 +0100 | [diff] [blame] | 2349 | ret = bdrv_inactivate_all(); |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2350 | if (ret < 0) { |
| 2351 | goto fail; |
| 2352 | } |
Dr. David Alan Gilbert | ef8d648 | 2017-02-02 15:59:09 +0000 | [diff] [blame] | 2353 | restart_block = true; |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2354 | |
| 2355 | /* |
Dr. David Alan Gilbert | 1c0d249 | 2015-11-11 14:02:27 +0000 | [diff] [blame] | 2356 | * Cause any non-postcopiable, but iterative devices to |
| 2357 | * send out their final data. |
| 2358 | */ |
Fam Zheng | a1fbe75 | 2017-06-17 00:06:58 +0800 | [diff] [blame] | 2359 | qemu_savevm_state_complete_precopy(ms->to_dst_file, true, false); |
Dr. David Alan Gilbert | 1c0d249 | 2015-11-11 14:02:27 +0000 | [diff] [blame] | 2360 | |
| 2361 | /* |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2362 | * in Finish migrate and with the io-lock held everything should |
| 2363 | * be quiet, but we've potentially still got dirty pages and we |
| 2364 | * need to tell the destination to throw any pages it's already received |
| 2365 | * that are dirty |
| 2366 | */ |
Vladimir Sementsov-Ogievskiy | 58110f0 | 2017-07-10 19:30:16 +0300 | [diff] [blame] | 2367 | if (migrate_postcopy_ram()) { |
| 2368 | if (ram_postcopy_send_discard_bitmap(ms)) { |
| 2369 | error_report("postcopy send discard bitmap failed"); |
| 2370 | goto fail; |
| 2371 | } |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2372 | } |
| 2373 | |
| 2374 | /* |
| 2375 | * send rest of state - note things that are doing postcopy |
| 2376 | * will notice we're in POSTCOPY_ACTIVE and not actually |
| 2377 | * wrap their state up here |
| 2378 | */ |
Dr. David Alan Gilbert | 7e555c6 | 2018-06-13 11:26:40 +0100 | [diff] [blame] | 2379 | /* 0 max-postcopy-bandwidth means unlimited */ |
| 2380 | if (!bandwidth) { |
| 2381 | qemu_file_set_rate_limit(ms->to_dst_file, INT64_MAX); |
| 2382 | } else { |
| 2383 | qemu_file_set_rate_limit(ms->to_dst_file, bandwidth / XFER_LIMIT_RATIO); |
| 2384 | } |
Vladimir Sementsov-Ogievskiy | 58110f0 | 2017-07-10 19:30:16 +0300 | [diff] [blame] | 2385 | if (migrate_postcopy_ram()) { |
| 2386 | /* Ping just for debugging, helps line traces up */ |
| 2387 | qemu_savevm_send_ping(ms->to_dst_file, 2); |
| 2388 | } |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2389 | |
| 2390 | /* |
| 2391 | * While loading the device state we may trigger page transfer |
| 2392 | * requests and the fd must be free to process those, and thus |
| 2393 | * the destination must read the whole device state off the fd before |
| 2394 | * it starts processing it. Unfortunately the ad-hoc migration format |
| 2395 | * doesn't allow the destination to know the size to read without fully |
| 2396 | * parsing it through each devices load-state code (especially the open |
| 2397 | * coded devices that use get/put). |
| 2398 | * So we wrap the device state up in a package with a length at the start; |
| 2399 | * to do this we use a qemu_buf to hold the whole of the device state. |
| 2400 | */ |
Daniel P. Berrange | 61b67d4 | 2016-04-27 11:05:01 +0100 | [diff] [blame] | 2401 | bioc = qio_channel_buffer_new(4096); |
Daniel P. Berrange | 6f01f13 | 2016-09-30 11:57:14 +0100 | [diff] [blame] | 2402 | qio_channel_set_name(QIO_CHANNEL(bioc), "migration-postcopy-buffer"); |
Daniel P. Berrange | 61b67d4 | 2016-04-27 11:05:01 +0100 | [diff] [blame] | 2403 | fb = qemu_fopen_channel_output(QIO_CHANNEL(bioc)); |
| 2404 | object_unref(OBJECT(bioc)); |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2405 | |
Dr. David Alan Gilbert | c76201a | 2015-11-05 18:11:18 +0000 | [diff] [blame] | 2406 | /* |
| 2407 | * Make sure the receiver can get incoming pages before we send the rest |
| 2408 | * of the state |
| 2409 | */ |
| 2410 | qemu_savevm_send_postcopy_listen(fb); |
| 2411 | |
Fam Zheng | a1fbe75 | 2017-06-17 00:06:58 +0800 | [diff] [blame] | 2412 | qemu_savevm_state_complete_precopy(fb, false, false); |
Vladimir Sementsov-Ogievskiy | 58110f0 | 2017-07-10 19:30:16 +0300 | [diff] [blame] | 2413 | if (migrate_postcopy_ram()) { |
| 2414 | qemu_savevm_send_ping(fb, 3); |
| 2415 | } |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2416 | |
| 2417 | qemu_savevm_send_postcopy_run(fb); |
| 2418 | |
| 2419 | /* <><> end of stuff going into the package */ |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2420 | |
Dr. David Alan Gilbert | ef8d648 | 2017-02-02 15:59:09 +0000 | [diff] [blame] | 2421 | /* Last point of recovery; as soon as we send the package the destination |
| 2422 | * can open devices and potentially start running. |
| 2423 | * Lets just check again we've not got any errors. |
| 2424 | */ |
| 2425 | ret = qemu_file_get_error(ms->to_dst_file); |
| 2426 | if (ret) { |
| 2427 | error_report("postcopy_start: Migration stream errored (pre package)"); |
| 2428 | goto fail_closefb; |
| 2429 | } |
| 2430 | |
| 2431 | restart_block = false; |
| 2432 | |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2433 | /* Now send that blob */ |
Daniel P. Berrange | 61b67d4 | 2016-04-27 11:05:01 +0100 | [diff] [blame] | 2434 | if (qemu_savevm_send_packaged(ms->to_dst_file, bioc->data, bioc->usage)) { |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2435 | goto fail_closefb; |
| 2436 | } |
| 2437 | qemu_fclose(fb); |
Dr. David Alan Gilbert | b82fc32 | 2016-02-22 17:17:32 +0000 | [diff] [blame] | 2438 | |
| 2439 | /* Send a notify to give a chance for anything that needs to happen |
| 2440 | * at the transition to postcopy and after the device state; in particular |
| 2441 | * spice needs to trigger a transition now |
| 2442 | */ |
| 2443 | ms->postcopy_after_devices = true; |
| 2444 | notifier_list_notify(&migration_state_notifiers, ms); |
| 2445 | |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2446 | ms->downtime = qemu_clock_get_ms(QEMU_CLOCK_REALTIME) - time_at_stop; |
| 2447 | |
| 2448 | qemu_mutex_unlock_iothread(); |
| 2449 | |
Vladimir Sementsov-Ogievskiy | 58110f0 | 2017-07-10 19:30:16 +0300 | [diff] [blame] | 2450 | if (migrate_postcopy_ram()) { |
| 2451 | /* |
| 2452 | * Although this ping is just for debug, it could potentially be |
| 2453 | * used for getting a better measurement of downtime at the source. |
| 2454 | */ |
| 2455 | qemu_savevm_send_ping(ms->to_dst_file, 4); |
| 2456 | } |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2457 | |
Pavel Butsykin | ced1c61 | 2017-02-03 18:23:21 +0300 | [diff] [blame] | 2458 | if (migrate_release_ram()) { |
| 2459 | ram_postcopy_migrated_memory_release(ms); |
| 2460 | } |
| 2461 | |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 2462 | ret = qemu_file_get_error(ms->to_dst_file); |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2463 | if (ret) { |
| 2464 | error_report("postcopy_start: Migration stream errored"); |
zhanghailiang | 48781e5 | 2015-12-16 11:47:33 +0000 | [diff] [blame] | 2465 | migrate_set_state(&ms->state, MIGRATION_STATUS_POSTCOPY_ACTIVE, |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2466 | MIGRATION_STATUS_FAILED); |
| 2467 | } |
| 2468 | |
| 2469 | return ret; |
| 2470 | |
| 2471 | fail_closefb: |
| 2472 | qemu_fclose(fb); |
| 2473 | fail: |
zhanghailiang | 48781e5 | 2015-12-16 11:47:33 +0000 | [diff] [blame] | 2474 | migrate_set_state(&ms->state, MIGRATION_STATUS_POSTCOPY_ACTIVE, |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2475 | MIGRATION_STATUS_FAILED); |
Dr. David Alan Gilbert | ef8d648 | 2017-02-02 15:59:09 +0000 | [diff] [blame] | 2476 | if (restart_block) { |
| 2477 | /* A failure happened early enough that we know the destination hasn't |
| 2478 | * accessed block devices, so we're safe to recover. |
| 2479 | */ |
| 2480 | Error *local_err = NULL; |
| 2481 | |
| 2482 | bdrv_invalidate_cache_all(&local_err); |
| 2483 | if (local_err) { |
| 2484 | error_report_err(local_err); |
| 2485 | } |
| 2486 | } |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2487 | qemu_mutex_unlock_iothread(); |
| 2488 | return -1; |
| 2489 | } |
| 2490 | |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2491 | /** |
Dr. David Alan Gilbert | e91d895 | 2017-10-20 10:05:52 +0100 | [diff] [blame] | 2492 | * migration_maybe_pause: Pause if required to by |
| 2493 | * migrate_pause_before_switchover called with the iothread locked |
| 2494 | * Returns: 0 on success |
| 2495 | */ |
Dr. David Alan Gilbert | 0331c8c | 2017-10-20 10:05:56 +0100 | [diff] [blame] | 2496 | static int migration_maybe_pause(MigrationState *s, |
| 2497 | int *current_active_state, |
| 2498 | int new_state) |
Dr. David Alan Gilbert | e91d895 | 2017-10-20 10:05:52 +0100 | [diff] [blame] | 2499 | { |
| 2500 | if (!migrate_pause_before_switchover()) { |
| 2501 | return 0; |
| 2502 | } |
| 2503 | |
| 2504 | /* Since leaving this state is not atomic with posting the semaphore |
| 2505 | * it's possible that someone could have issued multiple migrate_continue |
| 2506 | * and the semaphore is incorrectly positive at this point; |
| 2507 | * the docs say it's undefined to reinit a semaphore that's already |
| 2508 | * init'd, so use timedwait to eat up any existing posts. |
| 2509 | */ |
| 2510 | while (qemu_sem_timedwait(&s->pause_sem, 1) == 0) { |
| 2511 | /* This block intentionally left blank */ |
| 2512 | } |
| 2513 | |
| 2514 | qemu_mutex_unlock_iothread(); |
| 2515 | migrate_set_state(&s->state, *current_active_state, |
| 2516 | MIGRATION_STATUS_PRE_SWITCHOVER); |
| 2517 | qemu_sem_wait(&s->pause_sem); |
| 2518 | migrate_set_state(&s->state, MIGRATION_STATUS_PRE_SWITCHOVER, |
Dr. David Alan Gilbert | 0331c8c | 2017-10-20 10:05:56 +0100 | [diff] [blame] | 2519 | new_state); |
| 2520 | *current_active_state = new_state; |
Dr. David Alan Gilbert | e91d895 | 2017-10-20 10:05:52 +0100 | [diff] [blame] | 2521 | qemu_mutex_lock_iothread(); |
| 2522 | |
Dr. David Alan Gilbert | 0331c8c | 2017-10-20 10:05:56 +0100 | [diff] [blame] | 2523 | return s->state == new_state ? 0 : -EINVAL; |
Dr. David Alan Gilbert | e91d895 | 2017-10-20 10:05:52 +0100 | [diff] [blame] | 2524 | } |
| 2525 | |
| 2526 | /** |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2527 | * migration_completion: Used by migration_thread when there's not much left. |
| 2528 | * The caller 'breaks' the loop when this returns. |
| 2529 | * |
| 2530 | * @s: Current migration state |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2531 | */ |
Peter Xu | 2ad8730 | 2018-01-03 20:20:14 +0800 | [diff] [blame] | 2532 | static void migration_completion(MigrationState *s) |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2533 | { |
| 2534 | int ret; |
Peter Xu | 2ad8730 | 2018-01-03 20:20:14 +0800 | [diff] [blame] | 2535 | int current_active_state = s->state; |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2536 | |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2537 | if (s->state == MIGRATION_STATUS_ACTIVE) { |
| 2538 | qemu_mutex_lock_iothread(); |
Peter Xu | 64909f9 | 2018-01-03 20:20:10 +0800 | [diff] [blame] | 2539 | s->downtime_start = qemu_clock_get_ms(QEMU_CLOCK_REALTIME); |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2540 | qemu_system_wakeup_request(QEMU_WAKEUP_REASON_OTHER); |
Peter Xu | 7287cbd | 2018-01-03 20:20:09 +0800 | [diff] [blame] | 2541 | s->vm_was_running = runstate_is_running(); |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2542 | ret = global_state_store(); |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2543 | |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2544 | if (!ret) { |
Fam Zheng | a1fbe75 | 2017-06-17 00:06:58 +0800 | [diff] [blame] | 2545 | bool inactivate = !migrate_colo_enabled(); |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2546 | ret = vm_stop_force_state(RUN_STATE_FINISH_MIGRATE); |
Kevin Wolf | f07fa4c | 2017-05-22 17:10:38 +0200 | [diff] [blame] | 2547 | if (ret >= 0) { |
Dr. David Alan Gilbert | 0331c8c | 2017-10-20 10:05:56 +0100 | [diff] [blame] | 2548 | ret = migration_maybe_pause(s, ¤t_active_state, |
| 2549 | MIGRATION_STATUS_DEVICE); |
Dr. David Alan Gilbert | e91d895 | 2017-10-20 10:05:52 +0100 | [diff] [blame] | 2550 | } |
| 2551 | if (ret >= 0) { |
Kevin Wolf | f07fa4c | 2017-05-22 17:10:38 +0200 | [diff] [blame] | 2552 | qemu_file_set_rate_limit(s->to_dst_file, INT64_MAX); |
Fam Zheng | a1fbe75 | 2017-06-17 00:06:58 +0800 | [diff] [blame] | 2553 | ret = qemu_savevm_state_complete_precopy(s->to_dst_file, false, |
| 2554 | inactivate); |
Kevin Wolf | f07fa4c | 2017-05-22 17:10:38 +0200 | [diff] [blame] | 2555 | } |
Fam Zheng | a1fbe75 | 2017-06-17 00:06:58 +0800 | [diff] [blame] | 2556 | if (inactivate && ret >= 0) { |
| 2557 | s->block_inactive = true; |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2558 | } |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2559 | } |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2560 | qemu_mutex_unlock_iothread(); |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2561 | |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2562 | if (ret < 0) { |
| 2563 | goto fail; |
| 2564 | } |
| 2565 | } else if (s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE) { |
| 2566 | trace_migration_completion_postcopy_end(); |
| 2567 | |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 2568 | qemu_savevm_state_complete_postcopy(s->to_dst_file); |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2569 | trace_migration_completion_postcopy_end_after_complete(); |
| 2570 | } |
| 2571 | |
| 2572 | /* |
| 2573 | * If rp was opened we must clean up the thread before |
| 2574 | * cleaning everything else up (since if there are no failures |
| 2575 | * it will wait for the destination to send it's status in |
| 2576 | * a SHUT command). |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2577 | */ |
Peter Xu | 0425dc9 | 2017-05-31 18:35:34 +0800 | [diff] [blame] | 2578 | if (s->rp_state.from_dst_file) { |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2579 | int rp_error; |
Peter Xu | 0425dc9 | 2017-05-31 18:35:34 +0800 | [diff] [blame] | 2580 | trace_migration_return_path_end_before(); |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2581 | rp_error = await_return_path_close_on_source(s); |
Peter Xu | 0425dc9 | 2017-05-31 18:35:34 +0800 | [diff] [blame] | 2582 | trace_migration_return_path_end_after(rp_error); |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2583 | if (rp_error) { |
Greg Kurz | fe904ea | 2016-05-18 15:44:36 +0200 | [diff] [blame] | 2584 | goto fail_invalidate; |
Dr. David Alan Gilbert | b10ac0c | 2015-11-05 18:11:06 +0000 | [diff] [blame] | 2585 | } |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2586 | } |
| 2587 | |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 2588 | if (qemu_file_get_error(s->to_dst_file)) { |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2589 | trace_migration_completion_file_err(); |
Greg Kurz | fe904ea | 2016-05-18 15:44:36 +0200 | [diff] [blame] | 2590 | goto fail_invalidate; |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2591 | } |
| 2592 | |
zhanghailiang | 0b827d5 | 2016-10-27 14:42:54 +0800 | [diff] [blame] | 2593 | if (!migrate_colo_enabled()) { |
| 2594 | migrate_set_state(&s->state, current_active_state, |
| 2595 | MIGRATION_STATUS_COMPLETED); |
| 2596 | } |
| 2597 | |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2598 | return; |
| 2599 | |
Greg Kurz | fe904ea | 2016-05-18 15:44:36 +0200 | [diff] [blame] | 2600 | fail_invalidate: |
| 2601 | /* If not doing postcopy, vm_start() will be called: let's regain |
| 2602 | * control on images. |
| 2603 | */ |
Dr. David Alan Gilbert | 6039dd5 | 2018-02-05 09:13:37 +0000 | [diff] [blame] | 2604 | if (s->state == MIGRATION_STATUS_ACTIVE || |
| 2605 | s->state == MIGRATION_STATUS_DEVICE) { |
Greg Kurz | fe904ea | 2016-05-18 15:44:36 +0200 | [diff] [blame] | 2606 | Error *local_err = NULL; |
| 2607 | |
zhanghailiang | 1d2acc3 | 2017-01-24 15:59:52 +0800 | [diff] [blame] | 2608 | qemu_mutex_lock_iothread(); |
Greg Kurz | fe904ea | 2016-05-18 15:44:36 +0200 | [diff] [blame] | 2609 | bdrv_invalidate_cache_all(&local_err); |
| 2610 | if (local_err) { |
| 2611 | error_report_err(local_err); |
zhanghailiang | 1d2acc3 | 2017-01-24 15:59:52 +0800 | [diff] [blame] | 2612 | } else { |
| 2613 | s->block_inactive = false; |
Greg Kurz | fe904ea | 2016-05-18 15:44:36 +0200 | [diff] [blame] | 2614 | } |
zhanghailiang | 1d2acc3 | 2017-01-24 15:59:52 +0800 | [diff] [blame] | 2615 | qemu_mutex_unlock_iothread(); |
Greg Kurz | fe904ea | 2016-05-18 15:44:36 +0200 | [diff] [blame] | 2616 | } |
| 2617 | |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2618 | fail: |
zhanghailiang | 48781e5 | 2015-12-16 11:47:33 +0000 | [diff] [blame] | 2619 | migrate_set_state(&s->state, current_active_state, |
| 2620 | MIGRATION_STATUS_FAILED); |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 2621 | } |
| 2622 | |
zhanghailiang | 35a6ed4 | 2016-10-27 14:42:52 +0800 | [diff] [blame] | 2623 | bool migrate_colo_enabled(void) |
| 2624 | { |
| 2625 | MigrationState *s = migrate_get_current(); |
| 2626 | return s->enabled_capabilities[MIGRATION_CAPABILITY_X_COLO]; |
| 2627 | } |
| 2628 | |
/* Outcome of error detection/handling in the migration thread */
typedef enum MigThrError {
    MIG_THR_ERR_NONE = 0,       /* No error detected */
    MIG_THR_ERR_RECOVERED = 1,  /* Detected error, but resumed successfully */
    MIG_THR_ERR_FATAL = 2,      /* Detected fatal error, need to exit */
} MigThrError;
| 2637 | |
Peter Xu | 9419069 | 2018-05-02 18:47:34 +0800 | [diff] [blame] | 2638 | static int postcopy_resume_handshake(MigrationState *s) |
| 2639 | { |
| 2640 | qemu_savevm_send_postcopy_resume(s->to_dst_file); |
| 2641 | |
| 2642 | while (s->state == MIGRATION_STATUS_POSTCOPY_RECOVER) { |
| 2643 | qemu_sem_wait(&s->rp_state.rp_sem); |
| 2644 | } |
| 2645 | |
| 2646 | if (s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE) { |
| 2647 | return 0; |
| 2648 | } |
| 2649 | |
| 2650 | return -1; |
| 2651 | } |
| 2652 | |
Peter Xu | 135b87b | 2018-05-02 18:47:25 +0800 | [diff] [blame] | 2653 | /* Return zero if success, or <0 for error */ |
| 2654 | static int postcopy_do_resume(MigrationState *s) |
| 2655 | { |
Peter Xu | d1b8ead | 2018-05-02 18:47:31 +0800 | [diff] [blame] | 2656 | int ret; |
| 2657 | |
| 2658 | /* |
| 2659 | * Call all the resume_prepare() hooks, so that modules can be |
| 2660 | * ready for the migration resume. |
| 2661 | */ |
| 2662 | ret = qemu_savevm_state_resume_prepare(s); |
| 2663 | if (ret) { |
| 2664 | error_report("%s: resume_prepare() failure detected: %d", |
| 2665 | __func__, ret); |
| 2666 | return ret; |
| 2667 | } |
| 2668 | |
| 2669 | /* |
Peter Xu | 9419069 | 2018-05-02 18:47:34 +0800 | [diff] [blame] | 2670 | * Last handshake with destination on the resume (destination will |
| 2671 | * switch to postcopy-active afterwards) |
Peter Xu | d1b8ead | 2018-05-02 18:47:31 +0800 | [diff] [blame] | 2672 | */ |
Peter Xu | 9419069 | 2018-05-02 18:47:34 +0800 | [diff] [blame] | 2673 | ret = postcopy_resume_handshake(s); |
| 2674 | if (ret) { |
| 2675 | error_report("%s: handshake failed: %d", __func__, ret); |
| 2676 | return ret; |
| 2677 | } |
Peter Xu | d1b8ead | 2018-05-02 18:47:31 +0800 | [diff] [blame] | 2678 | |
Peter Xu | 135b87b | 2018-05-02 18:47:25 +0800 | [diff] [blame] | 2679 | return 0; |
| 2680 | } |
| 2681 | |
Peter Xu | b23c2ad | 2018-05-02 18:47:19 +0800 | [diff] [blame] | 2682 | /* |
| 2683 | * We don't return until we are in a safe state to continue current |
| 2684 | * postcopy migration. Returns MIG_THR_ERR_RECOVERED if recovered, or |
| 2685 | * MIG_THR_ERR_FATAL if unrecovery failure happened. |
| 2686 | */ |
| 2687 | static MigThrError postcopy_pause(MigrationState *s) |
| 2688 | { |
| 2689 | assert(s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE); |
Peter Xu | b23c2ad | 2018-05-02 18:47:19 +0800 | [diff] [blame] | 2690 | |
Peter Xu | 135b87b | 2018-05-02 18:47:25 +0800 | [diff] [blame] | 2691 | while (true) { |
Peter Xu | 62df066 | 2018-05-02 18:47:38 +0800 | [diff] [blame] | 2692 | QEMUFile *file; |
| 2693 | |
Peter Xu | 135b87b | 2018-05-02 18:47:25 +0800 | [diff] [blame] | 2694 | migrate_set_state(&s->state, s->state, |
| 2695 | MIGRATION_STATUS_POSTCOPY_PAUSED); |
Peter Xu | b23c2ad | 2018-05-02 18:47:19 +0800 | [diff] [blame] | 2696 | |
Peter Xu | 135b87b | 2018-05-02 18:47:25 +0800 | [diff] [blame] | 2697 | /* Current channel is possibly broken. Release it. */ |
| 2698 | assert(s->to_dst_file); |
Peter Xu | 62df066 | 2018-05-02 18:47:38 +0800 | [diff] [blame] | 2699 | qemu_mutex_lock(&s->qemu_file_lock); |
| 2700 | file = s->to_dst_file; |
Peter Xu | 135b87b | 2018-05-02 18:47:25 +0800 | [diff] [blame] | 2701 | s->to_dst_file = NULL; |
Peter Xu | 62df066 | 2018-05-02 18:47:38 +0800 | [diff] [blame] | 2702 | qemu_mutex_unlock(&s->qemu_file_lock); |
| 2703 | |
| 2704 | qemu_file_shutdown(file); |
| 2705 | qemu_fclose(file); |
Peter Xu | b23c2ad | 2018-05-02 18:47:19 +0800 | [diff] [blame] | 2706 | |
Peter Xu | 135b87b | 2018-05-02 18:47:25 +0800 | [diff] [blame] | 2707 | error_report("Detected IO failure for postcopy. " |
| 2708 | "Migration paused."); |
| 2709 | |
| 2710 | /* |
| 2711 | * We wait until things fixed up. Then someone will setup the |
| 2712 | * status back for us. |
| 2713 | */ |
| 2714 | while (s->state == MIGRATION_STATUS_POSTCOPY_PAUSED) { |
| 2715 | qemu_sem_wait(&s->postcopy_pause_sem); |
| 2716 | } |
| 2717 | |
| 2718 | if (s->state == MIGRATION_STATUS_POSTCOPY_RECOVER) { |
| 2719 | /* Woken up by a recover procedure. Give it a shot */ |
| 2720 | |
| 2721 | /* |
| 2722 | * Firstly, let's wake up the return path now, with a new |
| 2723 | * return path channel. |
| 2724 | */ |
| 2725 | qemu_sem_post(&s->postcopy_pause_rp_sem); |
| 2726 | |
| 2727 | /* Do the resume logic */ |
| 2728 | if (postcopy_do_resume(s) == 0) { |
| 2729 | /* Let's continue! */ |
| 2730 | trace_postcopy_pause_continued(); |
| 2731 | return MIG_THR_ERR_RECOVERED; |
| 2732 | } else { |
| 2733 | /* |
| 2734 | * Something wrong happened during the recovery, let's |
| 2735 | * pause again. Pause is always better than throwing |
| 2736 | * data away. |
| 2737 | */ |
| 2738 | continue; |
| 2739 | } |
| 2740 | } else { |
| 2741 | /* This is not right... Time to quit. */ |
| 2742 | return MIG_THR_ERR_FATAL; |
| 2743 | } |
Peter Xu | b23c2ad | 2018-05-02 18:47:19 +0800 | [diff] [blame] | 2744 | } |
Peter Xu | b23c2ad | 2018-05-02 18:47:19 +0800 | [diff] [blame] | 2745 | } |
| 2746 | |
| 2747 | static MigThrError migration_detect_error(MigrationState *s) |
| 2748 | { |
| 2749 | int ret; |
| 2750 | |
| 2751 | /* Try to detect any file errors */ |
| 2752 | ret = qemu_file_get_error(s->to_dst_file); |
| 2753 | |
| 2754 | if (!ret) { |
| 2755 | /* Everything is fine */ |
| 2756 | return MIG_THR_ERR_NONE; |
| 2757 | } |
| 2758 | |
| 2759 | if (s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE && ret == -EIO) { |
| 2760 | /* |
| 2761 | * For postcopy, we allow the network to be down for a |
| 2762 | * while. After that, it can be continued by a |
| 2763 | * recovery phase. |
| 2764 | */ |
| 2765 | return postcopy_pause(s); |
| 2766 | } else { |
| 2767 | /* |
| 2768 | * For precopy (or postcopy with error outside IO), we fail |
| 2769 | * with no time. |
| 2770 | */ |
| 2771 | migrate_set_state(&s->state, s->state, MIGRATION_STATUS_FAILED); |
| 2772 | trace_migration_thread_file_err(); |
| 2773 | |
| 2774 | /* Time to stop the migration, now. */ |
| 2775 | return MIG_THR_ERR_FATAL; |
| 2776 | } |
| 2777 | } |
| 2778 | |
Juan Quintela | 0c8f0ef | 2018-06-26 15:38:00 +0200 | [diff] [blame] | 2779 | /* How many bytes have we transferred since the beggining of the migration */ |
| 2780 | static uint64_t migration_total_bytes(MigrationState *s) |
| 2781 | { |
Juan Quintela | b9ee2f7 | 2016-01-15 11:40:13 +0100 | [diff] [blame] | 2782 | return qemu_ftell(s->to_dst_file) + ram_counters.multifd_bytes; |
Juan Quintela | 0c8f0ef | 2018-06-26 15:38:00 +0200 | [diff] [blame] | 2783 | } |
| 2784 | |
Peter Xu | cf011f0 | 2018-01-03 20:20:11 +0800 | [diff] [blame] | 2785 | static void migration_calculate_complete(MigrationState *s) |
| 2786 | { |
Juan Quintela | 0c8f0ef | 2018-06-26 15:38:00 +0200 | [diff] [blame] | 2787 | uint64_t bytes = migration_total_bytes(s); |
Peter Xu | cf011f0 | 2018-01-03 20:20:11 +0800 | [diff] [blame] | 2788 | int64_t end_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME); |
Juan Quintela | 6cde6fb | 2018-06-26 15:26:35 +0200 | [diff] [blame] | 2789 | int64_t transfer_time; |
Peter Xu | cf011f0 | 2018-01-03 20:20:11 +0800 | [diff] [blame] | 2790 | |
| 2791 | s->total_time = end_time - s->start_time; |
| 2792 | if (!s->downtime) { |
| 2793 | /* |
| 2794 | * It's still not set, so we are precopy migration. For |
| 2795 | * postcopy, downtime is calculated during postcopy_start(). |
| 2796 | */ |
| 2797 | s->downtime = end_time - s->downtime_start; |
| 2798 | } |
| 2799 | |
Juan Quintela | 6cde6fb | 2018-06-26 15:26:35 +0200 | [diff] [blame] | 2800 | transfer_time = s->total_time - s->setup_time; |
| 2801 | if (transfer_time) { |
| 2802 | s->mbps = ((double) bytes * 8.0) / transfer_time / 1000; |
Peter Xu | cf011f0 | 2018-01-03 20:20:11 +0800 | [diff] [blame] | 2803 | } |
| 2804 | } |
| 2805 | |
Peter Xu | b15df1a | 2018-01-03 20:20:13 +0800 | [diff] [blame] | 2806 | static void migration_update_counters(MigrationState *s, |
| 2807 | int64_t current_time) |
| 2808 | { |
| 2809 | uint64_t transferred, time_spent; |
Juan Quintela | 0c8f0ef | 2018-06-26 15:38:00 +0200 | [diff] [blame] | 2810 | uint64_t current_bytes; /* bytes transferred since the beginning */ |
Peter Xu | b15df1a | 2018-01-03 20:20:13 +0800 | [diff] [blame] | 2811 | double bandwidth; |
| 2812 | |
| 2813 | if (current_time < s->iteration_start_time + BUFFER_DELAY) { |
| 2814 | return; |
| 2815 | } |
| 2816 | |
Juan Quintela | 0c8f0ef | 2018-06-26 15:38:00 +0200 | [diff] [blame] | 2817 | current_bytes = migration_total_bytes(s); |
| 2818 | transferred = current_bytes - s->iteration_initial_bytes; |
Peter Xu | b15df1a | 2018-01-03 20:20:13 +0800 | [diff] [blame] | 2819 | time_spent = current_time - s->iteration_start_time; |
| 2820 | bandwidth = (double)transferred / time_spent; |
Wei Wang | 0781c1e | 2018-01-22 19:36:39 +0800 | [diff] [blame] | 2821 | s->threshold_size = bandwidth * s->parameters.downtime_limit; |
Peter Xu | b15df1a | 2018-01-03 20:20:13 +0800 | [diff] [blame] | 2822 | |
| 2823 | s->mbps = (((double) transferred * 8.0) / |
| 2824 | ((double) time_spent / 1000.0)) / 1000.0 / 1000.0; |
| 2825 | |
| 2826 | /* |
| 2827 | * if we haven't sent anything, we don't want to |
| 2828 | * recalculate. 10000 is a small enough number for our purposes |
| 2829 | */ |
| 2830 | if (ram_counters.dirty_pages_rate && transferred > 10000) { |
Balamuruhan S | 650af89 | 2018-06-12 14:20:09 +0530 | [diff] [blame] | 2831 | s->expected_downtime = ram_counters.remaining / bandwidth; |
Peter Xu | b15df1a | 2018-01-03 20:20:13 +0800 | [diff] [blame] | 2832 | } |
| 2833 | |
| 2834 | qemu_file_reset_rate_limit(s->to_dst_file); |
| 2835 | |
| 2836 | s->iteration_start_time = current_time; |
Juan Quintela | 0c8f0ef | 2018-06-26 15:38:00 +0200 | [diff] [blame] | 2837 | s->iteration_initial_bytes = current_bytes; |
Peter Xu | b15df1a | 2018-01-03 20:20:13 +0800 | [diff] [blame] | 2838 | |
| 2839 | trace_migrate_transferred(transferred, time_spent, |
Wei Wang | 0781c1e | 2018-01-22 19:36:39 +0800 | [diff] [blame] | 2840 | bandwidth, s->threshold_size); |
Peter Xu | b15df1a | 2018-01-03 20:20:13 +0800 | [diff] [blame] | 2841 | } |
| 2842 | |
/*
 * Outcome of one step of the migration thread loop, telling the loop
 * what to do next.
 */
typedef enum {
    /* Resume current iteration */
    MIG_ITERATE_RESUME = 0,
    /* Skip current iteration */
    MIG_ITERATE_SKIP = 1,
    /* Break the loop */
    MIG_ITERATE_BREAK = 2,
} MigIterateState;
| 2849 | |
| 2850 | /* |
| 2851 | * Return true if continue to the next iteration directly, false |
| 2852 | * otherwise. |
| 2853 | */ |
| 2854 | static MigIterateState migration_iteration_run(MigrationState *s) |
| 2855 | { |
Vladimir Sementsov-Ogievskiy | 4799502 | 2018-03-13 15:34:00 -0400 | [diff] [blame] | 2856 | uint64_t pending_size, pend_pre, pend_compat, pend_post; |
Peter Xu | 2ad8730 | 2018-01-03 20:20:14 +0800 | [diff] [blame] | 2857 | bool in_postcopy = s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE; |
| 2858 | |
Vladimir Sementsov-Ogievskiy | 4799502 | 2018-03-13 15:34:00 -0400 | [diff] [blame] | 2859 | qemu_savevm_state_pending(s->to_dst_file, s->threshold_size, &pend_pre, |
| 2860 | &pend_compat, &pend_post); |
| 2861 | pending_size = pend_pre + pend_compat + pend_post; |
Peter Xu | 2ad8730 | 2018-01-03 20:20:14 +0800 | [diff] [blame] | 2862 | |
| 2863 | trace_migrate_pending(pending_size, s->threshold_size, |
Vladimir Sementsov-Ogievskiy | 4799502 | 2018-03-13 15:34:00 -0400 | [diff] [blame] | 2864 | pend_pre, pend_compat, pend_post); |
Peter Xu | 2ad8730 | 2018-01-03 20:20:14 +0800 | [diff] [blame] | 2865 | |
| 2866 | if (pending_size && pending_size >= s->threshold_size) { |
| 2867 | /* Still a significant amount to transfer */ |
| 2868 | if (migrate_postcopy() && !in_postcopy && |
Vladimir Sementsov-Ogievskiy | 4799502 | 2018-03-13 15:34:00 -0400 | [diff] [blame] | 2869 | pend_pre <= s->threshold_size && |
Peter Xu | 2ad8730 | 2018-01-03 20:20:14 +0800 | [diff] [blame] | 2870 | atomic_read(&s->start_postcopy)) { |
| 2871 | if (postcopy_start(s)) { |
| 2872 | error_report("%s: postcopy failed to start", __func__); |
| 2873 | } |
| 2874 | return MIG_ITERATE_SKIP; |
| 2875 | } |
| 2876 | /* Just another iteration step */ |
| 2877 | qemu_savevm_state_iterate(s->to_dst_file, |
| 2878 | s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE); |
| 2879 | } else { |
| 2880 | trace_migration_thread_low_pending(pending_size); |
| 2881 | migration_completion(s); |
| 2882 | return MIG_ITERATE_BREAK; |
| 2883 | } |
| 2884 | |
| 2885 | return MIG_ITERATE_RESUME; |
| 2886 | } |
| 2887 | |
Peter Xu | 199aa6d | 2018-01-03 20:20:15 +0800 | [diff] [blame] | 2888 | static void migration_iteration_finish(MigrationState *s) |
| 2889 | { |
| 2890 | /* If we enabled cpu throttling for auto-converge, turn it off. */ |
| 2891 | cpu_throttle_stop(); |
| 2892 | |
| 2893 | qemu_mutex_lock_iothread(); |
| 2894 | switch (s->state) { |
| 2895 | case MIGRATION_STATUS_COMPLETED: |
| 2896 | migration_calculate_complete(s); |
| 2897 | runstate_set(RUN_STATE_POSTMIGRATE); |
| 2898 | break; |
| 2899 | |
| 2900 | case MIGRATION_STATUS_ACTIVE: |
| 2901 | /* |
| 2902 | * We should really assert here, but since it's during |
| 2903 | * migration, let's try to reduce the usage of assertions. |
| 2904 | */ |
| 2905 | if (!migrate_colo_enabled()) { |
| 2906 | error_report("%s: critical error: calling COLO code without " |
| 2907 | "COLO enabled", __func__); |
| 2908 | } |
| 2909 | migrate_start_colo_process(s); |
| 2910 | /* |
| 2911 | * Fixme: we will run VM in COLO no matter its old running state. |
| 2912 | * After exited COLO, we will keep running. |
| 2913 | */ |
| 2914 | s->vm_was_running = true; |
| 2915 | /* Fallthrough */ |
| 2916 | case MIGRATION_STATUS_FAILED: |
| 2917 | case MIGRATION_STATUS_CANCELLED: |
Dr. David Alan Gilbert | 57225e5 | 2018-07-19 10:22:57 +0100 | [diff] [blame] | 2918 | case MIGRATION_STATUS_CANCELLING: |
Peter Xu | 199aa6d | 2018-01-03 20:20:15 +0800 | [diff] [blame] | 2919 | if (s->vm_was_running) { |
| 2920 | vm_start(); |
| 2921 | } else { |
| 2922 | if (runstate_check(RUN_STATE_FINISH_MIGRATE)) { |
| 2923 | runstate_set(RUN_STATE_POSTMIGRATE); |
| 2924 | } |
| 2925 | } |
| 2926 | break; |
| 2927 | |
| 2928 | default: |
| 2929 | /* Should not reach here, but if so, forgive the VM. */ |
| 2930 | error_report("%s: Unknown ending state %d", __func__, s->state); |
| 2931 | break; |
| 2932 | } |
| 2933 | qemu_bh_schedule(s->cleanup_bh); |
| 2934 | qemu_mutex_unlock_iothread(); |
| 2935 | } |
| 2936 | |
Dr. David Alan Gilbert | ad767be | 2018-06-13 11:26:41 +0100 | [diff] [blame] | 2937 | void migration_make_urgent_request(void) |
| 2938 | { |
| 2939 | qemu_sem_post(&migrate_get_current()->rate_limit_sem); |
| 2940 | } |
| 2941 | |
| 2942 | void migration_consume_urgent_request(void) |
| 2943 | { |
| 2944 | qemu_sem_wait(&migrate_get_current()->rate_limit_sem); |
| 2945 | } |
| 2946 | |
Dr. David Alan Gilbert | 70b2047 | 2015-11-05 18:10:49 +0000 | [diff] [blame] | 2947 | /* |
| 2948 | * Master migration thread on the source VM. |
| 2949 | * It drives the migration and pumps the data down the outgoing channel. |
| 2950 | */ |
Juan Quintela | 5f496a1 | 2013-02-22 17:36:30 +0100 | [diff] [blame] | 2951 | static void *migration_thread(void *opaque) |
Juan Quintela | 0d82d0e | 2012-10-03 14:18:33 +0200 | [diff] [blame] | 2952 | { |
Juan Quintela | 9848a40 | 2012-12-19 09:55:50 +0100 | [diff] [blame] | 2953 | MigrationState *s = opaque; |
Alex Bligh | bc72ad6 | 2013-08-21 16:03:08 +0100 | [diff] [blame] | 2954 | int64_t setup_start = qemu_clock_get_ms(QEMU_CLOCK_HOST); |
Peter Xu | b23c2ad | 2018-05-02 18:47:19 +0800 | [diff] [blame] | 2955 | MigThrError thr_error; |
Dr. David Alan Gilbert | ad767be | 2018-06-13 11:26:41 +0100 | [diff] [blame] | 2956 | bool urgent = false; |
Juan Quintela | 76f5933 | 2012-10-03 20:16:24 +0200 | [diff] [blame] | 2957 | |
Paolo Bonzini | ab28bd2 | 2015-07-09 08:55:38 +0200 | [diff] [blame] | 2958 | rcu_register_thread(); |
| 2959 | |
Peter Xu | b15df1a | 2018-01-03 20:20:13 +0800 | [diff] [blame] | 2960 | s->iteration_start_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME); |
| 2961 | |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 2962 | qemu_savevm_state_header(s->to_dst_file); |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2963 | |
Peter Xu | 62a0265 | 2017-06-14 15:55:58 +0800 | [diff] [blame] | 2964 | /* |
| 2965 | * If we opened the return path, we need to make sure dst has it |
| 2966 | * opened as well. |
| 2967 | */ |
| 2968 | if (s->rp_state.from_dst_file) { |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2969 | /* Now tell the dest that it should open its end so it can reply */ |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 2970 | qemu_savevm_send_open_return_path(s->to_dst_file); |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2971 | |
| 2972 | /* And do a ping that will make stuff easier to debug */ |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 2973 | qemu_savevm_send_ping(s->to_dst_file, 1); |
Peter Xu | 0425dc9 | 2017-05-31 18:35:34 +0800 | [diff] [blame] | 2974 | } |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2975 | |
Vladimir Sementsov-Ogievskiy | 58110f0 | 2017-07-10 19:30:16 +0300 | [diff] [blame] | 2976 | if (migrate_postcopy()) { |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2977 | /* |
| 2978 | * Tell the destination that we *might* want to do postcopy later; |
| 2979 | * if the other end can't do postcopy it should fail now, nice and |
| 2980 | * early. |
| 2981 | */ |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 2982 | qemu_savevm_send_postcopy_advise(s->to_dst_file); |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 2983 | } |
| 2984 | |
Juan Quintela | 9907e84 | 2017-06-28 11:52:24 +0200 | [diff] [blame] | 2985 | qemu_savevm_state_setup(s->to_dst_file); |
Juan Quintela | 0d82d0e | 2012-10-03 14:18:33 +0200 | [diff] [blame] | 2986 | |
Alex Bligh | bc72ad6 | 2013-08-21 16:03:08 +0100 | [diff] [blame] | 2987 | s->setup_time = qemu_clock_get_ms(QEMU_CLOCK_HOST) - setup_start; |
zhanghailiang | 48781e5 | 2015-12-16 11:47:33 +0000 | [diff] [blame] | 2988 | migrate_set_state(&s->state, MIGRATION_STATUS_SETUP, |
| 2989 | MIGRATION_STATUS_ACTIVE); |
Michael R. Hines | 29ae8a4 | 2013-07-22 10:01:57 -0400 | [diff] [blame] | 2990 | |
Dr. David Alan Gilbert | 9ec055a | 2015-11-05 18:10:58 +0000 | [diff] [blame] | 2991 | trace_migration_thread_setup_complete(); |
| 2992 | |
| 2993 | while (s->state == MIGRATION_STATUS_ACTIVE || |
| 2994 | s->state == MIGRATION_STATUS_POSTCOPY_ACTIVE) { |
Juan Quintela | a3e879c | 2013-02-01 12:39:08 +0100 | [diff] [blame] | 2995 | int64_t current_time; |
Juan Quintela | 0d82d0e | 2012-10-03 14:18:33 +0200 | [diff] [blame] | 2996 | |
Dr. David Alan Gilbert | ad767be | 2018-06-13 11:26:41 +0100 | [diff] [blame] | 2997 | if (urgent || !qemu_file_rate_limit(s->to_dst_file)) { |
Peter Xu | 2ad8730 | 2018-01-03 20:20:14 +0800 | [diff] [blame] | 2998 | MigIterateState iter_state = migration_iteration_run(s); |
| 2999 | if (iter_state == MIG_ITERATE_SKIP) { |
| 3000 | continue; |
| 3001 | } else if (iter_state == MIG_ITERATE_BREAK) { |
Dr. David Alan Gilbert | 09f6c85 | 2015-08-13 11:51:31 +0100 | [diff] [blame] | 3002 | break; |
Juan Quintela | c369f40 | 2012-10-03 20:33:34 +0200 | [diff] [blame] | 3003 | } |
| 3004 | } |
Paolo Bonzini | f4410a5 | 2013-02-22 17:36:20 +0100 | [diff] [blame] | 3005 | |
Peter Xu | b23c2ad | 2018-05-02 18:47:19 +0800 | [diff] [blame] | 3006 | /* |
| 3007 | * Try to detect any kind of failures, and see whether we |
| 3008 | * should stop the migration now. |
| 3009 | */ |
| 3010 | thr_error = migration_detect_error(s); |
| 3011 | if (thr_error == MIG_THR_ERR_FATAL) { |
| 3012 | /* Stop migration */ |
Paolo Bonzini | fd45ee2 | 2013-02-22 17:36:33 +0100 | [diff] [blame] | 3013 | break; |
Peter Xu | b23c2ad | 2018-05-02 18:47:19 +0800 | [diff] [blame] | 3014 | } else if (thr_error == MIG_THR_ERR_RECOVERED) { |
| 3015 | /* |
| 3016 | * Just recovered from a e.g. network failure, reset all |
| 3017 | * the local variables. This is important to avoid |
| 3018 | * breaking transferred_bytes and bandwidth calculation |
| 3019 | */ |
| 3020 | s->iteration_start_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME); |
| 3021 | s->iteration_initial_bytes = 0; |
Paolo Bonzini | fd45ee2 | 2013-02-22 17:36:33 +0100 | [diff] [blame] | 3022 | } |
Peter Xu | b15df1a | 2018-01-03 20:20:13 +0800 | [diff] [blame] | 3023 | |
Alex Bligh | bc72ad6 | 2013-08-21 16:03:08 +0100 | [diff] [blame] | 3024 | current_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME); |
Juan Quintela | 0d82d0e | 2012-10-03 14:18:33 +0200 | [diff] [blame] | 3025 | |
Peter Xu | b15df1a | 2018-01-03 20:20:13 +0800 | [diff] [blame] | 3026 | migration_update_counters(s, current_time); |
Michael R. Hines | 7e114f8 | 2013-06-25 21:35:30 -0400 | [diff] [blame] | 3027 | |
Dr. David Alan Gilbert | ad767be | 2018-06-13 11:26:41 +0100 | [diff] [blame] | 3028 | urgent = false; |
zhanghailiang | 89a02a9 | 2016-01-15 11:37:42 +0800 | [diff] [blame] | 3029 | if (qemu_file_rate_limit(s->to_dst_file)) { |
Dr. David Alan Gilbert | ad767be | 2018-06-13 11:26:41 +0100 | [diff] [blame] | 3030 | /* Wait for a delay to do rate limiting OR |
| 3031 | * something urgent to post the semaphore. |
| 3032 | */ |
| 3033 | int ms = s->iteration_start_time + BUFFER_DELAY - current_time; |
| 3034 | trace_migration_thread_ratelimit_pre(ms); |
| 3035 | if (qemu_sem_timedwait(&s->rate_limit_sem, ms) == 0) { |
| 3036 | /* We were worken by one or more urgent things but |
| 3037 | * the timedwait will have consumed one of them. |
| 3038 | * The service routine for the urgent wake will dec |
| 3039 | * the semaphore itself for each item it consumes, |
| 3040 | * so add this one we just eat back. |
| 3041 | */ |
| 3042 | qemu_sem_post(&s->rate_limit_sem); |
| 3043 | urgent = true; |
| 3044 | } |
| 3045 | trace_migration_thread_ratelimit_post(urgent); |
Juan Quintela | 0d82d0e | 2012-10-03 14:18:33 +0200 | [diff] [blame] | 3046 | } |
Paolo Bonzini | a3fa1d7 | 2013-02-22 17:36:18 +0100 | [diff] [blame] | 3047 | } |
| 3048 | |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 3049 | trace_migration_thread_after_loop(); |
Peter Xu | 199aa6d | 2018-01-03 20:20:15 +0800 | [diff] [blame] | 3050 | migration_iteration_finish(s); |
Paolo Bonzini | ab28bd2 | 2015-07-09 08:55:38 +0200 | [diff] [blame] | 3051 | rcu_unregister_thread(); |
Juan Quintela | 0d82d0e | 2012-10-03 14:18:33 +0200 | [diff] [blame] | 3052 | return NULL; |
| 3053 | } |
| 3054 | |
Dr. David Alan Gilbert | cce8040 | 2017-12-15 17:16:54 +0000 | [diff] [blame] | 3055 | void migrate_fd_connect(MigrationState *s, Error *error_in) |
Juan Quintela | 0d82d0e | 2012-10-03 14:18:33 +0200 | [diff] [blame] | 3056 | { |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 3057 | int64_t rate_limit; |
| 3058 | bool resume = s->state == MIGRATION_STATUS_POSTCOPY_PAUSED; |
| 3059 | |
Ashijeet Acharya | 2ff3025 | 2016-09-15 21:50:28 +0530 | [diff] [blame] | 3060 | s->expected_downtime = s->parameters.downtime_limit; |
Paolo Bonzini | bb1fadc | 2013-02-22 17:36:21 +0100 | [diff] [blame] | 3061 | s->cleanup_bh = qemu_bh_new(migrate_fd_cleanup, s); |
Dr. David Alan Gilbert | cce8040 | 2017-12-15 17:16:54 +0000 | [diff] [blame] | 3062 | if (error_in) { |
| 3063 | migrate_fd_error(s, error_in); |
| 3064 | migrate_fd_cleanup(s); |
| 3065 | return; |
| 3066 | } |
Juan Quintela | 0d82d0e | 2012-10-03 14:18:33 +0200 | [diff] [blame] | 3067 | |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 3068 | if (resume) { |
| 3069 | /* This is a resumed migration */ |
| 3070 | rate_limit = INT64_MAX; |
| 3071 | } else { |
| 3072 | /* This is a fresh new migration */ |
| 3073 | rate_limit = s->parameters.max_bandwidth / XFER_LIMIT_RATIO; |
Paolo Bonzini | 442773c | 2013-02-22 17:36:44 +0100 | [diff] [blame] | 3074 | |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 3075 | /* Notify before starting migration thread */ |
| 3076 | notifier_list_notify(&migration_state_notifiers, s); |
| 3077 | } |
| 3078 | |
| 3079 | qemu_file_set_rate_limit(s->to_dst_file, rate_limit); |
| 3080 | qemu_file_set_blocking(s->to_dst_file, true); |
Stefan Hajnoczi | 9287ac2 | 2013-07-29 15:01:57 +0200 | [diff] [blame] | 3081 | |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 3082 | /* |
Peter Xu | c788ada | 2017-06-26 18:28:55 +0800 | [diff] [blame] | 3083 | * Open the return path. For postcopy, it is used exclusively. For |
| 3084 | * precopy, only if user specified "return-path" capability would |
| 3085 | * QEMU uses the return path. |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 3086 | */ |
Peter Xu | c788ada | 2017-06-26 18:28:55 +0800 | [diff] [blame] | 3087 | if (migrate_postcopy_ram() || migrate_use_return_path()) { |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 3088 | if (open_return_path_on_source(s, !resume)) { |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 3089 | error_report("Unable to open return-path for postcopy"); |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 3090 | migrate_set_state(&s->state, s->state, MIGRATION_STATUS_FAILED); |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 3091 | migrate_fd_cleanup(s); |
| 3092 | return; |
| 3093 | } |
| 3094 | } |
| 3095 | |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 3096 | if (resume) { |
Peter Xu | 135b87b | 2018-05-02 18:47:25 +0800 | [diff] [blame] | 3097 | /* Wakeup the main migration thread to do the recovery */ |
| 3098 | migrate_set_state(&s->state, MIGRATION_STATUS_POSTCOPY_PAUSED, |
| 3099 | MIGRATION_STATUS_POSTCOPY_RECOVER); |
| 3100 | qemu_sem_post(&s->postcopy_pause_sem); |
Peter Xu | d3e35b8 | 2018-05-02 18:47:24 +0800 | [diff] [blame] | 3101 | return; |
| 3102 | } |
| 3103 | |
Juan Quintela | f986c3d | 2016-01-14 16:52:55 +0100 | [diff] [blame] | 3104 | if (multifd_save_setup() != 0) { |
| 3105 | migrate_set_state(&s->state, MIGRATION_STATUS_SETUP, |
| 3106 | MIGRATION_STATUS_FAILED); |
| 3107 | migrate_fd_cleanup(s); |
| 3108 | return; |
| 3109 | } |
Pankaj Gupta | 009fad7 | 2017-01-23 19:12:56 +0530 | [diff] [blame] | 3110 | qemu_thread_create(&s->thread, "live_migration", migration_thread, s, |
Paolo Bonzini | bb1fadc | 2013-02-22 17:36:21 +0100 | [diff] [blame] | 3111 | QEMU_THREAD_JOINABLE); |
Dr. David Alan Gilbert | 1d34e4b | 2015-11-05 18:11:05 +0000 | [diff] [blame] | 3112 | s->migration_thread_running = true; |
Juan Quintela | 0d82d0e | 2012-10-03 14:18:33 +0200 | [diff] [blame] | 3113 | } |
Dr. David Alan Gilbert | 093e3c4 | 2015-11-05 18:10:52 +0000 | [diff] [blame] | 3114 | |
Peter Xu | 9d18af9 | 2017-06-27 12:10:19 +0800 | [diff] [blame] | 3115 | void migration_global_dump(Monitor *mon) |
| 3116 | { |
| 3117 | MigrationState *ms = migrate_get_current(); |
| 3118 | |
Juan Quintela | 6f0f642 | 2017-10-26 11:49:57 +0200 | [diff] [blame] | 3119 | monitor_printf(mon, "globals:\n"); |
| 3120 | monitor_printf(mon, "store-global-state: %s\n", |
| 3121 | ms->store_global_state ? "on" : "off"); |
| 3122 | monitor_printf(mon, "only-migratable: %s\n", |
| 3123 | ms->only_migratable ? "on" : "off"); |
| 3124 | monitor_printf(mon, "send-configuration: %s\n", |
| 3125 | ms->send_configuration ? "on" : "off"); |
| 3126 | monitor_printf(mon, "send-section-footer: %s\n", |
| 3127 | ms->send_section_footer ? "on" : "off"); |
Xiao Guangrong | f548222 | 2018-05-03 16:06:11 +0800 | [diff] [blame] | 3128 | monitor_printf(mon, "decompress-error-check: %s\n", |
| 3129 | ms->decompress_error_check ? "on" : "off"); |
Peter Xu | 9d18af9 | 2017-06-27 12:10:19 +0800 | [diff] [blame] | 3130 | } |
| 3131 | |
/*
 * Declare a boolean property called @prop_name that is backed by slot
 * @cap of MigrationState.enabled_capabilities[] and defaults to false.
 */
#define DEFINE_PROP_MIG_CAP(prop_name, cap)             \
    DEFINE_PROP_BOOL(prop_name, MigrationState,         \
                     enabled_capabilities[cap], false)
| 3134 | |
Peter Xu | 5272298 | 2017-06-27 12:10:14 +0800 | [diff] [blame] | 3135 | static Property migration_properties[] = { |
| 3136 | DEFINE_PROP_BOOL("store-global-state", MigrationState, |
| 3137 | store_global_state, true), |
Peter Xu | 3df663e | 2017-06-27 12:10:15 +0800 | [diff] [blame] | 3138 | DEFINE_PROP_BOOL("only-migratable", MigrationState, only_migratable, false), |
Peter Xu | 71dd4c1 | 2017-06-27 12:10:16 +0800 | [diff] [blame] | 3139 | DEFINE_PROP_BOOL("send-configuration", MigrationState, |
| 3140 | send_configuration, true), |
Peter Xu | 15c3850 | 2017-06-27 12:10:17 +0800 | [diff] [blame] | 3141 | DEFINE_PROP_BOOL("send-section-footer", MigrationState, |
| 3142 | send_section_footer, true), |
Xiao Guangrong | f548222 | 2018-05-03 16:06:11 +0800 | [diff] [blame] | 3143 | DEFINE_PROP_BOOL("decompress-error-check", MigrationState, |
| 3144 | decompress_error_check, true), |
Peter Xu | 89632fa | 2017-07-18 11:39:02 +0800 | [diff] [blame] | 3145 | |
| 3146 | /* Migration parameters */ |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 3147 | DEFINE_PROP_UINT8("x-compress-level", MigrationState, |
Peter Xu | 89632fa | 2017-07-18 11:39:02 +0800 | [diff] [blame] | 3148 | parameters.compress_level, |
| 3149 | DEFAULT_MIGRATE_COMPRESS_LEVEL), |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 3150 | DEFINE_PROP_UINT8("x-compress-threads", MigrationState, |
Peter Xu | 89632fa | 2017-07-18 11:39:02 +0800 | [diff] [blame] | 3151 | parameters.compress_threads, |
| 3152 | DEFAULT_MIGRATE_COMPRESS_THREAD_COUNT), |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 3153 | DEFINE_PROP_UINT8("x-decompress-threads", MigrationState, |
Peter Xu | 89632fa | 2017-07-18 11:39:02 +0800 | [diff] [blame] | 3154 | parameters.decompress_threads, |
| 3155 | DEFAULT_MIGRATE_DECOMPRESS_THREAD_COUNT), |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 3156 | DEFINE_PROP_UINT8("x-cpu-throttle-initial", MigrationState, |
Peter Xu | 89632fa | 2017-07-18 11:39:02 +0800 | [diff] [blame] | 3157 | parameters.cpu_throttle_initial, |
| 3158 | DEFAULT_MIGRATE_CPU_THROTTLE_INITIAL), |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 3159 | DEFINE_PROP_UINT8("x-cpu-throttle-increment", MigrationState, |
Peter Xu | 89632fa | 2017-07-18 11:39:02 +0800 | [diff] [blame] | 3160 | parameters.cpu_throttle_increment, |
| 3161 | DEFAULT_MIGRATE_CPU_THROTTLE_INCREMENT), |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 3162 | DEFINE_PROP_SIZE("x-max-bandwidth", MigrationState, |
Peter Xu | 89632fa | 2017-07-18 11:39:02 +0800 | [diff] [blame] | 3163 | parameters.max_bandwidth, MAX_THROTTLE), |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 3164 | DEFINE_PROP_UINT64("x-downtime-limit", MigrationState, |
Peter Xu | 89632fa | 2017-07-18 11:39:02 +0800 | [diff] [blame] | 3165 | parameters.downtime_limit, |
| 3166 | DEFAULT_MIGRATE_SET_DOWNTIME), |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 3167 | DEFINE_PROP_UINT32("x-checkpoint-delay", MigrationState, |
Peter Xu | 89632fa | 2017-07-18 11:39:02 +0800 | [diff] [blame] | 3168 | parameters.x_checkpoint_delay, |
| 3169 | DEFAULT_MIGRATE_X_CHECKPOINT_DELAY), |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 3170 | DEFINE_PROP_UINT8("x-multifd-channels", MigrationState, |
Juan Quintela | 4075fb1 | 2016-01-15 08:56:17 +0100 | [diff] [blame] | 3171 | parameters.x_multifd_channels, |
| 3172 | DEFAULT_MIGRATE_MULTIFD_CHANNELS), |
Juan Quintela | 741d408 | 2017-12-01 13:08:38 +0100 | [diff] [blame] | 3173 | DEFINE_PROP_UINT32("x-multifd-page-count", MigrationState, |
Juan Quintela | 0fb8660 | 2017-04-27 10:48:25 +0200 | [diff] [blame] | 3174 | parameters.x_multifd_page_count, |
| 3175 | DEFAULT_MIGRATE_MULTIFD_PAGE_COUNT), |
Juan Quintela | 73af8dd | 2017-10-05 21:30:10 +0200 | [diff] [blame] | 3176 | DEFINE_PROP_SIZE("xbzrle-cache-size", MigrationState, |
| 3177 | parameters.xbzrle_cache_size, |
| 3178 | DEFAULT_MIGRATE_XBZRLE_CACHE_SIZE), |
Dr. David Alan Gilbert | 7e555c6 | 2018-06-13 11:26:40 +0100 | [diff] [blame] | 3179 | DEFINE_PROP_SIZE("max-postcopy-bandwidth", MigrationState, |
| 3180 | parameters.max_postcopy_bandwidth, |
| 3181 | DEFAULT_MIGRATE_MAX_POSTCOPY_BANDWIDTH), |
Li Qiang | 4cbc9c7 | 2018-08-01 06:00:20 -0700 | [diff] [blame] | 3182 | DEFINE_PROP_UINT8("max-cpu-throttle", MigrationState, |
| 3183 | parameters.max_cpu_throttle, |
| 3184 | DEFAULT_MIGRATE_MAX_CPU_THROTTLE), |
Peter Xu | 2081475 | 2017-07-18 11:39:03 +0800 | [diff] [blame] | 3185 | |
| 3186 | /* Migration capabilities */ |
| 3187 | DEFINE_PROP_MIG_CAP("x-xbzrle", MIGRATION_CAPABILITY_XBZRLE), |
| 3188 | DEFINE_PROP_MIG_CAP("x-rdma-pin-all", MIGRATION_CAPABILITY_RDMA_PIN_ALL), |
| 3189 | DEFINE_PROP_MIG_CAP("x-auto-converge", MIGRATION_CAPABILITY_AUTO_CONVERGE), |
| 3190 | DEFINE_PROP_MIG_CAP("x-zero-blocks", MIGRATION_CAPABILITY_ZERO_BLOCKS), |
| 3191 | DEFINE_PROP_MIG_CAP("x-compress", MIGRATION_CAPABILITY_COMPRESS), |
| 3192 | DEFINE_PROP_MIG_CAP("x-events", MIGRATION_CAPABILITY_EVENTS), |
| 3193 | DEFINE_PROP_MIG_CAP("x-postcopy-ram", MIGRATION_CAPABILITY_POSTCOPY_RAM), |
| 3194 | DEFINE_PROP_MIG_CAP("x-colo", MIGRATION_CAPABILITY_X_COLO), |
| 3195 | DEFINE_PROP_MIG_CAP("x-release-ram", MIGRATION_CAPABILITY_RELEASE_RAM), |
| 3196 | DEFINE_PROP_MIG_CAP("x-block", MIGRATION_CAPABILITY_BLOCK), |
| 3197 | DEFINE_PROP_MIG_CAP("x-return-path", MIGRATION_CAPABILITY_RETURN_PATH), |
Juan Quintela | 30126bb | 2016-01-14 12:23:00 +0100 | [diff] [blame] | 3198 | DEFINE_PROP_MIG_CAP("x-multifd", MIGRATION_CAPABILITY_X_MULTIFD), |
Peter Xu | 2081475 | 2017-07-18 11:39:03 +0800 | [diff] [blame] | 3199 | |
Peter Xu | 5272298 | 2017-06-27 12:10:14 +0800 | [diff] [blame] | 3200 | DEFINE_PROP_END_OF_LIST(), |
| 3201 | }; |
| 3202 | |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 3203 | static void migration_class_init(ObjectClass *klass, void *data) |
| 3204 | { |
| 3205 | DeviceClass *dc = DEVICE_CLASS(klass); |
| 3206 | |
| 3207 | dc->user_creatable = false; |
Peter Xu | 5272298 | 2017-06-27 12:10:14 +0800 | [diff] [blame] | 3208 | dc->props = migration_properties; |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 3209 | } |
| 3210 | |
Marc-André Lureau | b91bf5e | 2017-08-01 17:04:18 +0100 | [diff] [blame] | 3211 | static void migration_instance_finalize(Object *obj) |
| 3212 | { |
| 3213 | MigrationState *ms = MIGRATION_OBJ(obj); |
| 3214 | MigrationParameters *params = &ms->parameters; |
| 3215 | |
Juan Quintela | 87db1a7 | 2017-09-05 12:50:22 +0200 | [diff] [blame] | 3216 | qemu_mutex_destroy(&ms->error_mutex); |
Peter Xu | 62df066 | 2018-05-02 18:47:38 +0800 | [diff] [blame] | 3217 | qemu_mutex_destroy(&ms->qemu_file_lock); |
Marc-André Lureau | b91bf5e | 2017-08-01 17:04:18 +0100 | [diff] [blame] | 3218 | g_free(params->tls_hostname); |
| 3219 | g_free(params->tls_creds); |
Dr. David Alan Gilbert | ad767be | 2018-06-13 11:26:41 +0100 | [diff] [blame] | 3220 | qemu_sem_destroy(&ms->rate_limit_sem); |
Dr. David Alan Gilbert | e91d895 | 2017-10-20 10:05:52 +0100 | [diff] [blame] | 3221 | qemu_sem_destroy(&ms->pause_sem); |
Peter Xu | b23c2ad | 2018-05-02 18:47:19 +0800 | [diff] [blame] | 3222 | qemu_sem_destroy(&ms->postcopy_pause_sem); |
Peter Xu | 14b1742 | 2018-05-02 18:47:21 +0800 | [diff] [blame] | 3223 | qemu_sem_destroy(&ms->postcopy_pause_rp_sem); |
Peter Xu | edd090c | 2018-05-02 18:47:32 +0800 | [diff] [blame] | 3224 | qemu_sem_destroy(&ms->rp_state.rp_sem); |
Marc-André Lureau | ab105cc | 2018-03-06 18:09:59 +0100 | [diff] [blame] | 3225 | error_free(ms->error); |
Marc-André Lureau | b91bf5e | 2017-08-01 17:04:18 +0100 | [diff] [blame] | 3226 | } |
| 3227 | |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 3228 | static void migration_instance_init(Object *obj) |
| 3229 | { |
| 3230 | MigrationState *ms = MIGRATION_OBJ(obj); |
Peter Xu | 8b0b29d | 2017-07-18 11:39:06 +0800 | [diff] [blame] | 3231 | MigrationParameters *params = &ms->parameters; |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 3232 | |
| 3233 | ms->state = MIGRATION_STATUS_NONE; |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 3234 | ms->mbps = -1; |
Dr. David Alan Gilbert | e91d895 | 2017-10-20 10:05:52 +0100 | [diff] [blame] | 3235 | qemu_sem_init(&ms->pause_sem, 0); |
Juan Quintela | 87db1a7 | 2017-09-05 12:50:22 +0200 | [diff] [blame] | 3236 | qemu_mutex_init(&ms->error_mutex); |
Peter Xu | 8b0b29d | 2017-07-18 11:39:06 +0800 | [diff] [blame] | 3237 | |
| 3238 | params->tls_hostname = g_strdup(""); |
| 3239 | params->tls_creds = g_strdup(""); |
| 3240 | |
| 3241 | /* Set has_* up only for parameter checks */ |
| 3242 | params->has_compress_level = true; |
| 3243 | params->has_compress_threads = true; |
| 3244 | params->has_decompress_threads = true; |
| 3245 | params->has_cpu_throttle_initial = true; |
| 3246 | params->has_cpu_throttle_increment = true; |
| 3247 | params->has_max_bandwidth = true; |
| 3248 | params->has_downtime_limit = true; |
| 3249 | params->has_x_checkpoint_delay = true; |
| 3250 | params->has_block_incremental = true; |
Juan Quintela | 4075fb1 | 2016-01-15 08:56:17 +0100 | [diff] [blame] | 3251 | params->has_x_multifd_channels = true; |
Juan Quintela | 0fb8660 | 2017-04-27 10:48:25 +0200 | [diff] [blame] | 3252 | params->has_x_multifd_page_count = true; |
Juan Quintela | 73af8dd | 2017-10-05 21:30:10 +0200 | [diff] [blame] | 3253 | params->has_xbzrle_cache_size = true; |
Dr. David Alan Gilbert | 7e555c6 | 2018-06-13 11:26:40 +0100 | [diff] [blame] | 3254 | params->has_max_postcopy_bandwidth = true; |
Li Qiang | 4cbc9c7 | 2018-08-01 06:00:20 -0700 | [diff] [blame] | 3255 | params->has_max_cpu_throttle = true; |
Peter Xu | b23c2ad | 2018-05-02 18:47:19 +0800 | [diff] [blame] | 3256 | |
| 3257 | qemu_sem_init(&ms->postcopy_pause_sem, 0); |
Peter Xu | 14b1742 | 2018-05-02 18:47:21 +0800 | [diff] [blame] | 3258 | qemu_sem_init(&ms->postcopy_pause_rp_sem, 0); |
Peter Xu | edd090c | 2018-05-02 18:47:32 +0800 | [diff] [blame] | 3259 | qemu_sem_init(&ms->rp_state.rp_sem, 0); |
Dr. David Alan Gilbert | ad767be | 2018-06-13 11:26:41 +0100 | [diff] [blame] | 3260 | qemu_sem_init(&ms->rate_limit_sem, 0); |
Peter Xu | 62df066 | 2018-05-02 18:47:38 +0800 | [diff] [blame] | 3261 | qemu_mutex_init(&ms->qemu_file_lock); |
Peter Xu | 8b0b29d | 2017-07-18 11:39:06 +0800 | [diff] [blame] | 3262 | } |
| 3263 | |
| 3264 | /* |
| 3265 | * Return true if check pass, false otherwise. Error will be put |
| 3266 | * inside errp if provided. |
| 3267 | */ |
| 3268 | static bool migration_object_check(MigrationState *ms, Error **errp) |
| 3269 | { |
Peter Xu | 6b19a7d | 2017-07-18 11:39:10 +0800 | [diff] [blame] | 3270 | MigrationCapabilityStatusList *head = NULL; |
| 3271 | /* Assuming all off */ |
| 3272 | bool cap_list[MIGRATION_CAPABILITY__MAX] = { 0 }, ret; |
| 3273 | int i; |
| 3274 | |
Peter Xu | 8b0b29d | 2017-07-18 11:39:06 +0800 | [diff] [blame] | 3275 | if (!migrate_params_check(&ms->parameters, errp)) { |
| 3276 | return false; |
| 3277 | } |
| 3278 | |
Peter Xu | 6b19a7d | 2017-07-18 11:39:10 +0800 | [diff] [blame] | 3279 | for (i = 0; i < MIGRATION_CAPABILITY__MAX; i++) { |
| 3280 | if (ms->enabled_capabilities[i]) { |
| 3281 | head = migrate_cap_add(head, i, true); |
| 3282 | } |
| 3283 | } |
| 3284 | |
| 3285 | ret = migrate_caps_check(cap_list, head, errp); |
| 3286 | |
| 3287 | /* It works with head == NULL */ |
| 3288 | qapi_free_MigrationCapabilityStatusList(head); |
| 3289 | |
| 3290 | return ret; |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 3291 | } |
| 3292 | |
| 3293 | static const TypeInfo migration_type = { |
| 3294 | .name = TYPE_MIGRATION, |
Peter Xu | 01f6e14 | 2017-06-28 15:15:44 +0800 | [diff] [blame] | 3295 | /* |
Peter Xu | c8d3ff3 | 2017-07-05 16:21:23 +0800 | [diff] [blame] | 3296 | * NOTE: TYPE_MIGRATION is not really a device, as the object is |
| 3297 | * not created using qdev_create(), it is not attached to the qdev |
| 3298 | * device tree, and it is never realized. |
| 3299 | * |
| 3300 | * TODO: Make this TYPE_OBJECT once QOM provides something like |
| 3301 | * TYPE_DEVICE's "-global" properties. |
Peter Xu | 01f6e14 | 2017-06-28 15:15:44 +0800 | [diff] [blame] | 3302 | */ |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 3303 | .parent = TYPE_DEVICE, |
| 3304 | .class_init = migration_class_init, |
| 3305 | .class_size = sizeof(MigrationClass), |
| 3306 | .instance_size = sizeof(MigrationState), |
| 3307 | .instance_init = migration_instance_init, |
Marc-André Lureau | b91bf5e | 2017-08-01 17:04:18 +0100 | [diff] [blame] | 3308 | .instance_finalize = migration_instance_finalize, |
Peter Xu | e5cb7e7 | 2017-06-27 12:10:13 +0800 | [diff] [blame] | 3309 | }; |
| 3310 | |
| 3311 | static void register_migration_types(void) |
| 3312 | { |
| 3313 | type_register_static(&migration_type); |
| 3314 | } |
| 3315 | |
| 3316 | type_init(register_migration_types); |