blob: 8200ac6b754bd0dffd5bb3d2e5219188a91889a6 [file] [log] [blame]
Blue Swirl296af7c2010-03-29 19:23:50 +00001/*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24
25/* Needed early for CONFIG_BSD etc. */
Peter Maydell7b31bbc2016-01-26 18:16:56 +000026#include "qemu/osdep.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010027#include "qemu-common.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000028#include "qemu/config-file.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010029#include "cpu.h"
Paolo Bonzini83c90892012-12-17 18:19:49 +010030#include "monitor/monitor.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020031#include "qapi/qmp/qerror.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010032#include "qemu/error-report.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010033#include "sysemu/sysemu.h"
Max Reitzda31d592016-03-16 19:54:32 +010034#include "sysemu/block-backend.h"
Paolo Bonzini022c62c2012-12-17 18:19:49 +010035#include "exec/gdbstub.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010036#include "sysemu/dma.h"
Vincent Palatinb3946622017-01-10 11:59:55 +010037#include "sysemu/hw_accel.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010038#include "sysemu/kvm.h"
Vincent Palatinb0cb0a62017-01-10 11:59:57 +010039#include "sysemu/hax.h"
Luiz Capitulinode0b36b2011-09-21 16:38:35 -030040#include "qmp-commands.h"
Paolo Bonzini63c91552016-03-15 13:18:37 +010041#include "exec/exec-all.h"
Blue Swirl296af7c2010-03-29 19:23:50 +000042
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010043#include "qemu/thread.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010044#include "sysemu/cpus.h"
45#include "sysemu/qtest.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010046#include "qemu/main-loop.h"
47#include "qemu/bitmap.h"
Liu Ping Fancb365642013-09-25 14:20:58 +080048#include "qemu/seqlock.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000049#include "tcg.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020050#include "qapi-event.h"
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +100051#include "hw/nmi.h"
Pavel Dovgalyuk8b427042015-09-17 19:24:05 +030052#include "sysemu/replay.h"
Jan Kiszka0ff0fc12011-06-23 10:15:55 +020053
54#ifndef _WIN32
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010055#include "qemu/compatfd.h"
Jan Kiszka0ff0fc12011-06-23 10:15:55 +020056#endif
Blue Swirl296af7c2010-03-29 19:23:50 +000057
Jan Kiszka6d9cb732011-02-01 22:15:58 +010058#ifdef CONFIG_LINUX
59
60#include <sys/prctl.h>
61
Marcelo Tosattic0532a72010-10-11 15:31:21 -030062#ifndef PR_MCE_KILL
63#define PR_MCE_KILL 33
64#endif
65
Jan Kiszka6d9cb732011-02-01 22:15:58 +010066#ifndef PR_MCE_KILL_SET
67#define PR_MCE_KILL_SET 1
68#endif
69
70#ifndef PR_MCE_KILL_EARLY
71#define PR_MCE_KILL_EARLY 1
72#endif
73
74#endif /* CONFIG_LINUX */
75
/* NOTE(review): neither variable is referenced in the visible part of this
 * file; presumably they belong to the icount "align" support -- confirm
 * against their users.
 */
int64_t max_delay;
int64_t max_advance;

/* vcpu throttling controls */
/* Timer that runs cpu_throttle_timer_tick(); created in cpu_ticks_init(). */
static QEMUTimer *throttle_timer;
/* Current throttle percentage; 0 means throttling is off.  Accessed with
 * atomic_set()/atomic_read().
 */
static unsigned int throttle_percentage;

/* Bounds that cpu_throttle_set() clamps the requested percentage to. */
#define CPU_THROTTLE_PCT_MIN 1
#define CPU_THROTTLE_PCT_MAX 99
/* Length of one throttling timeslice, in nanoseconds (10 ms). */
#define CPU_THROTTLE_TIMESLICE_NS 10000000
86
Tiejun Chen321bc0b2013-08-02 09:43:09 +080087bool cpu_is_stopped(CPUState *cpu)
88{
89 return cpu->stopped || !runstate_is_running();
90}
91
Andreas Färbera98ae1d2013-05-26 23:21:08 +020092static bool cpu_thread_is_idle(CPUState *cpu)
Peter Maydellac873f12012-07-19 16:52:27 +010093{
Andreas Färberc64ca812012-05-03 02:11:45 +020094 if (cpu->stop || cpu->queued_work_first) {
Peter Maydellac873f12012-07-19 16:52:27 +010095 return false;
96 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +080097 if (cpu_is_stopped(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +010098 return true;
99 }
Andreas Färber8c2e1b02013-08-25 18:53:55 +0200100 if (!cpu->halted || cpu_has_work(cpu) ||
Alexander Graf215e79c2013-04-24 22:24:12 +0200101 kvm_halt_in_kernel()) {
Peter Maydellac873f12012-07-19 16:52:27 +0100102 return false;
103 }
104 return true;
105}
106
107static bool all_cpu_threads_idle(void)
108{
Andreas Färber182735e2013-05-29 22:29:20 +0200109 CPUState *cpu;
Peter Maydellac873f12012-07-19 16:52:27 +0100110
Andreas Färberbdc44642013-06-24 23:50:24 +0200111 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200112 if (!cpu_thread_is_idle(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +0100113 return false;
114 }
115 }
116 return true;
117}
118
Blue Swirl296af7c2010-03-29 19:23:50 +0000119/***********************************************************/
Paolo Bonzini946fb272011-09-12 13:57:37 +0200120/* guest cycle counter */
121
/* Protected by TimersState seqlock */

/* Taken from the "sleep" option in configure_icount(); when false,
 * qemu_start_warp_timer() advances the virtual clock immediately instead
 * of arming icount_warp_timer.
 */
static bool icount_sleep = true;
/* QEMU_CLOCK_VIRTUAL_RT value recorded when a warp was started, or -1
 * when no warp is pending.
 */
static int64_t vm_clock_warp_start = -1;
/* Conversion factor from emulated instructions to virtual clock ticks. */
static int icount_time_shift;
/* Arbitrarily pick 1MIPS as the minimum allowable speed. */
#define MAX_ICOUNT_SHIFT 10

/* Re-armed by icount_adjust_rt() on QEMU_CLOCK_VIRTUAL_RT. */
static QEMUTimer *icount_rt_timer;
/* Re-armed by icount_adjust_vm() on QEMU_CLOCK_VIRTUAL. */
static QEMUTimer *icount_vm_timer;
/* Created in configure_icount() with icount_timer_cb() as its callback. */
static QEMUTimer *icount_warp_timer;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200134
/* Host-tick, clock and instruction-counter bookkeeping.  The single
 * instance used by this file is timers_state.
 */
typedef struct TimersState {
    /* Protected by BQL. */
    int64_t cpu_ticks_prev;
    int64_t cpu_ticks_offset;

    /* cpu_clock_offset can be read out of BQL, so protect it with
     * this lock.
     */
    QemuSeqLock vm_clock_seqlock;
    int64_t cpu_clock_offset;
    /* Non-zero while the clocks run; toggled by cpu_enable_ticks() and
     * cpu_disable_ticks().
     */
    int32_t cpu_ticks_enabled;
    /* Only referenced by vmstate_timers in the visible part of this file. */
    int64_t dummy;

    /* Compensate for varying guest execution speed. */
    int64_t qemu_icount_bias;
    /* Only written by TCG thread */
    int64_t qemu_icount;
} TimersState;
153
/* Global timer state; its seqlock is initialised and the structure is
 * registered for migration in cpu_ticks_init().
 */
static TimersState timers_state;
/* Whether multi-threaded TCG is in use; assigned by qemu_tcg_configure(). */
bool mttcg_enabled;
156
157/*
158 * We default to false if we know other options have been enabled
159 * which are currently incompatible with MTTCG. Otherwise when each
160 * guest (target) has been updated to support:
161 * - atomic instructions
162 * - memory ordering primitives (barriers)
163 * they can set the appropriate CONFIG flags in ${target}-softmmu.mak
164 *
165 * Once a guest architecture has been converted to the new primitives
166 * there are two remaining limitations to check.
167 *
168 * - The guest can't be oversized (e.g. 64 bit guest on 32 bit host)
169 * - The host must have a stronger memory order than the guest
170 *
171 * It may be possible in future to support strong guests on weak hosts
172 * but that will require tagging all load/stores in a guest with their
173 * implicit memory order requirements which would likely slow things
174 * down a lot.
175 */
176
/* Return true when every memory-ordering guarantee the guest relies on
 * (TCG_GUEST_DEFAULT_MO) is also provided by the host
 * (TCG_TARGET_DEFAULT_MO).  If either macro is undefined the answer is
 * conservatively false.
 */
static bool check_tcg_memory_orders_compatible(void)
{
    bool compatible = false;

#if defined(TCG_GUEST_DEFAULT_MO) && defined(TCG_TARGET_DEFAULT_MO)
    /* No guest requirement may be missing from the host's set. */
    compatible = (TCG_GUEST_DEFAULT_MO & ~TCG_TARGET_DEFAULT_MO) == 0;
#endif
    return compatible;
}
185
186static bool default_mttcg_enabled(void)
187{
188 QemuOpts *icount_opts = qemu_find_opts_singleton("icount");
189 const char *rr = qemu_opt_get(icount_opts, "rr");
190
191 if (rr || TCG_OVERSIZED_GUEST) {
192 return false;
193 } else {
194#ifdef TARGET_SUPPORTS_MTTCG
195 return check_tcg_memory_orders_compatible();
196#else
197 return false;
198#endif
199 }
200}
201
202void qemu_tcg_configure(QemuOpts *opts, Error **errp)
203{
204 const char *t = qemu_opt_get(opts, "thread");
205 if (t) {
206 if (strcmp(t, "multi") == 0) {
207 if (TCG_OVERSIZED_GUEST) {
208 error_setg(errp, "No MTTCG when guest word size > hosts");
209 } else {
210 if (!check_tcg_memory_orders_compatible()) {
211 error_report("Guest expects a stronger memory ordering "
212 "than the host provides");
213 error_printf("This may cause strange/hard to debug errors");
214 }
215 mttcg_enabled = true;
216 }
217 } else if (strcmp(t, "single") == 0) {
218 mttcg_enabled = false;
219 } else {
220 error_setg(errp, "Invalid 'thread' setting %s", t);
221 }
222 } else {
223 mttcg_enabled = default_mttcg_enabled();
224 }
225}
Paolo Bonzini946fb272011-09-12 13:57:37 +0200226
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300227int64_t cpu_get_icount_raw(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200228{
229 int64_t icount;
Andreas Färber4917cf42013-05-27 05:17:50 +0200230 CPUState *cpu = current_cpu;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200231
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200232 icount = timers_state.qemu_icount;
Andreas Färber4917cf42013-05-27 05:17:50 +0200233 if (cpu) {
Paolo Bonzini414b15c2015-06-24 14:16:26 +0200234 if (!cpu->can_do_io) {
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300235 fprintf(stderr, "Bad icount read\n");
236 exit(1);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200237 }
Andreas Färber28ecfd72013-08-26 05:51:49 +0200238 icount -= (cpu->icount_decr.u16.low + cpu->icount_extra);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200239 }
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300240 return icount;
241}
242
243/* Return the virtual CPU time, based on the instruction counter. */
244static int64_t cpu_get_icount_locked(void)
245{
246 int64_t icount = cpu_get_icount_raw();
KONRAD Frederic3f031312014-08-01 01:37:15 +0200247 return timers_state.qemu_icount_bias + cpu_icount_to_ns(icount);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200248}
249
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200250int64_t cpu_get_icount(void)
251{
252 int64_t icount;
253 unsigned start;
254
255 do {
256 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
257 icount = cpu_get_icount_locked();
258 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
259
260 return icount;
261}
262
KONRAD Frederic3f031312014-08-01 01:37:15 +0200263int64_t cpu_icount_to_ns(int64_t icount)
264{
265 return icount << icount_time_shift;
266}
267
Cao jind90f3cc2016-07-29 19:05:38 +0800268/* return the time elapsed in VM between vm_start and vm_stop. Unless
269 * icount is active, cpu_get_ticks() uses units of the host CPU cycle
270 * counter.
271 *
272 * Caller must hold the BQL
273 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200274int64_t cpu_get_ticks(void)
275{
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100276 int64_t ticks;
277
Paolo Bonzini946fb272011-09-12 13:57:37 +0200278 if (use_icount) {
279 return cpu_get_icount();
280 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100281
282 ticks = timers_state.cpu_ticks_offset;
283 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400284 ticks += cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200285 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100286
287 if (timers_state.cpu_ticks_prev > ticks) {
288 /* Note: non increasing ticks may happen if the host uses
289 software suspend */
290 timers_state.cpu_ticks_offset += timers_state.cpu_ticks_prev - ticks;
291 ticks = timers_state.cpu_ticks_prev;
292 }
293
294 timers_state.cpu_ticks_prev = ticks;
295 return ticks;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200296}
297
Liu Ping Fancb365642013-09-25 14:20:58 +0800298static int64_t cpu_get_clock_locked(void)
299{
Cao jin1d45cea2016-07-29 19:05:37 +0800300 int64_t time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800301
Cao jin1d45cea2016-07-29 19:05:37 +0800302 time = timers_state.cpu_clock_offset;
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100303 if (timers_state.cpu_ticks_enabled) {
Cao jin1d45cea2016-07-29 19:05:37 +0800304 time += get_clock();
Liu Ping Fancb365642013-09-25 14:20:58 +0800305 }
306
Cao jin1d45cea2016-07-29 19:05:37 +0800307 return time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800308}
309
Cao jind90f3cc2016-07-29 19:05:38 +0800310/* Return the monotonic time elapsed in VM, i.e.,
Peter Maydell8212ff82016-09-15 10:24:22 +0100311 * the time between vm_start and vm_stop
312 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200313int64_t cpu_get_clock(void)
314{
315 int64_t ti;
Liu Ping Fancb365642013-09-25 14:20:58 +0800316 unsigned start;
317
318 do {
319 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
320 ti = cpu_get_clock_locked();
321 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
322
323 return ti;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200324}
325
Liu Ping Fancb365642013-09-25 14:20:58 +0800326/* enable cpu_get_ticks()
Cao jin3224e872016-07-08 18:31:37 +0800327 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800328 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200329void cpu_enable_ticks(void)
330{
Liu Ping Fancb365642013-09-25 14:20:58 +0800331 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400332 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200333 if (!timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400334 timers_state.cpu_ticks_offset -= cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200335 timers_state.cpu_clock_offset -= get_clock();
336 timers_state.cpu_ticks_enabled = 1;
337 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400338 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200339}
340
341/* disable cpu_get_ticks() : the clock is stopped. You must not call
Liu Ping Fancb365642013-09-25 14:20:58 +0800342 * cpu_get_ticks() after that.
Cao jin3224e872016-07-08 18:31:37 +0800343 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800344 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200345void cpu_disable_ticks(void)
346{
Liu Ping Fancb365642013-09-25 14:20:58 +0800347 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400348 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200349 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400350 timers_state.cpu_ticks_offset += cpu_get_host_ticks();
Liu Ping Fancb365642013-09-25 14:20:58 +0800351 timers_state.cpu_clock_offset = cpu_get_clock_locked();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200352 timers_state.cpu_ticks_enabled = 0;
353 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400354 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200355}
356
357/* Correlation between real and virtual time is always going to be
358 fairly approximate, so ignore small variation.
359 When the guest is idle real and virtual time will be aligned in
360 the IO wait loop. */
Rutuja Shah73bcb242016-03-21 21:32:30 +0530361#define ICOUNT_WOBBLE (NANOSECONDS_PER_SECOND / 10)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200362
363static void icount_adjust(void)
364{
365 int64_t cur_time;
366 int64_t cur_icount;
367 int64_t delta;
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200368
369 /* Protected by TimersState mutex. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200370 static int64_t last_delta;
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200371
Paolo Bonzini946fb272011-09-12 13:57:37 +0200372 /* If the VM is not running, then do nothing. */
373 if (!runstate_is_running()) {
374 return;
375 }
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200376
Emilio G. Cota03719e42016-06-08 14:55:21 -0400377 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200378 cur_time = cpu_get_clock_locked();
379 cur_icount = cpu_get_icount_locked();
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200380
Paolo Bonzini946fb272011-09-12 13:57:37 +0200381 delta = cur_icount - cur_time;
382 /* FIXME: This is a very crude algorithm, somewhat prone to oscillation. */
383 if (delta > 0
384 && last_delta + ICOUNT_WOBBLE < delta * 2
385 && icount_time_shift > 0) {
386 /* The guest is getting too far ahead. Slow time down. */
387 icount_time_shift--;
388 }
389 if (delta < 0
390 && last_delta - ICOUNT_WOBBLE > delta * 2
391 && icount_time_shift < MAX_ICOUNT_SHIFT) {
392 /* The guest is getting too far behind. Speed time up. */
393 icount_time_shift++;
394 }
395 last_delta = delta;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200396 timers_state.qemu_icount_bias = cur_icount
397 - (timers_state.qemu_icount << icount_time_shift);
Emilio G. Cota03719e42016-06-08 14:55:21 -0400398 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200399}
400
401static void icount_adjust_rt(void *opaque)
402{
Alex Bligh40daca52013-08-21 16:03:02 +0100403 timer_mod(icount_rt_timer,
Pavel Dovgalyuk1979b902015-01-12 15:00:43 +0300404 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200405 icount_adjust();
406}
407
408static void icount_adjust_vm(void *opaque)
409{
Alex Bligh40daca52013-08-21 16:03:02 +0100410 timer_mod(icount_vm_timer,
411 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530412 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200413 icount_adjust();
414}
415
416static int64_t qemu_icount_round(int64_t count)
417{
418 return (count + (1 << icount_time_shift) - 1) >> icount_time_shift;
419}
420
Pavel Dovgalyukefab87c2015-09-17 19:24:39 +0300421static void icount_warp_rt(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200422{
Alex Bennéeccffff42016-04-04 15:35:48 +0100423 unsigned seq;
424 int64_t warp_start;
425
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200426 /* The icount_warp_timer is rescheduled soon after vm_clock_warp_start
427 * changes from -1 to another value, so the race here is okay.
428 */
Alex Bennéeccffff42016-04-04 15:35:48 +0100429 do {
430 seq = seqlock_read_begin(&timers_state.vm_clock_seqlock);
431 warp_start = vm_clock_warp_start;
432 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, seq));
433
434 if (warp_start == -1) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200435 return;
436 }
437
Emilio G. Cota03719e42016-06-08 14:55:21 -0400438 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200439 if (runstate_is_running()) {
Pavel Dovgalyuk8eda2062015-09-17 19:24:28 +0300440 int64_t clock = REPLAY_CLOCK(REPLAY_CLOCK_VIRTUAL_RT,
441 cpu_get_clock_locked());
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200442 int64_t warp_delta;
443
444 warp_delta = clock - vm_clock_warp_start;
445 if (use_icount == 2) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200446 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100447 * In adaptive mode, do not let QEMU_CLOCK_VIRTUAL run too
Paolo Bonzini946fb272011-09-12 13:57:37 +0200448 * far ahead of real time.
449 */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200450 int64_t cur_icount = cpu_get_icount_locked();
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300451 int64_t delta = clock - cur_icount;
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200452 warp_delta = MIN(warp_delta, delta);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200453 }
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200454 timers_state.qemu_icount_bias += warp_delta;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200455 }
456 vm_clock_warp_start = -1;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400457 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200458
459 if (qemu_clock_expired(QEMU_CLOCK_VIRTUAL)) {
460 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
461 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200462}
463
/* Callback of icount_warp_timer; simply performs the warp accounting.
 * @opaque is unused.
 */
static void icount_timer_cb(void *opaque)
{
    /* No need for a checkpoint because the timer already synchronizes
     * with CHECKPOINT_CLOCK_VIRTUAL_RT.
     */
    (void)opaque;
    icount_warp_rt();
}
471
Paolo Bonzini8156be52012-03-28 15:42:04 +0200472void qtest_clock_warp(int64_t dest)
473{
Alex Bligh40daca52013-08-21 16:03:02 +0100474 int64_t clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800475 AioContext *aio_context;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200476 assert(qtest_enabled());
Fam Zhengefef88b2015-01-19 17:51:43 +0800477 aio_context = qemu_get_aio_context();
Paolo Bonzini8156be52012-03-28 15:42:04 +0200478 while (clock < dest) {
Alex Bligh40daca52013-08-21 16:03:02 +0100479 int64_t deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Sergey Fedorovc9299e22014-06-10 13:10:28 +0400480 int64_t warp = qemu_soonest_timeout(dest - clock, deadline);
Fam Zhengefef88b2015-01-19 17:51:43 +0800481
Emilio G. Cota03719e42016-06-08 14:55:21 -0400482 seqlock_write_begin(&timers_state.vm_clock_seqlock);
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200483 timers_state.qemu_icount_bias += warp;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400484 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200485
Alex Bligh40daca52013-08-21 16:03:02 +0100486 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800487 timerlist_run_timers(aio_context->tlg.tl[QEMU_CLOCK_VIRTUAL]);
Alex Bligh40daca52013-08-21 16:03:02 +0100488 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200489 }
Alex Bligh40daca52013-08-21 16:03:02 +0100490 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200491}
492
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300493void qemu_start_warp_timer(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200494{
Paolo Bonzinice78d182013-10-07 17:30:02 +0200495 int64_t clock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200496 int64_t deadline;
497
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300498 if (!use_icount) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200499 return;
500 }
501
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300502 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
503 * do not fire, so computing the deadline does not make sense.
504 */
505 if (!runstate_is_running()) {
506 return;
507 }
508
509 /* warp clock deterministically in record/replay mode */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300510 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_START)) {
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300511 return;
512 }
513
Paolo Bonzinice78d182013-10-07 17:30:02 +0200514 if (!all_cpu_threads_idle()) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200515 return;
516 }
517
Paolo Bonzini8156be52012-03-28 15:42:04 +0200518 if (qtest_enabled()) {
519 /* When testing, qtest commands advance icount. */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300520 return;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200521 }
522
Alex Blighac70aaf2013-08-21 16:02:57 +0100523 /* We want to use the earliest deadline from ALL vm_clocks */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300524 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT);
Alex Bligh40daca52013-08-21 16:03:02 +0100525 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200526 if (deadline < 0) {
Victor CLEMENTd7a0f712015-05-29 17:14:06 +0200527 static bool notified;
528 if (!icount_sleep && !notified) {
529 error_report("WARNING: icount sleep disabled and no active timers");
530 notified = true;
531 }
Paolo Bonzinice78d182013-10-07 17:30:02 +0200532 return;
Alex Blighac70aaf2013-08-21 16:02:57 +0100533 }
534
Paolo Bonzini946fb272011-09-12 13:57:37 +0200535 if (deadline > 0) {
536 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100537 * Ensure QEMU_CLOCK_VIRTUAL proceeds even when the virtual CPU goes to
Paolo Bonzini946fb272011-09-12 13:57:37 +0200538 * sleep. Otherwise, the CPU might be waiting for a future timer
539 * interrupt to wake it up, but the interrupt never comes because
540 * the vCPU isn't running any insns and thus doesn't advance the
Alex Bligh40daca52013-08-21 16:03:02 +0100541 * QEMU_CLOCK_VIRTUAL.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200542 */
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200543 if (!icount_sleep) {
544 /*
545 * We never let VCPUs sleep in no sleep icount mode.
546 * If there is a pending QEMU_CLOCK_VIRTUAL timer we just advance
547 * to the next QEMU_CLOCK_VIRTUAL event and notify it.
548 * It is useful when we want a deterministic execution time,
549 * isolated from host latencies.
550 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400551 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200552 timers_state.qemu_icount_bias += deadline;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400553 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200554 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
555 } else {
556 /*
557 * We do stop VCPUs and only advance QEMU_CLOCK_VIRTUAL after some
558 * "real" time, (related to the time left until the next event) has
559 * passed. The QEMU_CLOCK_VIRTUAL_RT clock will do this.
560 * This avoids that the warps are visible externally; for example,
561 * you will not be sending network packets continuously instead of
562 * every 100ms.
563 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400564 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200565 if (vm_clock_warp_start == -1 || vm_clock_warp_start > clock) {
566 vm_clock_warp_start = clock;
567 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400568 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200569 timer_mod_anticipate(icount_warp_timer, clock + deadline);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200570 }
Alex Blighac70aaf2013-08-21 16:02:57 +0100571 } else if (deadline == 0) {
Alex Bligh40daca52013-08-21 16:03:02 +0100572 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200573 }
574}
575
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300576static void qemu_account_warp_timer(void)
577{
578 if (!use_icount || !icount_sleep) {
579 return;
580 }
581
582 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
583 * do not fire, so computing the deadline does not make sense.
584 */
585 if (!runstate_is_running()) {
586 return;
587 }
588
589 /* warp clock deterministically in record/replay mode */
590 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_ACCOUNT)) {
591 return;
592 }
593
594 timer_del(icount_warp_timer);
595 icount_warp_rt();
596}
597
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200598static bool icount_state_needed(void *opaque)
599{
600 return use_icount;
601}
602
/*
 * This is a subsection for icount migration.  It carries the icount bias
 * and the instruction counter of TimersState, and is included only when
 * icount_state_needed() returns true.
 */
static const VMStateDescription icount_vmstate_timers = {
    .name = "timer/icount",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = icount_state_needed,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(qemu_icount_bias, TimersState),
        VMSTATE_INT64(qemu_icount, TimersState),
        VMSTATE_END_OF_LIST()
    }
};
617
/*
 * Migration description for TimersState; registered against timers_state
 * in cpu_ticks_init().  The icount state travels in a subsection.
 */
static const VMStateDescription vmstate_timers = {
    .name = "timer",
    .version_id = 2,
    .minimum_version_id = 1,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(cpu_ticks_offset, TimersState),
        VMSTATE_INT64(dummy, TimersState),
        /* Present from version 2 of this section onwards. */
        VMSTATE_INT64_V(cpu_clock_offset, TimersState, 2),
        VMSTATE_END_OF_LIST()
    },
    .subsections = (const VMStateDescription*[]) {
        &icount_vmstate_timers,
        NULL
    }
};
633
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100634static void cpu_throttle_thread(CPUState *cpu, run_on_cpu_data opaque)
Jason J. Herne2adcc852015-09-08 13:12:33 -0400635{
Jason J. Herne2adcc852015-09-08 13:12:33 -0400636 double pct;
637 double throttle_ratio;
638 long sleeptime_ns;
639
640 if (!cpu_throttle_get_percentage()) {
641 return;
642 }
643
644 pct = (double)cpu_throttle_get_percentage()/100;
645 throttle_ratio = pct / (1 - pct);
646 sleeptime_ns = (long)(throttle_ratio * CPU_THROTTLE_TIMESLICE_NS);
647
648 qemu_mutex_unlock_iothread();
649 atomic_set(&cpu->throttle_thread_scheduled, 0);
650 g_usleep(sleeptime_ns / 1000); /* Convert ns to us for usleep call */
651 qemu_mutex_lock_iothread();
652}
653
654static void cpu_throttle_timer_tick(void *opaque)
655{
656 CPUState *cpu;
657 double pct;
658
659 /* Stop the timer if needed */
660 if (!cpu_throttle_get_percentage()) {
661 return;
662 }
663 CPU_FOREACH(cpu) {
664 if (!atomic_xchg(&cpu->throttle_thread_scheduled, 1)) {
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100665 async_run_on_cpu(cpu, cpu_throttle_thread,
666 RUN_ON_CPU_NULL);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400667 }
668 }
669
670 pct = (double)cpu_throttle_get_percentage()/100;
671 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
672 CPU_THROTTLE_TIMESLICE_NS / (1-pct));
673}
674
675void cpu_throttle_set(int new_throttle_pct)
676{
677 /* Ensure throttle percentage is within valid range */
678 new_throttle_pct = MIN(new_throttle_pct, CPU_THROTTLE_PCT_MAX);
679 new_throttle_pct = MAX(new_throttle_pct, CPU_THROTTLE_PCT_MIN);
680
681 atomic_set(&throttle_percentage, new_throttle_pct);
682
683 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
684 CPU_THROTTLE_TIMESLICE_NS);
685}
686
687void cpu_throttle_stop(void)
688{
689 atomic_set(&throttle_percentage, 0);
690}
691
/* Return true while a non-zero throttle percentage is set. */
bool cpu_throttle_active(void)
{
    int percentage = cpu_throttle_get_percentage();

    return percentage != 0;
}
696
697int cpu_throttle_get_percentage(void)
698{
699 return atomic_read(&throttle_percentage);
700}
701
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400702void cpu_ticks_init(void)
703{
Emilio G. Cotaccdb3c12016-06-08 14:55:20 -0400704 seqlock_init(&timers_state.vm_clock_seqlock);
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400705 vmstate_register(NULL, 0, &vmstate_timers, &timers_state);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400706 throttle_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
707 cpu_throttle_timer_tick, NULL);
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400708}
709
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200710void configure_icount(QemuOpts *opts, Error **errp)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200711{
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200712 const char *option;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200713 char *rem_str = NULL;
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200714
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200715 option = qemu_opt_get(opts, "shift");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200716 if (!option) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200717 if (qemu_opt_get(opts, "align") != NULL) {
718 error_setg(errp, "Please specify shift option when using align");
719 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200720 return;
721 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200722
723 icount_sleep = qemu_opt_get_bool(opts, "sleep", true);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200724 if (icount_sleep) {
725 icount_warp_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300726 icount_timer_cb, NULL);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200727 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200728
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200729 icount_align_option = qemu_opt_get_bool(opts, "align", false);
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200730
731 if (icount_align_option && !icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500732 error_setg(errp, "align=on and sleep=off are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200733 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200734 if (strcmp(option, "auto") != 0) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200735 errno = 0;
736 icount_time_shift = strtol(option, &rem_str, 0);
737 if (errno != 0 || *rem_str != '\0' || !strlen(option)) {
738 error_setg(errp, "icount: Invalid shift value");
739 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200740 use_icount = 1;
741 return;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200742 } else if (icount_align_option) {
743 error_setg(errp, "shift=auto and align=on are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200744 } else if (!icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500745 error_setg(errp, "shift=auto and sleep=off are incompatible");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200746 }
747
748 use_icount = 2;
749
750 /* 125MIPS seems a reasonable initial guess at the guest speed.
751 It will be corrected fairly quickly anyway. */
752 icount_time_shift = 3;
753
754 /* Have both realtime and virtual time triggers for speed adjustment.
755 The realtime trigger catches emulated time passing too slowly,
756 the virtual time trigger catches emulated time passing too fast.
757 Realtime triggers occur even when idle, so use them less frequently
758 than VM triggers. */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300759 icount_rt_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL_RT,
760 icount_adjust_rt, NULL);
Alex Bligh40daca52013-08-21 16:03:02 +0100761 timer_mod(icount_rt_timer,
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300762 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Alex Bligh40daca52013-08-21 16:03:02 +0100763 icount_vm_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
764 icount_adjust_vm, NULL);
765 timer_mod(icount_vm_timer,
766 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530767 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200768}
769
770/***********************************************************/
/* TCG vCPU kick timer
 *
 * The kick timer is responsible for moving single threaded vCPU
 * emulation on to the next vCPU. If more than one vCPU is running, a
 * timer event will force a cpu->exit so the next vCPU can get
 * scheduled.
 *
 * The timer is removed if all vCPUs are idle and restarted again once
 * idleness is complete.
 */
781
/* Kick timer for round-robin TCG; NULL while no kick timer is installed. */
static QEMUTimer *tcg_kick_vcpu_timer;
/* vCPU the round-robin thread is currently executing, or NULL. */
static CPUState *tcg_current_rr_cpu;

/* Interval between kicks, in nanoseconds (a tenth of a second). */
#define TCG_KICK_PERIOD (NANOSECONDS_PER_SECOND / 10)
786
787static inline int64_t qemu_tcg_next_kick(void)
788{
789 return qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + TCG_KICK_PERIOD;
790}
791
Alex Bennée791158d2017-02-23 18:29:10 +0000792/* Kick the currently round-robin scheduled vCPU */
793static void qemu_cpu_kick_rr_cpu(void)
794{
795 CPUState *cpu;
Alex Bennée791158d2017-02-23 18:29:10 +0000796 do {
797 cpu = atomic_mb_read(&tcg_current_rr_cpu);
798 if (cpu) {
799 cpu_exit(cpu);
800 }
801 } while (cpu != atomic_mb_read(&tcg_current_rr_cpu));
802}
803
Alex Bennée65467062017-02-23 18:29:09 +0000804static void kick_tcg_thread(void *opaque)
805{
806 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
Alex Bennée791158d2017-02-23 18:29:10 +0000807 qemu_cpu_kick_rr_cpu();
Alex Bennée65467062017-02-23 18:29:09 +0000808}
809
810static void start_tcg_kick_timer(void)
811{
Alex Bennée37257942017-02-23 18:29:14 +0000812 if (!mttcg_enabled && !tcg_kick_vcpu_timer && CPU_NEXT(first_cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +0000813 tcg_kick_vcpu_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
814 kick_tcg_thread, NULL);
815 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
816 }
817}
818
819static void stop_tcg_kick_timer(void)
820{
821 if (tcg_kick_vcpu_timer) {
822 timer_del(tcg_kick_vcpu_timer);
823 tcg_kick_vcpu_timer = NULL;
824 }
825}
826
Alex Bennée65467062017-02-23 18:29:09 +0000827/***********************************************************/
Blue Swirl296af7c2010-03-29 19:23:50 +0000828void hw_error(const char *fmt, ...)
829{
830 va_list ap;
Andreas Färber55e5c282012-12-17 06:18:02 +0100831 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000832
833 va_start(ap, fmt);
834 fprintf(stderr, "qemu: hardware error: ");
835 vfprintf(stderr, fmt, ap);
836 fprintf(stderr, "\n");
Andreas Färberbdc44642013-06-24 23:50:24 +0200837 CPU_FOREACH(cpu) {
Andreas Färber55e5c282012-12-17 06:18:02 +0100838 fprintf(stderr, "CPU #%d:\n", cpu->cpu_index);
Andreas Färber878096e2013-05-27 01:33:50 +0200839 cpu_dump_state(cpu, stderr, fprintf, CPU_DUMP_FPU);
Blue Swirl296af7c2010-03-29 19:23:50 +0000840 }
841 va_end(ap);
842 abort();
843}
844
845void cpu_synchronize_all_states(void)
846{
Andreas Färber182735e2013-05-29 22:29:20 +0200847 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000848
Andreas Färberbdc44642013-06-24 23:50:24 +0200849 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200850 cpu_synchronize_state(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000851 }
852}
853
854void cpu_synchronize_all_post_reset(void)
855{
Andreas Färber182735e2013-05-29 22:29:20 +0200856 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000857
Andreas Färberbdc44642013-06-24 23:50:24 +0200858 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200859 cpu_synchronize_post_reset(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000860 }
861}
862
863void cpu_synchronize_all_post_init(void)
864{
Andreas Färber182735e2013-05-29 22:29:20 +0200865 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000866
Andreas Färberbdc44642013-06-24 23:50:24 +0200867 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200868 cpu_synchronize_post_init(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000869 }
870}
871
Kevin Wolf56983462013-07-05 13:49:54 +0200872static int do_vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +0000873{
Kevin Wolf56983462013-07-05 13:49:54 +0200874 int ret = 0;
875
Luiz Capitulino13548692011-07-29 15:36:43 -0300876 if (runstate_is_running()) {
Blue Swirl296af7c2010-03-29 19:23:50 +0000877 cpu_disable_ticks();
Blue Swirl296af7c2010-03-29 19:23:50 +0000878 pause_all_vcpus();
Luiz Capitulinof5bbfba2011-07-29 15:04:45 -0300879 runstate_set(state);
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -0300880 vm_state_notify(0, state);
Wenchao Xiaa4e15de2014-06-18 08:43:36 +0200881 qapi_event_send_stop(&error_abort);
Blue Swirl296af7c2010-03-29 19:23:50 +0000882 }
Kevin Wolf56983462013-07-05 13:49:54 +0200883
Kevin Wolf594a45c2013-07-18 14:52:19 +0200884 bdrv_drain_all();
Pavel Dovgalyuk6d0ceb82016-09-26 11:08:16 +0300885 replay_disable_events();
John Snow22af08e2016-09-22 21:45:51 -0400886 ret = bdrv_flush_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +0200887
Kevin Wolf56983462013-07-05 13:49:54 +0200888 return ret;
Blue Swirl296af7c2010-03-29 19:23:50 +0000889}
890
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200891static bool cpu_can_run(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +0000892{
Andreas Färber4fdeee72012-05-02 23:10:09 +0200893 if (cpu->stop) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200894 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100895 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +0800896 if (cpu_is_stopped(cpu)) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200897 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100898 }
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200899 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +0000900}
901
Andreas Färber91325042013-05-27 02:07:49 +0200902static void cpu_handle_guest_debug(CPUState *cpu)
Jan Kiszka3c638d02010-06-25 16:56:56 +0200903{
Andreas Färber64f6b342013-05-27 02:06:09 +0200904 gdb_set_stop_cpu(cpu);
Jan Kiszka8cf71712011-02-07 12:19:16 +0100905 qemu_system_debug_request();
Andreas Färberf324e762012-05-02 23:26:21 +0200906 cpu->stopped = true;
Jan Kiszka3c638d02010-06-25 16:56:56 +0200907}
908
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100909#ifdef CONFIG_LINUX
910static void sigbus_reraise(void)
911{
912 sigset_t set;
913 struct sigaction action;
914
915 memset(&action, 0, sizeof(action));
916 action.sa_handler = SIG_DFL;
917 if (!sigaction(SIGBUS, &action, NULL)) {
918 raise(SIGBUS);
919 sigemptyset(&set);
920 sigaddset(&set, SIGBUS);
Peter Maydella2d17612016-05-16 18:33:59 +0100921 pthread_sigmask(SIG_UNBLOCK, &set, NULL);
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100922 }
923 perror("Failed to re-raise SIGBUS!\n");
924 abort();
925}
926
927static void sigbus_handler(int n, struct qemu_signalfd_siginfo *siginfo,
928 void *ctx)
929{
930 if (kvm_on_sigbus(siginfo->ssi_code,
931 (void *)(intptr_t)siginfo->ssi_addr)) {
932 sigbus_reraise();
933 }
934}
935
936static void qemu_init_sigbus(void)
937{
938 struct sigaction action;
939
940 memset(&action, 0, sizeof(action));
941 action.sa_flags = SA_SIGINFO;
942 action.sa_sigaction = (void (*)(int, siginfo_t*, void*))sigbus_handler;
943 sigaction(SIGBUS, &action, NULL);
944
945 prctl(PR_MCE_KILL, PR_MCE_KILL_SET, PR_MCE_KILL_EARLY, 0, 0);
946}
947
Andreas Färber290adf32013-01-17 09:30:27 +0100948static void qemu_kvm_eat_signals(CPUState *cpu)
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100949{
950 struct timespec ts = { 0, 0 };
951 siginfo_t siginfo;
952 sigset_t waitset;
953 sigset_t chkset;
954 int r;
955
956 sigemptyset(&waitset);
957 sigaddset(&waitset, SIG_IPI);
958 sigaddset(&waitset, SIGBUS);
959
960 do {
961 r = sigtimedwait(&waitset, &siginfo, &ts);
962 if (r == -1 && !(errno == EAGAIN || errno == EINTR)) {
963 perror("sigtimedwait");
964 exit(1);
965 }
966
967 switch (r) {
968 case SIGBUS:
Andreas Färber290adf32013-01-17 09:30:27 +0100969 if (kvm_on_sigbus_vcpu(cpu, siginfo.si_code, siginfo.si_addr)) {
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100970 sigbus_reraise();
971 }
972 break;
973 default:
974 break;
975 }
976
977 r = sigpending(&chkset);
978 if (r == -1) {
979 perror("sigpending");
980 exit(1);
981 }
982 } while (sigismember(&chkset, SIG_IPI) || sigismember(&chkset, SIGBUS));
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100983}
984
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100985#else /* !CONFIG_LINUX */
986
/* Non-Linux build: no SIGBUS handling is set up. */
static void qemu_init_sigbus(void)
{
    /* intentionally empty */
}
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100990
Andreas Färber290adf32013-01-17 09:30:27 +0100991static void qemu_kvm_eat_signals(CPUState *cpu)
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100992{
993}
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100994#endif /* !CONFIG_LINUX */
995
Blue Swirl296af7c2010-03-29 19:23:50 +0000996#ifndef _WIN32
/* No-op signal handler; installed for SIG_IPI. */
static void dummy_signal(int sig)
{
    /* intentionally empty */
}
1000
Andreas Färber13618e02013-05-26 23:41:00 +02001001static void qemu_kvm_init_cpu_signals(CPUState *cpu)
Paolo Bonzini714bd042011-03-12 17:44:06 +01001002{
1003 int r;
1004 sigset_t set;
1005 struct sigaction sigact;
1006
1007 memset(&sigact, 0, sizeof(sigact));
1008 sigact.sa_handler = dummy_signal;
1009 sigaction(SIG_IPI, &sigact, NULL);
1010
Paolo Bonzini714bd042011-03-12 17:44:06 +01001011 pthread_sigmask(SIG_BLOCK, NULL, &set);
1012 sigdelset(&set, SIG_IPI);
1013 sigdelset(&set, SIGBUS);
Andreas Färber491d6e82013-05-26 23:38:10 +02001014 r = kvm_set_signal_mask(cpu, &set);
Paolo Bonzini714bd042011-03-12 17:44:06 +01001015 if (r) {
1016 fprintf(stderr, "kvm_set_signal_mask: %s\n", strerror(-r));
1017 exit(1);
1018 }
Paolo Bonzini714bd042011-03-12 17:44:06 +01001019}
1020
Jan Kiszka55f8d6a2011-02-01 22:15:52 +01001021#else /* _WIN32 */
Andreas Färber13618e02013-05-26 23:41:00 +02001022static void qemu_kvm_init_cpu_signals(CPUState *cpu)
Paolo Bonzini714bd042011-03-12 17:44:06 +01001023{
1024 abort();
1025}
Jan Kiszka55f8d6a2011-02-01 22:15:52 +01001026#endif /* _WIN32 */
Blue Swirl296af7c2010-03-29 19:23:50 +00001027
/* Global mutex; vCPU threads pass it to qemu_cond_wait() when sleeping. */
static QemuMutex qemu_global_mutex;

/* Thread that called qemu_init_cpu_loop(). */
static QemuThread io_thread;

/* cpu creation: signalled whenever a vCPU's ->created flag changes */
static QemuCond qemu_cpu_cond;
/* system init; also broadcast when a vCPU acknowledges a stop request */
static QemuCond qemu_pause_cond;
1036
Paolo Bonzinid3b12f52011-09-13 10:30:52 +02001037void qemu_init_cpu_loop(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001038{
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001039 qemu_init_sigbus();
Anthony Liguoried945922011-02-08 18:18:18 +01001040 qemu_cond_init(&qemu_cpu_cond);
Anthony Liguoried945922011-02-08 18:18:18 +01001041 qemu_cond_init(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001042 qemu_mutex_init(&qemu_global_mutex);
Blue Swirl296af7c2010-03-29 19:23:50 +00001043
Jan Kiszkab7680cb2011-03-12 17:43:51 +01001044 qemu_thread_get_self(&io_thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001045}
1046
Paolo Bonzini14e6fe12016-10-31 10:36:08 +01001047void run_on_cpu(CPUState *cpu, run_on_cpu_func func, run_on_cpu_data data)
Marcelo Tosattie82bcec2010-05-04 09:45:22 -03001048{
Sergey Fedorovd148d902016-08-29 09:51:00 +02001049 do_run_on_cpu(cpu, func, data, &qemu_global_mutex);
Chegu Vinod3c022702013-06-24 03:49:41 -06001050}
1051
Gu Zheng4c055ab2016-05-12 09:18:13 +05301052static void qemu_kvm_destroy_vcpu(CPUState *cpu)
1053{
1054 if (kvm_destroy_vcpu(cpu) < 0) {
1055 error_report("kvm_destroy_vcpu failed");
1056 exit(EXIT_FAILURE);
1057 }
1058}
1059
1060static void qemu_tcg_destroy_vcpu(CPUState *cpu)
1061{
1062}
1063
Andreas Färber509a0d72012-05-03 02:18:09 +02001064static void qemu_wait_io_event_common(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001065{
Alex Bennée37257942017-02-23 18:29:14 +00001066 atomic_mb_set(&cpu->thread_kicked, false);
Andreas Färber4fdeee72012-05-02 23:10:09 +02001067 if (cpu->stop) {
1068 cpu->stop = false;
Andreas Färberf324e762012-05-02 23:26:21 +02001069 cpu->stopped = true;
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001070 qemu_cond_broadcast(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001071 }
Sergey Fedorova5403c62016-08-02 18:27:36 +01001072 process_queued_cpu_work(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001073}
1074
1075static bool qemu_tcg_should_sleep(CPUState *cpu)
1076{
1077 if (mttcg_enabled) {
1078 return cpu_thread_is_idle(cpu);
1079 } else {
1080 return all_cpu_threads_idle();
1081 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001082}
1083
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001084static void qemu_tcg_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001085{
Alex Bennée37257942017-02-23 18:29:14 +00001086 while (qemu_tcg_should_sleep(cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +00001087 stop_tcg_kick_timer();
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001088 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001089 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001090
Alex Bennée65467062017-02-23 18:29:09 +00001091 start_tcg_kick_timer();
1092
Alex Bennée37257942017-02-23 18:29:14 +00001093 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001094}
1095
Andreas Färberfd529e82013-05-26 23:24:55 +02001096static void qemu_kvm_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001097{
Andreas Färbera98ae1d2013-05-26 23:21:08 +02001098 while (cpu_thread_is_idle(cpu)) {
Andreas Färberf5c121b2012-05-03 01:22:49 +02001099 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001100 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001101
Andreas Färber290adf32013-01-17 09:30:27 +01001102 qemu_kvm_eat_signals(cpu);
Andreas Färber509a0d72012-05-03 02:18:09 +02001103 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001104}
1105
Jan Kiszka7e97cd82011-02-07 12:19:12 +01001106static void *qemu_kvm_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001107{
Andreas Färber48a106b2013-05-27 02:20:39 +02001108 CPUState *cpu = arg;
Jan Kiszka84b49152011-02-01 22:15:50 +01001109 int r;
Blue Swirl296af7c2010-03-29 19:23:50 +00001110
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001111 rcu_register_thread();
1112
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001113 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001114 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001115 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001116 cpu->can_do_io = 1;
Andreas Färber4917cf42013-05-27 05:17:50 +02001117 current_cpu = cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001118
Andreas Färber504134d2012-12-17 06:38:45 +01001119 r = kvm_init_vcpu(cpu);
Jan Kiszka84b49152011-02-01 22:15:50 +01001120 if (r < 0) {
1121 fprintf(stderr, "kvm_init_vcpu failed: %s\n", strerror(-r));
1122 exit(1);
1123 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001124
Andreas Färber13618e02013-05-26 23:41:00 +02001125 qemu_kvm_init_cpu_signals(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001126
1127 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001128 cpu->created = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001129 qemu_cond_signal(&qemu_cpu_cond);
1130
Gu Zheng4c055ab2016-05-12 09:18:13 +05301131 do {
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001132 if (cpu_can_run(cpu)) {
Andreas Färber1458c362013-05-26 23:46:55 +02001133 r = kvm_cpu_exec(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001134 if (r == EXCP_DEBUG) {
Andreas Färber91325042013-05-27 02:07:49 +02001135 cpu_handle_guest_debug(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001136 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001137 }
Andreas Färberfd529e82013-05-26 23:24:55 +02001138 qemu_kvm_wait_io_event(cpu);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301139 } while (!cpu->unplug || cpu_can_run(cpu));
Blue Swirl296af7c2010-03-29 19:23:50 +00001140
Gu Zheng4c055ab2016-05-12 09:18:13 +05301141 qemu_kvm_destroy_vcpu(cpu);
Bharata B Rao2c579042016-05-12 09:18:14 +05301142 cpu->created = false;
1143 qemu_cond_signal(&qemu_cpu_cond);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301144 qemu_mutex_unlock_iothread();
Blue Swirl296af7c2010-03-29 19:23:50 +00001145 return NULL;
1146}
1147
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001148static void *qemu_dummy_cpu_thread_fn(void *arg)
1149{
1150#ifdef _WIN32
1151 fprintf(stderr, "qtest is not supported under Windows\n");
1152 exit(1);
1153#else
Andreas Färber10a90212013-05-27 02:24:35 +02001154 CPUState *cpu = arg;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001155 sigset_t waitset;
1156 int r;
1157
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001158 rcu_register_thread();
1159
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001160 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001161 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001162 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001163 cpu->can_do_io = 1;
Alex Bennée37257942017-02-23 18:29:14 +00001164 current_cpu = cpu;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001165
1166 sigemptyset(&waitset);
1167 sigaddset(&waitset, SIG_IPI);
1168
1169 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001170 cpu->created = true;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001171 qemu_cond_signal(&qemu_cpu_cond);
1172
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001173 while (1) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001174 qemu_mutex_unlock_iothread();
1175 do {
1176 int sig;
1177 r = sigwait(&waitset, &sig);
1178 } while (r == -1 && (errno == EAGAIN || errno == EINTR));
1179 if (r == -1) {
1180 perror("sigwait");
1181 exit(1);
1182 }
1183 qemu_mutex_lock_iothread();
Andreas Färber509a0d72012-05-03 02:18:09 +02001184 qemu_wait_io_event_common(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001185 }
1186
1187 return NULL;
1188#endif
1189}
1190
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001191static int64_t tcg_get_icount_limit(void)
1192{
1193 int64_t deadline;
1194
1195 if (replay_mode != REPLAY_MODE_PLAY) {
1196 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1197
1198 /* Maintain prior (possibly buggy) behaviour where if no deadline
1199 * was set (as there is no QEMU_CLOCK_VIRTUAL timer) or it is more than
1200 * INT32_MAX nanoseconds ahead, we still use INT32_MAX
1201 * nanoseconds.
1202 */
1203 if ((deadline < 0) || (deadline > INT32_MAX)) {
1204 deadline = INT32_MAX;
1205 }
1206
1207 return qemu_icount_round(deadline);
1208 } else {
1209 return replay_get_instructions();
1210 }
1211}
1212
Alex Bennée12e97002016-10-27 16:10:14 +01001213static void handle_icount_deadline(void)
1214{
1215 if (use_icount) {
1216 int64_t deadline =
1217 qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1218
1219 if (deadline == 0) {
1220 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
1221 }
1222 }
1223}
1224
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001225static int tcg_cpu_exec(CPUState *cpu)
1226{
1227 int ret;
1228#ifdef CONFIG_PROFILER
1229 int64_t ti;
1230#endif
1231
1232#ifdef CONFIG_PROFILER
1233 ti = profile_getclock();
1234#endif
1235 if (use_icount) {
1236 int64_t count;
1237 int decr;
1238 timers_state.qemu_icount -= (cpu->icount_decr.u16.low
1239 + cpu->icount_extra);
1240 cpu->icount_decr.u16.low = 0;
1241 cpu->icount_extra = 0;
1242 count = tcg_get_icount_limit();
1243 timers_state.qemu_icount += count;
1244 decr = (count > 0xffff) ? 0xffff : count;
1245 count -= decr;
1246 cpu->icount_decr.u16.low = decr;
1247 cpu->icount_extra = count;
1248 }
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001249 qemu_mutex_unlock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001250 cpu_exec_start(cpu);
1251 ret = cpu_exec(cpu);
1252 cpu_exec_end(cpu);
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001253 qemu_mutex_lock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001254#ifdef CONFIG_PROFILER
1255 tcg_time += profile_getclock() - ti;
1256#endif
1257 if (use_icount) {
1258 /* Fold pending instructions back into the
1259 instruction counter, and clear the interrupt flag. */
1260 timers_state.qemu_icount -= (cpu->icount_decr.u16.low
1261 + cpu->icount_extra);
1262 cpu->icount_decr.u32 = 0;
1263 cpu->icount_extra = 0;
1264 replay_account_executed_instructions();
1265 }
1266 return ret;
1267}
1268
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001269/* Destroy any remaining vCPUs which have been unplugged and have
1270 * finished running
1271 */
1272static void deal_with_unplugged_cpus(void)
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001273{
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001274 CPUState *cpu;
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001275
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001276 CPU_FOREACH(cpu) {
1277 if (cpu->unplug && !cpu_can_run(cpu)) {
1278 qemu_tcg_destroy_vcpu(cpu);
1279 cpu->created = false;
1280 qemu_cond_signal(&qemu_cpu_cond);
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001281 break;
1282 }
1283 }
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001284}
Jan Kiszkabdb7ca62011-09-26 09:40:39 +02001285
Alex Bennée65467062017-02-23 18:29:09 +00001286/* Single-threaded TCG
1287 *
1288 * In the single-threaded case each vCPU is simulated in turn. If
1289 * there is more than a single vCPU we create a simple timer to kick
1290 * the vCPU and ensure we don't get stuck in a tight loop in one vCPU.
1291 * This is done explicitly rather than relying on side-effects
1292 * elsewhere.
1293 */
1294
/*
 * Thread entry point for single-threaded (round-robin) TCG.
 *
 * @arg: the CPUState whose ->thread field identifies this thread.
 *
 * One thread executes all vCPUs in turn.  After marking every vCPU as
 * created it waits until first_cpu is no longer stopped, then loops
 * forever: run vCPUs one after another until one has queued work, an
 * exit request, a debug/atomic exception or a stop request, then wait
 * for I/O events and reap unplugged vCPUs.
 *
 * Returns: NULL (the main loop never terminates).
 */
static void *qemu_tcg_rr_cpu_thread_fn(void *arg)
{
    CPUState *cpu = arg;

    rcu_register_thread();

    qemu_mutex_lock_iothread();
    qemu_thread_get_self(cpu->thread);

    /* This single thread serves every vCPU; note that the loop reuses
     * (and so overwrites) the 'cpu' variable.
     */
    CPU_FOREACH(cpu) {
        cpu->thread_id = qemu_get_thread_id();
        cpu->created = true;
        cpu->can_do_io = 1;
    }
    qemu_cond_signal(&qemu_cpu_cond);

    /* wait for initial kick-off after machine start */
    while (first_cpu->stopped) {
        qemu_cond_wait(first_cpu->halt_cond, &qemu_global_mutex);

        /* process any pending work */
        CPU_FOREACH(cpu) {
            current_cpu = cpu;
            qemu_wait_io_event_common(cpu);
        }
    }

    start_tcg_kick_timer();

    cpu = first_cpu;

    /* process any pending work */
    cpu->exit_request = 1;

    while (1) {
        /* Account partial waits to QEMU_CLOCK_VIRTUAL. */
        qemu_account_warp_timer();

        /* Wrap around to the first vCPU after the last one */
        if (!cpu) {
            cpu = first_cpu;
        }

        while (cpu && !cpu->queued_work_first && !cpu->exit_request) {

            /* Publish the running vCPU so qemu_cpu_kick_rr_cpu() can
             * find it.
             */
            atomic_mb_set(&tcg_current_rr_cpu, cpu);
            current_cpu = cpu;

            /* QEMU_CLOCK_VIRTUAL is disabled while this vCPU has
             * SSTEP_NOTIMER set.
             */
            qemu_clock_enable(QEMU_CLOCK_VIRTUAL,
                              (cpu->singlestep_enabled & SSTEP_NOTIMER) == 0);

            if (cpu_can_run(cpu)) {
                int r;
                r = tcg_cpu_exec(cpu);
                if (r == EXCP_DEBUG) {
                    cpu_handle_guest_debug(cpu);
                    break;
                } else if (r == EXCP_ATOMIC) {
                    /* The atomic step runs without the iothread lock */
                    qemu_mutex_unlock_iothread();
                    cpu_exec_step_atomic(cpu);
                    qemu_mutex_lock_iothread();
                    break;
                }
            } else if (cpu->stop) {
                /* An unplugged vCPU is skipped before leaving the loop */
                if (cpu->unplug) {
                    cpu = CPU_NEXT(cpu);
                }
                break;
            }

            cpu = CPU_NEXT(cpu);
        } /* while (cpu && !cpu->exit_request).. */

        /* Does not need atomic_mb_set because a spurious wakeup is okay. */
        atomic_set(&tcg_current_rr_cpu, NULL);

        if (cpu && cpu->exit_request) {
            atomic_mb_set(&cpu->exit_request, 0);
        }

        handle_icount_deadline();

        /* 'cpu' is NULL here if the inner loop ran off the end of the
         * list; wait on the first vCPU in that case.
         */
        qemu_tcg_wait_io_event(cpu ? cpu : QTAILQ_FIRST(&cpus));
        deal_with_unplugged_cpus();
    }

    return NULL;
}
1382
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001383static void *qemu_hax_cpu_thread_fn(void *arg)
1384{
1385 CPUState *cpu = arg;
1386 int r;
1387 qemu_thread_get_self(cpu->thread);
1388 qemu_mutex_lock(&qemu_global_mutex);
1389
1390 cpu->thread_id = qemu_get_thread_id();
1391 cpu->created = true;
1392 cpu->halted = 0;
1393 current_cpu = cpu;
1394
1395 hax_init_vcpu(cpu);
1396 qemu_cond_signal(&qemu_cpu_cond);
1397
1398 while (1) {
1399 if (cpu_can_run(cpu)) {
1400 r = hax_smp_cpu_exec(cpu);
1401 if (r == EXCP_DEBUG) {
1402 cpu_handle_guest_debug(cpu);
1403 }
1404 }
1405
1406 while (cpu_thread_is_idle(cpu)) {
1407 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
1408 }
1409#ifdef _WIN32
1410 SleepEx(0, TRUE);
1411#endif
1412 qemu_wait_io_event_common(cpu);
1413 }
1414 return NULL;
1415}
1416
1417#ifdef _WIN32
1418static void CALLBACK dummy_apc_func(ULONG_PTR unused)
1419{
1420}
1421#endif
1422
Alex Bennée37257942017-02-23 18:29:14 +00001423/* Multi-threaded TCG
1424 *
1425 * In the multi-threaded case each vCPU has its own thread. The TLS
1426 * variable current_cpu can be used deep in the code to find the
1427 * current CPUState for a given thread.
1428 */
1429
1430static void *qemu_tcg_cpu_thread_fn(void *arg)
1431{
1432 CPUState *cpu = arg;
1433
1434 rcu_register_thread();
1435
1436 qemu_mutex_lock_iothread();
1437 qemu_thread_get_self(cpu->thread);
1438
1439 cpu->thread_id = qemu_get_thread_id();
1440 cpu->created = true;
1441 cpu->can_do_io = 1;
1442 current_cpu = cpu;
1443 qemu_cond_signal(&qemu_cpu_cond);
1444
1445 /* process any pending work */
1446 cpu->exit_request = 1;
1447
1448 while (1) {
1449 if (cpu_can_run(cpu)) {
1450 int r;
1451 r = tcg_cpu_exec(cpu);
1452 switch (r) {
1453 case EXCP_DEBUG:
1454 cpu_handle_guest_debug(cpu);
1455 break;
1456 case EXCP_HALTED:
1457 /* during start-up the vCPU is reset and the thread is
1458 * kicked several times. If we don't ensure we go back
1459 * to sleep in the halted state we won't cleanly
1460 * start-up when the vCPU is enabled.
1461 *
1462 * cpu->halted should ensure we sleep in wait_io_event
1463 */
1464 g_assert(cpu->halted);
1465 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001466 case EXCP_ATOMIC:
1467 qemu_mutex_unlock_iothread();
1468 cpu_exec_step_atomic(cpu);
1469 qemu_mutex_lock_iothread();
Alex Bennée37257942017-02-23 18:29:14 +00001470 default:
1471 /* Ignore everything else? */
1472 break;
1473 }
1474 }
1475
1476 handle_icount_deadline();
1477
1478 atomic_mb_set(&cpu->exit_request, 0);
1479 qemu_tcg_wait_io_event(cpu);
1480 }
1481
1482 return NULL;
1483}
1484
Andreas Färber2ff09a42012-05-03 00:23:30 +02001485static void qemu_cpu_kick_thread(CPUState *cpu)
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001486{
1487#ifndef _WIN32
1488 int err;
1489
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001490 if (cpu->thread_kicked) {
1491 return;
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001492 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001493 cpu->thread_kicked = true;
Andreas Färber814e6122012-05-02 17:00:37 +02001494 err = pthread_kill(cpu->thread->thread, SIG_IPI);
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001495 if (err) {
1496 fprintf(stderr, "qemu:%s: %s", __func__, strerror(err));
1497 exit(1);
1498 }
1499#else /* _WIN32 */
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001500 if (!qemu_cpu_is_self(cpu)) {
1501 if (!QueueUserAPC(dummy_apc_func, cpu->hThread, 0)) {
1502 fprintf(stderr, "%s: QueueUserAPC failed with error %lu\n",
1503 __func__, GetLastError());
1504 exit(1);
1505 }
1506 }
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001507#endif
1508}
1509
Andreas Färberc08d7422012-05-03 04:34:15 +02001510void qemu_cpu_kick(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001511{
Andreas Färberf5c121b2012-05-03 01:22:49 +02001512 qemu_cond_broadcast(cpu->halt_cond);
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001513 if (tcg_enabled()) {
Alex Bennée791158d2017-02-23 18:29:10 +00001514 cpu_exit(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001515 /* NOP unless doing single-thread RR */
Alex Bennée791158d2017-02-23 18:29:10 +00001516 qemu_cpu_kick_rr_cpu();
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001517 } else {
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001518 if (hax_enabled()) {
1519 /*
1520 * FIXME: race condition with the exit_request check in
1521 * hax_vcpu_hax_exec
1522 */
1523 cpu->exit_request = 1;
1524 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001525 qemu_cpu_kick_thread(cpu);
1526 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001527}
1528
Jan Kiszka46d62fa2011-02-01 22:15:59 +01001529void qemu_cpu_kick_self(void)
1530{
Andreas Färber4917cf42013-05-27 05:17:50 +02001531 assert(current_cpu);
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001532 qemu_cpu_kick_thread(current_cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001533}
1534
Andreas Färber60e82572012-05-02 22:23:49 +02001535bool qemu_cpu_is_self(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001536{
Andreas Färber814e6122012-05-02 17:00:37 +02001537 return qemu_thread_is_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001538}
1539
Paolo Bonzini79e2b9a2015-01-21 12:09:14 +01001540bool qemu_in_vcpu_thread(void)
Juan Quintelaaa723c22012-09-18 16:30:11 +02001541{
Andreas Färber4917cf42013-05-27 05:17:50 +02001542 return current_cpu && qemu_cpu_is_self(current_cpu);
Juan Quintelaaa723c22012-09-18 16:30:11 +02001543}
1544
/*
 * Per-thread flag maintained by qemu_mutex_lock_iothread() and
 * qemu_mutex_unlock_iothread().  Starts out false in every thread.
 */
static __thread bool iothread_locked;

/* Report the calling thread's iothread_locked flag. */
bool qemu_mutex_iothread_locked(void)
{
    return iothread_locked;
}
1551
Blue Swirl296af7c2010-03-29 19:23:50 +00001552void qemu_mutex_lock_iothread(void)
1553{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001554 g_assert(!qemu_mutex_iothread_locked());
1555 qemu_mutex_lock(&qemu_global_mutex);
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001556 iothread_locked = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001557}
1558
1559void qemu_mutex_unlock_iothread(void)
1560{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001561 g_assert(qemu_mutex_iothread_locked());
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001562 iothread_locked = false;
Blue Swirl296af7c2010-03-29 19:23:50 +00001563 qemu_mutex_unlock(&qemu_global_mutex);
1564}
1565
Alex Bennéee8faee02016-10-27 16:09:58 +01001566static bool all_vcpus_paused(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001567{
Andreas Färberbdc44642013-06-24 23:50:24 +02001568 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001569
Andreas Färberbdc44642013-06-24 23:50:24 +02001570 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001571 if (!cpu->stopped) {
Alex Bennéee8faee02016-10-27 16:09:58 +01001572 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001573 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001574 }
1575
Alex Bennéee8faee02016-10-27 16:09:58 +01001576 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001577}
1578
1579void pause_all_vcpus(void)
1580{
Andreas Färberbdc44642013-06-24 23:50:24 +02001581 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001582
Alex Bligh40daca52013-08-21 16:03:02 +01001583 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, false);
Andreas Färberbdc44642013-06-24 23:50:24 +02001584 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001585 cpu->stop = true;
1586 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001587 }
1588
Juan Quintelaaa723c22012-09-18 16:30:11 +02001589 if (qemu_in_vcpu_thread()) {
Jan Kiszkad798e972012-02-17 18:31:16 +01001590 cpu_stop_current();
Jan Kiszkad798e972012-02-17 18:31:16 +01001591 }
1592
Blue Swirl296af7c2010-03-29 19:23:50 +00001593 while (!all_vcpus_paused()) {
Paolo Bonzinibe7d6c52011-03-12 17:44:02 +01001594 qemu_cond_wait(&qemu_pause_cond, &qemu_global_mutex);
Andreas Färberbdc44642013-06-24 23:50:24 +02001595 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001596 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001597 }
1598 }
1599}
1600
Igor Mammedov29936832013-04-23 10:29:37 +02001601void cpu_resume(CPUState *cpu)
1602{
1603 cpu->stop = false;
1604 cpu->stopped = false;
1605 qemu_cpu_kick(cpu);
1606}
1607
Blue Swirl296af7c2010-03-29 19:23:50 +00001608void resume_all_vcpus(void)
1609{
Andreas Färberbdc44642013-06-24 23:50:24 +02001610 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001611
Alex Bligh40daca52013-08-21 16:03:02 +01001612 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, true);
Andreas Färberbdc44642013-06-24 23:50:24 +02001613 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001614 cpu_resume(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001615 }
1616}
1617
Gu Zheng4c055ab2016-05-12 09:18:13 +05301618void cpu_remove(CPUState *cpu)
1619{
1620 cpu->stop = true;
1621 cpu->unplug = true;
1622 qemu_cpu_kick(cpu);
1623}
1624
Bharata B Rao2c579042016-05-12 09:18:14 +05301625void cpu_remove_sync(CPUState *cpu)
1626{
1627 cpu_remove(cpu);
1628 while (cpu->created) {
1629 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1630 }
1631}
1632
/* Size of the temporary buffers in which vCPU thread names are built */
#define VCPU_THREAD_NAME_SIZE 16
1635
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001636static void qemu_tcg_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001637{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001638 char thread_name[VCPU_THREAD_NAME_SIZE];
Alex Bennée37257942017-02-23 18:29:14 +00001639 static QemuCond *single_tcg_halt_cond;
1640 static QemuThread *single_tcg_cpu_thread;
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001641
Alex Bennée37257942017-02-23 18:29:14 +00001642 if (qemu_tcg_mttcg_enabled() || !single_tcg_cpu_thread) {
Andreas Färber814e6122012-05-02 17:00:37 +02001643 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001644 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1645 qemu_cond_init(cpu->halt_cond);
Alex Bennée37257942017-02-23 18:29:14 +00001646
1647 if (qemu_tcg_mttcg_enabled()) {
1648 /* create a thread per vCPU with TCG (MTTCG) */
1649 parallel_cpus = true;
1650 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/TCG",
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001651 cpu->cpu_index);
Alex Bennée37257942017-02-23 18:29:14 +00001652
1653 qemu_thread_create(cpu->thread, thread_name, qemu_tcg_cpu_thread_fn,
1654 cpu, QEMU_THREAD_JOINABLE);
1655
1656 } else {
1657 /* share a single thread for all cpus with TCG */
1658 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "ALL CPUs/TCG");
1659 qemu_thread_create(cpu->thread, thread_name,
1660 qemu_tcg_rr_cpu_thread_fn,
1661 cpu, QEMU_THREAD_JOINABLE);
1662
1663 single_tcg_halt_cond = cpu->halt_cond;
1664 single_tcg_cpu_thread = cpu->thread;
1665 }
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001666#ifdef _WIN32
Andreas Färber814e6122012-05-02 17:00:37 +02001667 cpu->hThread = qemu_thread_get_handle(cpu->thread);
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001668#endif
Andreas Färber61a46212012-05-02 22:49:36 +02001669 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001670 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001671 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001672 } else {
Alex Bennée37257942017-02-23 18:29:14 +00001673 /* For non-MTTCG cases we share the thread */
1674 cpu->thread = single_tcg_cpu_thread;
1675 cpu->halt_cond = single_tcg_halt_cond;
Blue Swirl296af7c2010-03-29 19:23:50 +00001676 }
1677}
1678
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001679static void qemu_hax_start_vcpu(CPUState *cpu)
1680{
1681 char thread_name[VCPU_THREAD_NAME_SIZE];
1682
1683 cpu->thread = g_malloc0(sizeof(QemuThread));
1684 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1685 qemu_cond_init(cpu->halt_cond);
1686
1687 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/HAX",
1688 cpu->cpu_index);
1689 qemu_thread_create(cpu->thread, thread_name, qemu_hax_cpu_thread_fn,
1690 cpu, QEMU_THREAD_JOINABLE);
1691#ifdef _WIN32
1692 cpu->hThread = qemu_thread_get_handle(cpu->thread);
1693#endif
1694 while (!cpu->created) {
1695 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1696 }
1697}
1698
Andreas Färber48a106b2013-05-27 02:20:39 +02001699static void qemu_kvm_start_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001700{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001701 char thread_name[VCPU_THREAD_NAME_SIZE];
1702
Andreas Färber814e6122012-05-02 17:00:37 +02001703 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001704 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1705 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001706 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/KVM",
1707 cpu->cpu_index);
1708 qemu_thread_create(cpu->thread, thread_name, qemu_kvm_cpu_thread_fn,
1709 cpu, QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001710 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001711 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001712 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001713}
1714
Andreas Färber10a90212013-05-27 02:24:35 +02001715static void qemu_dummy_start_vcpu(CPUState *cpu)
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001716{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001717 char thread_name[VCPU_THREAD_NAME_SIZE];
1718
Andreas Färber814e6122012-05-02 17:00:37 +02001719 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001720 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1721 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001722 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/DUMMY",
1723 cpu->cpu_index);
1724 qemu_thread_create(cpu->thread, thread_name, qemu_dummy_cpu_thread_fn, cpu,
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001725 QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001726 while (!cpu->created) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001727 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1728 }
1729}
1730
Andreas Färberc643bed2013-05-27 03:23:24 +02001731void qemu_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001732{
Andreas Färberce3960e2012-12-17 03:27:07 +01001733 cpu->nr_cores = smp_cores;
1734 cpu->nr_threads = smp_threads;
Andreas Färberf324e762012-05-02 23:26:21 +02001735 cpu->stopped = true;
Peter Maydell56943e82016-01-21 14:15:04 +00001736
1737 if (!cpu->as) {
1738 /* If the target cpu hasn't set up any address spaces itself,
1739 * give it the default one.
1740 */
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001741 AddressSpace *as = address_space_init_shareable(cpu->memory,
1742 "cpu-memory");
Peter Maydell12ebc9a2016-01-21 14:15:04 +00001743 cpu->num_ases = 1;
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001744 cpu_address_space_init(cpu, as, 0);
Peter Maydell56943e82016-01-21 14:15:04 +00001745 }
1746
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001747 if (kvm_enabled()) {
Andreas Färber48a106b2013-05-27 02:20:39 +02001748 qemu_kvm_start_vcpu(cpu);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001749 } else if (hax_enabled()) {
1750 qemu_hax_start_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001751 } else if (tcg_enabled()) {
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001752 qemu_tcg_init_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001753 } else {
Andreas Färber10a90212013-05-27 02:24:35 +02001754 qemu_dummy_start_vcpu(cpu);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001755 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001756}
1757
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001758void cpu_stop_current(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001759{
Andreas Färber4917cf42013-05-27 05:17:50 +02001760 if (current_cpu) {
1761 current_cpu->stop = false;
1762 current_cpu->stopped = true;
1763 cpu_exit(current_cpu);
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001764 qemu_cond_broadcast(&qemu_pause_cond);
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001765 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001766}
1767
Kevin Wolf56983462013-07-05 13:49:54 +02001768int vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +00001769{
Juan Quintelaaa723c22012-09-18 16:30:11 +02001770 if (qemu_in_vcpu_thread()) {
Paolo Bonzini74892d22014-06-05 14:53:58 +02001771 qemu_system_vmstop_request_prepare();
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -03001772 qemu_system_vmstop_request(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001773 /*
1774 * FIXME: should not return to device code in case
1775 * vm_stop() has been requested.
1776 */
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001777 cpu_stop_current();
Kevin Wolf56983462013-07-05 13:49:54 +02001778 return 0;
Blue Swirl296af7c2010-03-29 19:23:50 +00001779 }
Kevin Wolf56983462013-07-05 13:49:54 +02001780
1781 return do_vm_stop(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001782}
1783
Claudio Imbrenda2d76e822017-02-14 18:07:47 +01001784/**
1785 * Prepare for (re)starting the VM.
1786 * Returns -1 if the vCPUs are not to be restarted (e.g. if they are already
1787 * running or in case of an error condition), 0 otherwise.
1788 */
1789int vm_prepare_start(void)
1790{
1791 RunState requested;
1792 int res = 0;
1793
1794 qemu_vmstop_requested(&requested);
1795 if (runstate_is_running() && requested == RUN_STATE__MAX) {
1796 return -1;
1797 }
1798
1799 /* Ensure that a STOP/RESUME pair of events is emitted if a
1800 * vmstop request was pending. The BLOCK_IO_ERROR event, for
1801 * example, according to documentation is always followed by
1802 * the STOP event.
1803 */
1804 if (runstate_is_running()) {
1805 qapi_event_send_stop(&error_abort);
1806 res = -1;
1807 } else {
1808 replay_enable_events();
1809 cpu_enable_ticks();
1810 runstate_set(RUN_STATE_RUNNING);
1811 vm_state_notify(1, RUN_STATE_RUNNING);
1812 }
1813
1814 /* We are sending this now, but the CPUs will be resumed shortly later */
1815 qapi_event_send_resume(&error_abort);
1816 return res;
1817}
1818
/* Resume all vCPUs when vm_prepare_start() returns 0. */
void vm_start(void)
{
    if (vm_prepare_start() == 0) {
        resume_all_vcpus();
    }
}
1825
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001826/* does a state transition even if the VM is already stopped,
1827 current state is forgotten forever */
Kevin Wolf56983462013-07-05 13:49:54 +02001828int vm_stop_force_state(RunState state)
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001829{
1830 if (runstate_is_running()) {
Kevin Wolf56983462013-07-05 13:49:54 +02001831 return vm_stop(state);
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001832 } else {
1833 runstate_set(state);
Wen Congyangb2780d32015-11-20 17:34:38 +08001834
1835 bdrv_drain_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +02001836 /* Make sure to return an error if the flush in a previous vm_stop()
1837 * failed. */
John Snow22af08e2016-09-22 21:45:51 -04001838 return bdrv_flush_all();
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001839 }
1840}
1841
Stefan Weil9a78eea2010-10-22 23:03:33 +02001842void list_cpus(FILE *f, fprintf_function cpu_fprintf, const char *optarg)
Blue Swirl262353c2010-05-04 19:55:35 +00001843{
1844 /* XXX: implement xxx_cpu_list for targets that still miss it */
Peter Maydelle916cbf2012-09-05 17:41:08 -03001845#if defined(cpu_list)
1846 cpu_list(f, cpu_fprintf);
Blue Swirl262353c2010-05-04 19:55:35 +00001847#endif
1848}
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001849
1850CpuInfoList *qmp_query_cpus(Error **errp)
1851{
1852 CpuInfoList *head = NULL, *cur_item = NULL;
Andreas Färber182735e2013-05-29 22:29:20 +02001853 CPUState *cpu;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001854
Andreas Färberbdc44642013-06-24 23:50:24 +02001855 CPU_FOREACH(cpu) {
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001856 CpuInfoList *info;
Andreas Färber182735e2013-05-29 22:29:20 +02001857#if defined(TARGET_I386)
1858 X86CPU *x86_cpu = X86_CPU(cpu);
1859 CPUX86State *env = &x86_cpu->env;
1860#elif defined(TARGET_PPC)
1861 PowerPCCPU *ppc_cpu = POWERPC_CPU(cpu);
1862 CPUPPCState *env = &ppc_cpu->env;
1863#elif defined(TARGET_SPARC)
1864 SPARCCPU *sparc_cpu = SPARC_CPU(cpu);
1865 CPUSPARCState *env = &sparc_cpu->env;
1866#elif defined(TARGET_MIPS)
1867 MIPSCPU *mips_cpu = MIPS_CPU(cpu);
1868 CPUMIPSState *env = &mips_cpu->env;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001869#elif defined(TARGET_TRICORE)
1870 TriCoreCPU *tricore_cpu = TRICORE_CPU(cpu);
1871 CPUTriCoreState *env = &tricore_cpu->env;
Andreas Färber182735e2013-05-29 22:29:20 +02001872#endif
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001873
Andreas Färbercb446ec2013-05-01 14:24:52 +02001874 cpu_synchronize_state(cpu);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001875
1876 info = g_malloc0(sizeof(*info));
1877 info->value = g_malloc0(sizeof(*info->value));
Andreas Färber55e5c282012-12-17 06:18:02 +01001878 info->value->CPU = cpu->cpu_index;
Andreas Färber182735e2013-05-29 22:29:20 +02001879 info->value->current = (cpu == first_cpu);
Andreas Färber259186a2013-01-17 18:51:17 +01001880 info->value->halted = cpu->halted;
Eduardo Habkost58f88d42015-05-08 16:04:22 -03001881 info->value->qom_path = object_get_canonical_path(OBJECT(cpu));
Andreas Färber9f09e182012-05-03 06:59:07 +02001882 info->value->thread_id = cpu->thread_id;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001883#if defined(TARGET_I386)
Eric Blake86f4b682015-11-18 01:52:59 -07001884 info->value->arch = CPU_INFO_ARCH_X86;
Eric Blake544a3732016-02-17 23:48:27 -07001885 info->value->u.x86.pc = env->eip + env->segs[R_CS].base;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001886#elif defined(TARGET_PPC)
Eric Blake86f4b682015-11-18 01:52:59 -07001887 info->value->arch = CPU_INFO_ARCH_PPC;
Eric Blake544a3732016-02-17 23:48:27 -07001888 info->value->u.ppc.nip = env->nip;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001889#elif defined(TARGET_SPARC)
Eric Blake86f4b682015-11-18 01:52:59 -07001890 info->value->arch = CPU_INFO_ARCH_SPARC;
Eric Blake544a3732016-02-17 23:48:27 -07001891 info->value->u.q_sparc.pc = env->pc;
1892 info->value->u.q_sparc.npc = env->npc;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001893#elif defined(TARGET_MIPS)
Eric Blake86f4b682015-11-18 01:52:59 -07001894 info->value->arch = CPU_INFO_ARCH_MIPS;
Eric Blake544a3732016-02-17 23:48:27 -07001895 info->value->u.q_mips.PC = env->active_tc.PC;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001896#elif defined(TARGET_TRICORE)
Eric Blake86f4b682015-11-18 01:52:59 -07001897 info->value->arch = CPU_INFO_ARCH_TRICORE;
Eric Blake544a3732016-02-17 23:48:27 -07001898 info->value->u.tricore.PC = env->PC;
Eric Blake86f4b682015-11-18 01:52:59 -07001899#else
1900 info->value->arch = CPU_INFO_ARCH_OTHER;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001901#endif
1902
1903 /* XXX: waiting for the qapi to support GSList */
1904 if (!cur_item) {
1905 head = cur_item = info;
1906 } else {
1907 cur_item->next = info;
1908 cur_item = info;
1909 }
1910 }
1911
1912 return head;
1913}
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001914
1915void qmp_memsave(int64_t addr, int64_t size, const char *filename,
1916 bool has_cpu, int64_t cpu_index, Error **errp)
1917{
1918 FILE *f;
1919 uint32_t l;
Andreas Färber55e5c282012-12-17 06:18:02 +01001920 CPUState *cpu;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001921 uint8_t buf[1024];
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001922 int64_t orig_addr = addr, orig_size = size;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001923
1924 if (!has_cpu) {
1925 cpu_index = 0;
1926 }
1927
Andreas Färber151d1322013-02-15 15:41:49 +01001928 cpu = qemu_get_cpu(cpu_index);
1929 if (cpu == NULL) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001930 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "cpu-index",
1931 "a CPU number");
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001932 return;
1933 }
1934
1935 f = fopen(filename, "wb");
1936 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001937 error_setg_file_open(errp, errno, filename);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001938 return;
1939 }
1940
1941 while (size != 0) {
1942 l = sizeof(buf);
1943 if (l > size)
1944 l = size;
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301945 if (cpu_memory_rw_debug(cpu, addr, buf, l, 0) != 0) {
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001946 error_setg(errp, "Invalid addr 0x%016" PRIx64 "/size %" PRId64
1947 " specified", orig_addr, orig_size);
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301948 goto exit;
1949 }
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001950 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001951 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001952 goto exit;
1953 }
1954 addr += l;
1955 size -= l;
1956 }
1957
1958exit:
1959 fclose(f);
1960}
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001961
1962void qmp_pmemsave(int64_t addr, int64_t size, const char *filename,
1963 Error **errp)
1964{
1965 FILE *f;
1966 uint32_t l;
1967 uint8_t buf[1024];
1968
1969 f = fopen(filename, "wb");
1970 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001971 error_setg_file_open(errp, errno, filename);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001972 return;
1973 }
1974
1975 while (size != 0) {
1976 l = sizeof(buf);
1977 if (l > size)
1978 l = size;
Stefan Weileb6282f2014-04-07 20:28:23 +02001979 cpu_physical_memory_read(addr, buf, l);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001980 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001981 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001982 goto exit;
1983 }
1984 addr += l;
1985 size -= l;
1986 }
1987
1988exit:
1989 fclose(f);
1990}
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001991
1992void qmp_inject_nmi(Error **errp)
1993{
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +10001994 nmi_monitor_handle(monitor_get_cpu_index(), errp);
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001995}
Sebastian Tanase27498be2014-07-25 11:56:33 +02001996
1997void dump_drift_info(FILE *f, fprintf_function cpu_fprintf)
1998{
1999 if (!use_icount) {
2000 return;
2001 }
2002
2003 cpu_fprintf(f, "Host - Guest clock %"PRIi64" ms\n",
2004 (cpu_get_clock() - cpu_get_icount())/SCALE_MS);
2005 if (icount_align_option) {
2006 cpu_fprintf(f, "Max guest delay %"PRIi64" ms\n", -max_delay/SCALE_MS);
2007 cpu_fprintf(f, "Max guest advance %"PRIi64" ms\n", max_advance/SCALE_MS);
2008 } else {
2009 cpu_fprintf(f, "Max guest delay NA\n");
2010 cpu_fprintf(f, "Max guest advance NA\n");
2011 }
2012}