/*
 * QEMU System Emulator
 *
 * Copyright (c) 2003-2008 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24
25/* Needed early for CONFIG_BSD etc. */
Peter Maydell7b31bbc2016-01-26 18:16:56 +000026#include "qemu/osdep.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010027#include "qemu-common.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000028#include "qemu/config-file.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010029#include "cpu.h"
Paolo Bonzini83c90892012-12-17 18:19:49 +010030#include "monitor/monitor.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020031#include "qapi/qmp/qerror.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010032#include "qemu/error-report.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010033#include "sysemu/sysemu.h"
Max Reitzda31d592016-03-16 19:54:32 +010034#include "sysemu/block-backend.h"
Paolo Bonzini022c62c2012-12-17 18:19:49 +010035#include "exec/gdbstub.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010036#include "sysemu/dma.h"
Vincent Palatinb3946622017-01-10 11:59:55 +010037#include "sysemu/hw_accel.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010038#include "sysemu/kvm.h"
Vincent Palatinb0cb0a62017-01-10 11:59:57 +010039#include "sysemu/hax.h"
Luiz Capitulinode0b36b2011-09-21 16:38:35 -030040#include "qmp-commands.h"
Paolo Bonzini63c91552016-03-15 13:18:37 +010041#include "exec/exec-all.h"
Blue Swirl296af7c2010-03-29 19:23:50 +000042
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010043#include "qemu/thread.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010044#include "sysemu/cpus.h"
45#include "sysemu/qtest.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010046#include "qemu/main-loop.h"
47#include "qemu/bitmap.h"
Liu Ping Fancb365642013-09-25 14:20:58 +080048#include "qemu/seqlock.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000049#include "tcg.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020050#include "qapi-event.h"
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +100051#include "hw/nmi.h"
Pavel Dovgalyuk8b427042015-09-17 19:24:05 +030052#include "sysemu/replay.h"
Igor Mammedovafed5a52017-05-10 13:29:55 +020053#include "hw/boards.h"
Jan Kiszka0ff0fc12011-06-23 10:15:55 +020054
Jan Kiszka6d9cb732011-02-01 22:15:58 +010055#ifdef CONFIG_LINUX
56
57#include <sys/prctl.h>
58
Marcelo Tosattic0532a72010-10-11 15:31:21 -030059#ifndef PR_MCE_KILL
60#define PR_MCE_KILL 33
61#endif
62
Jan Kiszka6d9cb732011-02-01 22:15:58 +010063#ifndef PR_MCE_KILL_SET
64#define PR_MCE_KILL_SET 1
65#endif
66
67#ifndef PR_MCE_KILL_EARLY
68#define PR_MCE_KILL_EARLY 1
69#endif
70
71#endif /* CONFIG_LINUX */
72
Sebastian Tanase27498be2014-07-25 11:56:33 +020073int64_t max_delay;
74int64_t max_advance;
Blue Swirl296af7c2010-03-29 19:23:50 +000075
Jason J. Herne2adcc852015-09-08 13:12:33 -040076/* vcpu throttling controls */
77static QEMUTimer *throttle_timer;
78static unsigned int throttle_percentage;
79
80#define CPU_THROTTLE_PCT_MIN 1
81#define CPU_THROTTLE_PCT_MAX 99
82#define CPU_THROTTLE_TIMESLICE_NS 10000000
83
Tiejun Chen321bc0b2013-08-02 09:43:09 +080084bool cpu_is_stopped(CPUState *cpu)
85{
86 return cpu->stopped || !runstate_is_running();
87}
88
Andreas Färbera98ae1d2013-05-26 23:21:08 +020089static bool cpu_thread_is_idle(CPUState *cpu)
Peter Maydellac873f12012-07-19 16:52:27 +010090{
Andreas Färberc64ca812012-05-03 02:11:45 +020091 if (cpu->stop || cpu->queued_work_first) {
Peter Maydellac873f12012-07-19 16:52:27 +010092 return false;
93 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +080094 if (cpu_is_stopped(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +010095 return true;
96 }
Andreas Färber8c2e1b02013-08-25 18:53:55 +020097 if (!cpu->halted || cpu_has_work(cpu) ||
Alexander Graf215e79c2013-04-24 22:24:12 +020098 kvm_halt_in_kernel()) {
Peter Maydellac873f12012-07-19 16:52:27 +010099 return false;
100 }
101 return true;
102}
103
104static bool all_cpu_threads_idle(void)
105{
Andreas Färber182735e2013-05-29 22:29:20 +0200106 CPUState *cpu;
Peter Maydellac873f12012-07-19 16:52:27 +0100107
Andreas Färberbdc44642013-06-24 23:50:24 +0200108 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200109 if (!cpu_thread_is_idle(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +0100110 return false;
111 }
112 }
113 return true;
114}
115
Blue Swirl296af7c2010-03-29 19:23:50 +0000116/***********************************************************/
Paolo Bonzini946fb272011-09-12 13:57:37 +0200117/* guest cycle counter */
118
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200119/* Protected by TimersState seqlock */
120
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200121static bool icount_sleep = true;
Sebastian Tanase71468392014-07-23 11:47:50 +0200122static int64_t vm_clock_warp_start = -1;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200123/* Conversion factor from emulated instructions to virtual clock ticks. */
124static int icount_time_shift;
125/* Arbitrarily pick 1MIPS as the minimum allowable speed. */
126#define MAX_ICOUNT_SHIFT 10
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200127
Paolo Bonzini946fb272011-09-12 13:57:37 +0200128static QEMUTimer *icount_rt_timer;
129static QEMUTimer *icount_vm_timer;
130static QEMUTimer *icount_warp_timer;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200131
132typedef struct TimersState {
Liu Ping Fancb365642013-09-25 14:20:58 +0800133 /* Protected by BQL. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200134 int64_t cpu_ticks_prev;
135 int64_t cpu_ticks_offset;
Liu Ping Fancb365642013-09-25 14:20:58 +0800136
137 /* cpu_clock_offset can be read out of BQL, so protect it with
138 * this lock.
139 */
140 QemuSeqLock vm_clock_seqlock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200141 int64_t cpu_clock_offset;
142 int32_t cpu_ticks_enabled;
143 int64_t dummy;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200144
145 /* Compensate for varying guest execution speed. */
146 int64_t qemu_icount_bias;
147 /* Only written by TCG thread */
148 int64_t qemu_icount;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200149} TimersState;
150
Liu Ping Fand9cd4002013-07-21 08:43:00 +0000151static TimersState timers_state;
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000152bool mttcg_enabled;
153
/*
 * We default to false if we know other options have been enabled
 * which are currently incompatible with MTTCG. Otherwise when each
 * guest (target) has been updated to support:
 *   - atomic instructions
 *   - memory ordering primitives (barriers)
 * they can set the appropriate CONFIG flags in ${target}-softmmu.mak
 *
 * Once a guest architecture has been converted to the new primitives
 * there are two remaining limitations to check.
 *
 * - The guest can't be oversized (e.g. 64 bit guest on 32 bit host)
 * - The host must have a stronger memory order than the guest
 *
 * It may be possible in future to support strong guests on weak hosts
 * but that will require tagging all load/stores in a guest with their
 * implicit memory order requirements which would likely slow things
 * down a lot.
 */
173
/*
 * Return true when every bit set in TCG_GUEST_DEFAULT_MO is also set in
 * TCG_TARGET_DEFAULT_MO. If either macro is not defined the answer is
 * conservatively false.
 */
static bool check_tcg_memory_orders_compatible(void)
{
#if defined(TCG_GUEST_DEFAULT_MO) && defined(TCG_TARGET_DEFAULT_MO)
    return (TCG_GUEST_DEFAULT_MO & ~TCG_TARGET_DEFAULT_MO) == 0;
#else
    return false;
#endif
}
182
183static bool default_mttcg_enabled(void)
184{
Alex Bennée83fd9622017-02-27 17:09:01 +0000185 if (use_icount || TCG_OVERSIZED_GUEST) {
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000186 return false;
187 } else {
188#ifdef TARGET_SUPPORTS_MTTCG
189 return check_tcg_memory_orders_compatible();
190#else
191 return false;
192#endif
193 }
194}
195
196void qemu_tcg_configure(QemuOpts *opts, Error **errp)
197{
198 const char *t = qemu_opt_get(opts, "thread");
199 if (t) {
200 if (strcmp(t, "multi") == 0) {
201 if (TCG_OVERSIZED_GUEST) {
202 error_setg(errp, "No MTTCG when guest word size > hosts");
Alex Bennée83fd9622017-02-27 17:09:01 +0000203 } else if (use_icount) {
204 error_setg(errp, "No MTTCG when icount is enabled");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000205 } else {
Nikunj A Dadhania86953502017-04-10 11:36:55 +0530206#ifndef TARGET_SUPPORTS_MTTCG
Alex Bennéec34c7622017-02-28 14:40:17 +0000207 error_report("Guest not yet converted to MTTCG - "
208 "you may get unexpected results");
209#endif
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000210 if (!check_tcg_memory_orders_compatible()) {
211 error_report("Guest expects a stronger memory ordering "
212 "than the host provides");
Pranith Kumar8cfef892017-03-25 16:19:23 -0400213 error_printf("This may cause strange/hard to debug errors\n");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000214 }
215 mttcg_enabled = true;
216 }
217 } else if (strcmp(t, "single") == 0) {
218 mttcg_enabled = false;
219 } else {
220 error_setg(errp, "Invalid 'thread' setting %s", t);
221 }
222 } else {
223 mttcg_enabled = default_mttcg_enabled();
224 }
225}
Paolo Bonzini946fb272011-09-12 13:57:37 +0200226
Alex Bennéee4cd9652017-03-31 16:09:42 +0100227/* The current number of executed instructions is based on what we
228 * originally budgeted minus the current state of the decrementing
229 * icount counters in extra/u16.low.
230 */
231static int64_t cpu_get_icount_executed(CPUState *cpu)
232{
233 return cpu->icount_budget - (cpu->icount_decr.u16.low + cpu->icount_extra);
234}
235
Alex Bennée512d3c82017-04-05 12:32:37 +0100236/*
237 * Update the global shared timer_state.qemu_icount to take into
238 * account executed instructions. This is done by the TCG vCPU
239 * thread so the main-loop can see time has moved forward.
240 */
241void cpu_update_icount(CPUState *cpu)
242{
243 int64_t executed = cpu_get_icount_executed(cpu);
244 cpu->icount_budget -= executed;
245
246#ifdef CONFIG_ATOMIC64
247 atomic_set__nocheck(&timers_state.qemu_icount,
248 atomic_read__nocheck(&timers_state.qemu_icount) +
249 executed);
250#else /* FIXME: we need 64bit atomics to do this safely */
251 timers_state.qemu_icount += executed;
252#endif
253}
254
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300255int64_t cpu_get_icount_raw(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200256{
Andreas Färber4917cf42013-05-27 05:17:50 +0200257 CPUState *cpu = current_cpu;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200258
Alex Bennée243c5f72017-03-30 18:49:22 +0100259 if (cpu && cpu->running) {
Paolo Bonzini414b15c2015-06-24 14:16:26 +0200260 if (!cpu->can_do_io) {
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300261 fprintf(stderr, "Bad icount read\n");
262 exit(1);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200263 }
Alex Bennéee4cd9652017-03-31 16:09:42 +0100264 /* Take into account what has run */
Alex Bennée1d059062017-04-05 10:53:47 +0100265 cpu_update_icount(cpu);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200266 }
Alex Bennée1d059062017-04-05 10:53:47 +0100267#ifdef CONFIG_ATOMIC64
268 return atomic_read__nocheck(&timers_state.qemu_icount);
269#else /* FIXME: we need 64bit atomics to do this safely */
270 return timers_state.qemu_icount;
271#endif
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300272}
273
274/* Return the virtual CPU time, based on the instruction counter. */
275static int64_t cpu_get_icount_locked(void)
276{
277 int64_t icount = cpu_get_icount_raw();
KONRAD Frederic3f031312014-08-01 01:37:15 +0200278 return timers_state.qemu_icount_bias + cpu_icount_to_ns(icount);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200279}
280
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200281int64_t cpu_get_icount(void)
282{
283 int64_t icount;
284 unsigned start;
285
286 do {
287 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
288 icount = cpu_get_icount_locked();
289 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
290
291 return icount;
292}
293
KONRAD Frederic3f031312014-08-01 01:37:15 +0200294int64_t cpu_icount_to_ns(int64_t icount)
295{
296 return icount << icount_time_shift;
297}
298
Cao jind90f3cc2016-07-29 19:05:38 +0800299/* return the time elapsed in VM between vm_start and vm_stop. Unless
300 * icount is active, cpu_get_ticks() uses units of the host CPU cycle
301 * counter.
302 *
303 * Caller must hold the BQL
304 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200305int64_t cpu_get_ticks(void)
306{
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100307 int64_t ticks;
308
Paolo Bonzini946fb272011-09-12 13:57:37 +0200309 if (use_icount) {
310 return cpu_get_icount();
311 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100312
313 ticks = timers_state.cpu_ticks_offset;
314 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400315 ticks += cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200316 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100317
318 if (timers_state.cpu_ticks_prev > ticks) {
319 /* Note: non increasing ticks may happen if the host uses
320 software suspend */
321 timers_state.cpu_ticks_offset += timers_state.cpu_ticks_prev - ticks;
322 ticks = timers_state.cpu_ticks_prev;
323 }
324
325 timers_state.cpu_ticks_prev = ticks;
326 return ticks;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200327}
328
Liu Ping Fancb365642013-09-25 14:20:58 +0800329static int64_t cpu_get_clock_locked(void)
330{
Cao jin1d45cea2016-07-29 19:05:37 +0800331 int64_t time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800332
Cao jin1d45cea2016-07-29 19:05:37 +0800333 time = timers_state.cpu_clock_offset;
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100334 if (timers_state.cpu_ticks_enabled) {
Cao jin1d45cea2016-07-29 19:05:37 +0800335 time += get_clock();
Liu Ping Fancb365642013-09-25 14:20:58 +0800336 }
337
Cao jin1d45cea2016-07-29 19:05:37 +0800338 return time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800339}
340
Cao jind90f3cc2016-07-29 19:05:38 +0800341/* Return the monotonic time elapsed in VM, i.e.,
Peter Maydell8212ff82016-09-15 10:24:22 +0100342 * the time between vm_start and vm_stop
343 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200344int64_t cpu_get_clock(void)
345{
346 int64_t ti;
Liu Ping Fancb365642013-09-25 14:20:58 +0800347 unsigned start;
348
349 do {
350 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
351 ti = cpu_get_clock_locked();
352 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
353
354 return ti;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200355}
356
Liu Ping Fancb365642013-09-25 14:20:58 +0800357/* enable cpu_get_ticks()
Cao jin3224e872016-07-08 18:31:37 +0800358 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800359 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200360void cpu_enable_ticks(void)
361{
Liu Ping Fancb365642013-09-25 14:20:58 +0800362 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400363 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200364 if (!timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400365 timers_state.cpu_ticks_offset -= cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200366 timers_state.cpu_clock_offset -= get_clock();
367 timers_state.cpu_ticks_enabled = 1;
368 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400369 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200370}
371
372/* disable cpu_get_ticks() : the clock is stopped. You must not call
Liu Ping Fancb365642013-09-25 14:20:58 +0800373 * cpu_get_ticks() after that.
Cao jin3224e872016-07-08 18:31:37 +0800374 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800375 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200376void cpu_disable_ticks(void)
377{
Liu Ping Fancb365642013-09-25 14:20:58 +0800378 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400379 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200380 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400381 timers_state.cpu_ticks_offset += cpu_get_host_ticks();
Liu Ping Fancb365642013-09-25 14:20:58 +0800382 timers_state.cpu_clock_offset = cpu_get_clock_locked();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200383 timers_state.cpu_ticks_enabled = 0;
384 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400385 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200386}
387
388/* Correlation between real and virtual time is always going to be
389 fairly approximate, so ignore small variation.
390 When the guest is idle real and virtual time will be aligned in
391 the IO wait loop. */
Rutuja Shah73bcb242016-03-21 21:32:30 +0530392#define ICOUNT_WOBBLE (NANOSECONDS_PER_SECOND / 10)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200393
394static void icount_adjust(void)
395{
396 int64_t cur_time;
397 int64_t cur_icount;
398 int64_t delta;
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200399
400 /* Protected by TimersState mutex. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200401 static int64_t last_delta;
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200402
Paolo Bonzini946fb272011-09-12 13:57:37 +0200403 /* If the VM is not running, then do nothing. */
404 if (!runstate_is_running()) {
405 return;
406 }
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200407
Emilio G. Cota03719e42016-06-08 14:55:21 -0400408 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200409 cur_time = cpu_get_clock_locked();
410 cur_icount = cpu_get_icount_locked();
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200411
Paolo Bonzini946fb272011-09-12 13:57:37 +0200412 delta = cur_icount - cur_time;
413 /* FIXME: This is a very crude algorithm, somewhat prone to oscillation. */
414 if (delta > 0
415 && last_delta + ICOUNT_WOBBLE < delta * 2
416 && icount_time_shift > 0) {
417 /* The guest is getting too far ahead. Slow time down. */
418 icount_time_shift--;
419 }
420 if (delta < 0
421 && last_delta - ICOUNT_WOBBLE > delta * 2
422 && icount_time_shift < MAX_ICOUNT_SHIFT) {
423 /* The guest is getting too far behind. Speed time up. */
424 icount_time_shift++;
425 }
426 last_delta = delta;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200427 timers_state.qemu_icount_bias = cur_icount
428 - (timers_state.qemu_icount << icount_time_shift);
Emilio G. Cota03719e42016-06-08 14:55:21 -0400429 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200430}
431
432static void icount_adjust_rt(void *opaque)
433{
Alex Bligh40daca52013-08-21 16:03:02 +0100434 timer_mod(icount_rt_timer,
Pavel Dovgalyuk1979b902015-01-12 15:00:43 +0300435 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200436 icount_adjust();
437}
438
439static void icount_adjust_vm(void *opaque)
440{
Alex Bligh40daca52013-08-21 16:03:02 +0100441 timer_mod(icount_vm_timer,
442 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530443 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200444 icount_adjust();
445}
446
447static int64_t qemu_icount_round(int64_t count)
448{
449 return (count + (1 << icount_time_shift) - 1) >> icount_time_shift;
450}
451
Pavel Dovgalyukefab87c2015-09-17 19:24:39 +0300452static void icount_warp_rt(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200453{
Alex Bennéeccffff42016-04-04 15:35:48 +0100454 unsigned seq;
455 int64_t warp_start;
456
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200457 /* The icount_warp_timer is rescheduled soon after vm_clock_warp_start
458 * changes from -1 to another value, so the race here is okay.
459 */
Alex Bennéeccffff42016-04-04 15:35:48 +0100460 do {
461 seq = seqlock_read_begin(&timers_state.vm_clock_seqlock);
462 warp_start = vm_clock_warp_start;
463 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, seq));
464
465 if (warp_start == -1) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200466 return;
467 }
468
Emilio G. Cota03719e42016-06-08 14:55:21 -0400469 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200470 if (runstate_is_running()) {
Pavel Dovgalyuk8eda2062015-09-17 19:24:28 +0300471 int64_t clock = REPLAY_CLOCK(REPLAY_CLOCK_VIRTUAL_RT,
472 cpu_get_clock_locked());
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200473 int64_t warp_delta;
474
475 warp_delta = clock - vm_clock_warp_start;
476 if (use_icount == 2) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200477 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100478 * In adaptive mode, do not let QEMU_CLOCK_VIRTUAL run too
Paolo Bonzini946fb272011-09-12 13:57:37 +0200479 * far ahead of real time.
480 */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200481 int64_t cur_icount = cpu_get_icount_locked();
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300482 int64_t delta = clock - cur_icount;
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200483 warp_delta = MIN(warp_delta, delta);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200484 }
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200485 timers_state.qemu_icount_bias += warp_delta;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200486 }
487 vm_clock_warp_start = -1;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400488 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200489
490 if (qemu_clock_expired(QEMU_CLOCK_VIRTUAL)) {
491 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
492 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200493}
494
/* Timer callback that simply accounts the pending warp. @opaque is unused. */
static void icount_timer_cb(void *opaque)
{
    /* No need for a checkpoint because the timer already synchronizes
     * with CHECKPOINT_CLOCK_VIRTUAL_RT.
     */
    icount_warp_rt();
}
502
Paolo Bonzini8156be52012-03-28 15:42:04 +0200503void qtest_clock_warp(int64_t dest)
504{
Alex Bligh40daca52013-08-21 16:03:02 +0100505 int64_t clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800506 AioContext *aio_context;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200507 assert(qtest_enabled());
Fam Zhengefef88b2015-01-19 17:51:43 +0800508 aio_context = qemu_get_aio_context();
Paolo Bonzini8156be52012-03-28 15:42:04 +0200509 while (clock < dest) {
Alex Bligh40daca52013-08-21 16:03:02 +0100510 int64_t deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Sergey Fedorovc9299e22014-06-10 13:10:28 +0400511 int64_t warp = qemu_soonest_timeout(dest - clock, deadline);
Fam Zhengefef88b2015-01-19 17:51:43 +0800512
Emilio G. Cota03719e42016-06-08 14:55:21 -0400513 seqlock_write_begin(&timers_state.vm_clock_seqlock);
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200514 timers_state.qemu_icount_bias += warp;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400515 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200516
Alex Bligh40daca52013-08-21 16:03:02 +0100517 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800518 timerlist_run_timers(aio_context->tlg.tl[QEMU_CLOCK_VIRTUAL]);
Alex Bligh40daca52013-08-21 16:03:02 +0100519 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200520 }
Alex Bligh40daca52013-08-21 16:03:02 +0100521 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200522}
523
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300524void qemu_start_warp_timer(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200525{
Paolo Bonzinice78d182013-10-07 17:30:02 +0200526 int64_t clock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200527 int64_t deadline;
528
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300529 if (!use_icount) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200530 return;
531 }
532
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300533 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
534 * do not fire, so computing the deadline does not make sense.
535 */
536 if (!runstate_is_running()) {
537 return;
538 }
539
540 /* warp clock deterministically in record/replay mode */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300541 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_START)) {
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300542 return;
543 }
544
Paolo Bonzinice78d182013-10-07 17:30:02 +0200545 if (!all_cpu_threads_idle()) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200546 return;
547 }
548
Paolo Bonzini8156be52012-03-28 15:42:04 +0200549 if (qtest_enabled()) {
550 /* When testing, qtest commands advance icount. */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300551 return;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200552 }
553
Alex Blighac70aaf2013-08-21 16:02:57 +0100554 /* We want to use the earliest deadline from ALL vm_clocks */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300555 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT);
Alex Bligh40daca52013-08-21 16:03:02 +0100556 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200557 if (deadline < 0) {
Victor CLEMENTd7a0f712015-05-29 17:14:06 +0200558 static bool notified;
559 if (!icount_sleep && !notified) {
560 error_report("WARNING: icount sleep disabled and no active timers");
561 notified = true;
562 }
Paolo Bonzinice78d182013-10-07 17:30:02 +0200563 return;
Alex Blighac70aaf2013-08-21 16:02:57 +0100564 }
565
Paolo Bonzini946fb272011-09-12 13:57:37 +0200566 if (deadline > 0) {
567 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100568 * Ensure QEMU_CLOCK_VIRTUAL proceeds even when the virtual CPU goes to
Paolo Bonzini946fb272011-09-12 13:57:37 +0200569 * sleep. Otherwise, the CPU might be waiting for a future timer
570 * interrupt to wake it up, but the interrupt never comes because
571 * the vCPU isn't running any insns and thus doesn't advance the
Alex Bligh40daca52013-08-21 16:03:02 +0100572 * QEMU_CLOCK_VIRTUAL.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200573 */
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200574 if (!icount_sleep) {
575 /*
576 * We never let VCPUs sleep in no sleep icount mode.
577 * If there is a pending QEMU_CLOCK_VIRTUAL timer we just advance
578 * to the next QEMU_CLOCK_VIRTUAL event and notify it.
579 * It is useful when we want a deterministic execution time,
580 * isolated from host latencies.
581 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400582 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200583 timers_state.qemu_icount_bias += deadline;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400584 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200585 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
586 } else {
587 /*
588 * We do stop VCPUs and only advance QEMU_CLOCK_VIRTUAL after some
589 * "real" time, (related to the time left until the next event) has
590 * passed. The QEMU_CLOCK_VIRTUAL_RT clock will do this.
591 * This avoids that the warps are visible externally; for example,
592 * you will not be sending network packets continuously instead of
593 * every 100ms.
594 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400595 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200596 if (vm_clock_warp_start == -1 || vm_clock_warp_start > clock) {
597 vm_clock_warp_start = clock;
598 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400599 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200600 timer_mod_anticipate(icount_warp_timer, clock + deadline);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200601 }
Alex Blighac70aaf2013-08-21 16:02:57 +0100602 } else if (deadline == 0) {
Alex Bligh40daca52013-08-21 16:03:02 +0100603 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200604 }
605}
606
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300607static void qemu_account_warp_timer(void)
608{
609 if (!use_icount || !icount_sleep) {
610 return;
611 }
612
613 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
614 * do not fire, so computing the deadline does not make sense.
615 */
616 if (!runstate_is_running()) {
617 return;
618 }
619
620 /* warp clock deterministically in record/replay mode */
621 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_ACCOUNT)) {
622 return;
623 }
624
625 timer_del(icount_warp_timer);
626 icount_warp_rt();
627}
628
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200629static bool icount_state_needed(void *opaque)
630{
631 return use_icount;
632}
633
634/*
635 * This is a subsection for icount migration.
636 */
637static const VMStateDescription icount_vmstate_timers = {
638 .name = "timer/icount",
639 .version_id = 1,
640 .minimum_version_id = 1,
Juan Quintela5cd8cad2014-09-23 14:09:54 +0200641 .needed = icount_state_needed,
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200642 .fields = (VMStateField[]) {
643 VMSTATE_INT64(qemu_icount_bias, TimersState),
644 VMSTATE_INT64(qemu_icount, TimersState),
645 VMSTATE_END_OF_LIST()
646 }
647};
648
Paolo Bonzini946fb272011-09-12 13:57:37 +0200649static const VMStateDescription vmstate_timers = {
650 .name = "timer",
651 .version_id = 2,
652 .minimum_version_id = 1,
Juan Quintela35d08452014-04-16 16:01:33 +0200653 .fields = (VMStateField[]) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200654 VMSTATE_INT64(cpu_ticks_offset, TimersState),
655 VMSTATE_INT64(dummy, TimersState),
656 VMSTATE_INT64_V(cpu_clock_offset, TimersState, 2),
657 VMSTATE_END_OF_LIST()
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200658 },
Juan Quintela5cd8cad2014-09-23 14:09:54 +0200659 .subsections = (const VMStateDescription*[]) {
660 &icount_vmstate_timers,
661 NULL
Paolo Bonzini946fb272011-09-12 13:57:37 +0200662 }
663};
664
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100665static void cpu_throttle_thread(CPUState *cpu, run_on_cpu_data opaque)
Jason J. Herne2adcc852015-09-08 13:12:33 -0400666{
Jason J. Herne2adcc852015-09-08 13:12:33 -0400667 double pct;
668 double throttle_ratio;
669 long sleeptime_ns;
670
671 if (!cpu_throttle_get_percentage()) {
672 return;
673 }
674
675 pct = (double)cpu_throttle_get_percentage()/100;
676 throttle_ratio = pct / (1 - pct);
677 sleeptime_ns = (long)(throttle_ratio * CPU_THROTTLE_TIMESLICE_NS);
678
679 qemu_mutex_unlock_iothread();
680 atomic_set(&cpu->throttle_thread_scheduled, 0);
681 g_usleep(sleeptime_ns / 1000); /* Convert ns to us for usleep call */
682 qemu_mutex_lock_iothread();
683}
684
685static void cpu_throttle_timer_tick(void *opaque)
686{
687 CPUState *cpu;
688 double pct;
689
690 /* Stop the timer if needed */
691 if (!cpu_throttle_get_percentage()) {
692 return;
693 }
694 CPU_FOREACH(cpu) {
695 if (!atomic_xchg(&cpu->throttle_thread_scheduled, 1)) {
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100696 async_run_on_cpu(cpu, cpu_throttle_thread,
697 RUN_ON_CPU_NULL);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400698 }
699 }
700
701 pct = (double)cpu_throttle_get_percentage()/100;
702 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
703 CPU_THROTTLE_TIMESLICE_NS / (1-pct));
704}
705
706void cpu_throttle_set(int new_throttle_pct)
707{
708 /* Ensure throttle percentage is within valid range */
709 new_throttle_pct = MIN(new_throttle_pct, CPU_THROTTLE_PCT_MAX);
710 new_throttle_pct = MAX(new_throttle_pct, CPU_THROTTLE_PCT_MIN);
711
712 atomic_set(&throttle_percentage, new_throttle_pct);
713
714 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
715 CPU_THROTTLE_TIMESLICE_NS);
716}
717
718void cpu_throttle_stop(void)
719{
720 atomic_set(&throttle_percentage, 0);
721}
722
723bool cpu_throttle_active(void)
724{
725 return (cpu_throttle_get_percentage() != 0);
726}
727
728int cpu_throttle_get_percentage(void)
729{
730 return atomic_read(&throttle_percentage);
731}
732
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400733void cpu_ticks_init(void)
734{
Emilio G. Cotaccdb3c12016-06-08 14:55:20 -0400735 seqlock_init(&timers_state.vm_clock_seqlock);
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400736 vmstate_register(NULL, 0, &vmstate_timers, &timers_state);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400737 throttle_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
738 cpu_throttle_timer_tick, NULL);
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400739}
740
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200741void configure_icount(QemuOpts *opts, Error **errp)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200742{
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200743 const char *option;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200744 char *rem_str = NULL;
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200745
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200746 option = qemu_opt_get(opts, "shift");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200747 if (!option) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200748 if (qemu_opt_get(opts, "align") != NULL) {
749 error_setg(errp, "Please specify shift option when using align");
750 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200751 return;
752 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200753
754 icount_sleep = qemu_opt_get_bool(opts, "sleep", true);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200755 if (icount_sleep) {
756 icount_warp_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300757 icount_timer_cb, NULL);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200758 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200759
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200760 icount_align_option = qemu_opt_get_bool(opts, "align", false);
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200761
762 if (icount_align_option && !icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500763 error_setg(errp, "align=on and sleep=off are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200764 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200765 if (strcmp(option, "auto") != 0) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200766 errno = 0;
767 icount_time_shift = strtol(option, &rem_str, 0);
768 if (errno != 0 || *rem_str != '\0' || !strlen(option)) {
769 error_setg(errp, "icount: Invalid shift value");
770 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200771 use_icount = 1;
772 return;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200773 } else if (icount_align_option) {
774 error_setg(errp, "shift=auto and align=on are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200775 } else if (!icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500776 error_setg(errp, "shift=auto and sleep=off are incompatible");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200777 }
778
779 use_icount = 2;
780
781 /* 125MIPS seems a reasonable initial guess at the guest speed.
782 It will be corrected fairly quickly anyway. */
783 icount_time_shift = 3;
784
785 /* Have both realtime and virtual time triggers for speed adjustment.
786 The realtime trigger catches emulated time passing too slowly,
787 the virtual time trigger catches emulated time passing too fast.
788 Realtime triggers occur even when idle, so use them less frequently
789 than VM triggers. */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300790 icount_rt_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL_RT,
791 icount_adjust_rt, NULL);
Alex Bligh40daca52013-08-21 16:03:02 +0100792 timer_mod(icount_rt_timer,
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300793 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Alex Bligh40daca52013-08-21 16:03:02 +0100794 icount_vm_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
795 icount_adjust_vm, NULL);
796 timer_mod(icount_vm_timer,
797 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530798 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200799}
800
801/***********************************************************/
Alex Bennée65467062017-02-23 18:29:09 +0000802/* TCG vCPU kick timer
803 *
804 * The kick timer is responsible for moving single threaded vCPU
805 * emulation on to the next vCPU. If more than one vCPU is running a
 * timer event will force a cpu->exit so the next vCPU can get
807 * scheduled.
808 *
809 * The timer is removed if all vCPUs are idle and restarted again once
810 * idleness is complete.
811 */
812
813static QEMUTimer *tcg_kick_vcpu_timer;
Alex Bennée791158d2017-02-23 18:29:10 +0000814static CPUState *tcg_current_rr_cpu;
Alex Bennée65467062017-02-23 18:29:09 +0000815
816#define TCG_KICK_PERIOD (NANOSECONDS_PER_SECOND / 10)
817
818static inline int64_t qemu_tcg_next_kick(void)
819{
820 return qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + TCG_KICK_PERIOD;
821}
822
Alex Bennée791158d2017-02-23 18:29:10 +0000823/* Kick the currently round-robin scheduled vCPU */
824static void qemu_cpu_kick_rr_cpu(void)
825{
826 CPUState *cpu;
Alex Bennée791158d2017-02-23 18:29:10 +0000827 do {
828 cpu = atomic_mb_read(&tcg_current_rr_cpu);
829 if (cpu) {
830 cpu_exit(cpu);
831 }
832 } while (cpu != atomic_mb_read(&tcg_current_rr_cpu));
833}
834
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100835static void do_nothing(CPUState *cpu, run_on_cpu_data unused)
836{
837}
838
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100839void qemu_timer_notify_cb(void *opaque, QEMUClockType type)
840{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100841 if (!use_icount || type != QEMU_CLOCK_VIRTUAL) {
842 qemu_notify_event();
843 return;
844 }
845
846 if (!qemu_in_vcpu_thread() && first_cpu) {
847 /* qemu_cpu_kick is not enough to kick a halted CPU out of
848 * qemu_tcg_wait_io_event. async_run_on_cpu, instead,
849 * causes cpu_thread_is_idle to return false. This way,
850 * handle_icount_deadline can run.
851 */
852 async_run_on_cpu(first_cpu, do_nothing, RUN_ON_CPU_NULL);
853 }
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100854}
855
Alex Bennée65467062017-02-23 18:29:09 +0000856static void kick_tcg_thread(void *opaque)
857{
858 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
Alex Bennée791158d2017-02-23 18:29:10 +0000859 qemu_cpu_kick_rr_cpu();
Alex Bennée65467062017-02-23 18:29:09 +0000860}
861
862static void start_tcg_kick_timer(void)
863{
Alex Bennée37257942017-02-23 18:29:14 +0000864 if (!mttcg_enabled && !tcg_kick_vcpu_timer && CPU_NEXT(first_cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +0000865 tcg_kick_vcpu_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
866 kick_tcg_thread, NULL);
867 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
868 }
869}
870
871static void stop_tcg_kick_timer(void)
872{
873 if (tcg_kick_vcpu_timer) {
874 timer_del(tcg_kick_vcpu_timer);
875 tcg_kick_vcpu_timer = NULL;
876 }
877}
878
Alex Bennée65467062017-02-23 18:29:09 +0000879/***********************************************************/
Blue Swirl296af7c2010-03-29 19:23:50 +0000880void hw_error(const char *fmt, ...)
881{
882 va_list ap;
Andreas Färber55e5c282012-12-17 06:18:02 +0100883 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000884
885 va_start(ap, fmt);
886 fprintf(stderr, "qemu: hardware error: ");
887 vfprintf(stderr, fmt, ap);
888 fprintf(stderr, "\n");
Andreas Färberbdc44642013-06-24 23:50:24 +0200889 CPU_FOREACH(cpu) {
Andreas Färber55e5c282012-12-17 06:18:02 +0100890 fprintf(stderr, "CPU #%d:\n", cpu->cpu_index);
Andreas Färber878096e2013-05-27 01:33:50 +0200891 cpu_dump_state(cpu, stderr, fprintf, CPU_DUMP_FPU);
Blue Swirl296af7c2010-03-29 19:23:50 +0000892 }
893 va_end(ap);
894 abort();
895}
896
897void cpu_synchronize_all_states(void)
898{
Andreas Färber182735e2013-05-29 22:29:20 +0200899 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000900
Andreas Färberbdc44642013-06-24 23:50:24 +0200901 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200902 cpu_synchronize_state(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000903 }
904}
905
906void cpu_synchronize_all_post_reset(void)
907{
Andreas Färber182735e2013-05-29 22:29:20 +0200908 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000909
Andreas Färberbdc44642013-06-24 23:50:24 +0200910 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200911 cpu_synchronize_post_reset(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000912 }
913}
914
915void cpu_synchronize_all_post_init(void)
916{
Andreas Färber182735e2013-05-29 22:29:20 +0200917 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000918
Andreas Färberbdc44642013-06-24 23:50:24 +0200919 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200920 cpu_synchronize_post_init(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000921 }
922}
923
Kevin Wolf56983462013-07-05 13:49:54 +0200924static int do_vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +0000925{
Kevin Wolf56983462013-07-05 13:49:54 +0200926 int ret = 0;
927
Luiz Capitulino13548692011-07-29 15:36:43 -0300928 if (runstate_is_running()) {
Blue Swirl296af7c2010-03-29 19:23:50 +0000929 cpu_disable_ticks();
Blue Swirl296af7c2010-03-29 19:23:50 +0000930 pause_all_vcpus();
Luiz Capitulinof5bbfba2011-07-29 15:04:45 -0300931 runstate_set(state);
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -0300932 vm_state_notify(0, state);
Wenchao Xiaa4e15de2014-06-18 08:43:36 +0200933 qapi_event_send_stop(&error_abort);
Blue Swirl296af7c2010-03-29 19:23:50 +0000934 }
Kevin Wolf56983462013-07-05 13:49:54 +0200935
Kevin Wolf594a45c2013-07-18 14:52:19 +0200936 bdrv_drain_all();
Pavel Dovgalyuk6d0ceb82016-09-26 11:08:16 +0300937 replay_disable_events();
John Snow22af08e2016-09-22 21:45:51 -0400938 ret = bdrv_flush_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +0200939
Kevin Wolf56983462013-07-05 13:49:54 +0200940 return ret;
Blue Swirl296af7c2010-03-29 19:23:50 +0000941}
942
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200943static bool cpu_can_run(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +0000944{
Andreas Färber4fdeee72012-05-02 23:10:09 +0200945 if (cpu->stop) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200946 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100947 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +0800948 if (cpu_is_stopped(cpu)) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200949 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100950 }
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200951 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +0000952}
953
Andreas Färber91325042013-05-27 02:07:49 +0200954static void cpu_handle_guest_debug(CPUState *cpu)
Jan Kiszka3c638d02010-06-25 16:56:56 +0200955{
Andreas Färber64f6b342013-05-27 02:06:09 +0200956 gdb_set_stop_cpu(cpu);
Jan Kiszka8cf71712011-02-07 12:19:16 +0100957 qemu_system_debug_request();
Andreas Färberf324e762012-05-02 23:26:21 +0200958 cpu->stopped = true;
Jan Kiszka3c638d02010-06-25 16:56:56 +0200959}
960
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100961#ifdef CONFIG_LINUX
962static void sigbus_reraise(void)
963{
964 sigset_t set;
965 struct sigaction action;
966
967 memset(&action, 0, sizeof(action));
968 action.sa_handler = SIG_DFL;
969 if (!sigaction(SIGBUS, &action, NULL)) {
970 raise(SIGBUS);
971 sigemptyset(&set);
972 sigaddset(&set, SIGBUS);
Peter Maydella2d17612016-05-16 18:33:59 +0100973 pthread_sigmask(SIG_UNBLOCK, &set, NULL);
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100974 }
975 perror("Failed to re-raise SIGBUS!\n");
976 abort();
977}
978
Paolo Bonzinid98d4072017-02-08 13:22:12 +0100979static void sigbus_handler(int n, siginfo_t *siginfo, void *ctx)
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100980{
Paolo Bonzinia16fc072017-02-09 09:50:02 +0100981 if (siginfo->si_code != BUS_MCEERR_AO && siginfo->si_code != BUS_MCEERR_AR) {
982 sigbus_reraise();
983 }
984
Paolo Bonzini2ae41db2017-02-08 12:48:54 +0100985 if (current_cpu) {
986 /* Called asynchronously in VCPU thread. */
987 if (kvm_on_sigbus_vcpu(current_cpu, siginfo->si_code, siginfo->si_addr)) {
988 sigbus_reraise();
989 }
990 } else {
991 /* Called synchronously (via signalfd) in main thread. */
992 if (kvm_on_sigbus(siginfo->si_code, siginfo->si_addr)) {
993 sigbus_reraise();
994 }
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100995 }
996}
997
998static void qemu_init_sigbus(void)
999{
1000 struct sigaction action;
1001
1002 memset(&action, 0, sizeof(action));
1003 action.sa_flags = SA_SIGINFO;
Paolo Bonzinid98d4072017-02-08 13:22:12 +01001004 action.sa_sigaction = sigbus_handler;
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001005 sigaction(SIGBUS, &action, NULL);
1006
1007 prctl(PR_MCE_KILL, PR_MCE_KILL_SET, PR_MCE_KILL_EARLY, 0, 0);
1008}
Paolo Bonzinia16fc072017-02-09 09:50:02 +01001009#else /* !CONFIG_LINUX */
/* Stub used when CONFIG_LINUX is not defined: no SIGBUS setup is done. */
static void qemu_init_sigbus(void)
{
    /* nothing to do */
}
Paolo Bonzinia16fc072017-02-09 09:50:02 +01001013#endif /* !CONFIG_LINUX */
Blue Swirl296af7c2010-03-29 19:23:50 +00001014
Stefan Weilb2532d82012-09-27 07:41:42 +02001015static QemuMutex qemu_global_mutex;
Blue Swirl296af7c2010-03-29 19:23:50 +00001016
1017static QemuThread io_thread;
1018
Blue Swirl296af7c2010-03-29 19:23:50 +00001019/* cpu creation */
1020static QemuCond qemu_cpu_cond;
1021/* system init */
Blue Swirl296af7c2010-03-29 19:23:50 +00001022static QemuCond qemu_pause_cond;
1023
Paolo Bonzinid3b12f52011-09-13 10:30:52 +02001024void qemu_init_cpu_loop(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001025{
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001026 qemu_init_sigbus();
Anthony Liguoried945922011-02-08 18:18:18 +01001027 qemu_cond_init(&qemu_cpu_cond);
Anthony Liguoried945922011-02-08 18:18:18 +01001028 qemu_cond_init(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001029 qemu_mutex_init(&qemu_global_mutex);
Blue Swirl296af7c2010-03-29 19:23:50 +00001030
Jan Kiszkab7680cb2011-03-12 17:43:51 +01001031 qemu_thread_get_self(&io_thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001032}
1033
Paolo Bonzini14e6fe12016-10-31 10:36:08 +01001034void run_on_cpu(CPUState *cpu, run_on_cpu_func func, run_on_cpu_data data)
Marcelo Tosattie82bcec2010-05-04 09:45:22 -03001035{
Sergey Fedorovd148d902016-08-29 09:51:00 +02001036 do_run_on_cpu(cpu, func, data, &qemu_global_mutex);
Chegu Vinod3c022702013-06-24 03:49:41 -06001037}
1038
Gu Zheng4c055ab2016-05-12 09:18:13 +05301039static void qemu_kvm_destroy_vcpu(CPUState *cpu)
1040{
1041 if (kvm_destroy_vcpu(cpu) < 0) {
1042 error_report("kvm_destroy_vcpu failed");
1043 exit(EXIT_FAILURE);
1044 }
1045}
1046
1047static void qemu_tcg_destroy_vcpu(CPUState *cpu)
1048{
1049}
1050
Andreas Färber509a0d72012-05-03 02:18:09 +02001051static void qemu_wait_io_event_common(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001052{
Alex Bennée37257942017-02-23 18:29:14 +00001053 atomic_mb_set(&cpu->thread_kicked, false);
Andreas Färber4fdeee72012-05-02 23:10:09 +02001054 if (cpu->stop) {
1055 cpu->stop = false;
Andreas Färberf324e762012-05-02 23:26:21 +02001056 cpu->stopped = true;
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001057 qemu_cond_broadcast(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001058 }
Sergey Fedorova5403c62016-08-02 18:27:36 +01001059 process_queued_cpu_work(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001060}
1061
1062static bool qemu_tcg_should_sleep(CPUState *cpu)
1063{
1064 if (mttcg_enabled) {
1065 return cpu_thread_is_idle(cpu);
1066 } else {
1067 return all_cpu_threads_idle();
1068 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001069}
1070
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001071static void qemu_tcg_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001072{
Alex Bennée37257942017-02-23 18:29:14 +00001073 while (qemu_tcg_should_sleep(cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +00001074 stop_tcg_kick_timer();
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001075 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001076 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001077
Alex Bennée65467062017-02-23 18:29:09 +00001078 start_tcg_kick_timer();
1079
Alex Bennée37257942017-02-23 18:29:14 +00001080 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001081}
1082
Andreas Färberfd529e82013-05-26 23:24:55 +02001083static void qemu_kvm_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001084{
Andreas Färbera98ae1d2013-05-26 23:21:08 +02001085 while (cpu_thread_is_idle(cpu)) {
Andreas Färberf5c121b2012-05-03 01:22:49 +02001086 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001087 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001088
Andreas Färber509a0d72012-05-03 02:18:09 +02001089 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001090}
1091
Jan Kiszka7e97cd82011-02-07 12:19:12 +01001092static void *qemu_kvm_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001093{
Andreas Färber48a106b2013-05-27 02:20:39 +02001094 CPUState *cpu = arg;
Jan Kiszka84b49152011-02-01 22:15:50 +01001095 int r;
Blue Swirl296af7c2010-03-29 19:23:50 +00001096
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001097 rcu_register_thread();
1098
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001099 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001100 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001101 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001102 cpu->can_do_io = 1;
Andreas Färber4917cf42013-05-27 05:17:50 +02001103 current_cpu = cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001104
Andreas Färber504134d2012-12-17 06:38:45 +01001105 r = kvm_init_vcpu(cpu);
Jan Kiszka84b49152011-02-01 22:15:50 +01001106 if (r < 0) {
1107 fprintf(stderr, "kvm_init_vcpu failed: %s\n", strerror(-r));
1108 exit(1);
1109 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001110
Paolo Bonzini18268b62017-02-09 09:41:14 +01001111 kvm_init_cpu_signals(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001112
1113 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001114 cpu->created = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001115 qemu_cond_signal(&qemu_cpu_cond);
1116
Gu Zheng4c055ab2016-05-12 09:18:13 +05301117 do {
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001118 if (cpu_can_run(cpu)) {
Andreas Färber1458c362013-05-26 23:46:55 +02001119 r = kvm_cpu_exec(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001120 if (r == EXCP_DEBUG) {
Andreas Färber91325042013-05-27 02:07:49 +02001121 cpu_handle_guest_debug(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001122 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001123 }
Andreas Färberfd529e82013-05-26 23:24:55 +02001124 qemu_kvm_wait_io_event(cpu);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301125 } while (!cpu->unplug || cpu_can_run(cpu));
Blue Swirl296af7c2010-03-29 19:23:50 +00001126
Gu Zheng4c055ab2016-05-12 09:18:13 +05301127 qemu_kvm_destroy_vcpu(cpu);
Bharata B Rao2c579042016-05-12 09:18:14 +05301128 cpu->created = false;
1129 qemu_cond_signal(&qemu_cpu_cond);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301130 qemu_mutex_unlock_iothread();
Blue Swirl296af7c2010-03-29 19:23:50 +00001131 return NULL;
1132}
1133
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001134static void *qemu_dummy_cpu_thread_fn(void *arg)
1135{
1136#ifdef _WIN32
1137 fprintf(stderr, "qtest is not supported under Windows\n");
1138 exit(1);
1139#else
Andreas Färber10a90212013-05-27 02:24:35 +02001140 CPUState *cpu = arg;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001141 sigset_t waitset;
1142 int r;
1143
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001144 rcu_register_thread();
1145
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001146 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001147 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001148 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001149 cpu->can_do_io = 1;
Alex Bennée37257942017-02-23 18:29:14 +00001150 current_cpu = cpu;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001151
1152 sigemptyset(&waitset);
1153 sigaddset(&waitset, SIG_IPI);
1154
1155 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001156 cpu->created = true;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001157 qemu_cond_signal(&qemu_cpu_cond);
1158
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001159 while (1) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001160 qemu_mutex_unlock_iothread();
1161 do {
1162 int sig;
1163 r = sigwait(&waitset, &sig);
1164 } while (r == -1 && (errno == EAGAIN || errno == EINTR));
1165 if (r == -1) {
1166 perror("sigwait");
1167 exit(1);
1168 }
1169 qemu_mutex_lock_iothread();
Andreas Färber509a0d72012-05-03 02:18:09 +02001170 qemu_wait_io_event_common(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001171 }
1172
1173 return NULL;
1174#endif
1175}
1176
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001177static int64_t tcg_get_icount_limit(void)
1178{
1179 int64_t deadline;
1180
1181 if (replay_mode != REPLAY_MODE_PLAY) {
1182 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1183
1184 /* Maintain prior (possibly buggy) behaviour where if no deadline
1185 * was set (as there is no QEMU_CLOCK_VIRTUAL timer) or it is more than
1186 * INT32_MAX nanoseconds ahead, we still use INT32_MAX
1187 * nanoseconds.
1188 */
1189 if ((deadline < 0) || (deadline > INT32_MAX)) {
1190 deadline = INT32_MAX;
1191 }
1192
1193 return qemu_icount_round(deadline);
1194 } else {
1195 return replay_get_instructions();
1196 }
1197}
1198
Alex Bennée12e97002016-10-27 16:10:14 +01001199static void handle_icount_deadline(void)
1200{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001201 assert(qemu_in_vcpu_thread());
Alex Bennée12e97002016-10-27 16:10:14 +01001202 if (use_icount) {
1203 int64_t deadline =
1204 qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1205
1206 if (deadline == 0) {
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001207 /* Wake up other AioContexts. */
Alex Bennée12e97002016-10-27 16:10:14 +01001208 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001209 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Alex Bennée12e97002016-10-27 16:10:14 +01001210 }
1211 }
1212}
1213
Alex Bennée05248382017-03-29 16:46:59 +01001214static void prepare_icount_for_run(CPUState *cpu)
1215{
1216 if (use_icount) {
Alex Bennéeeda5f7c2017-04-05 12:35:48 +01001217 int insns_left;
Alex Bennée05248382017-03-29 16:46:59 +01001218
1219 /* These should always be cleared by process_icount_data after
1220 * each vCPU execution. However u16.high can be raised
1221 * asynchronously by cpu_exit/cpu_interrupt/tcg_handle_interrupt
1222 */
1223 g_assert(cpu->icount_decr.u16.low == 0);
1224 g_assert(cpu->icount_extra == 0);
1225
Alex Bennéeeda5f7c2017-04-05 12:35:48 +01001226 cpu->icount_budget = tcg_get_icount_limit();
1227 insns_left = MIN(0xffff, cpu->icount_budget);
1228 cpu->icount_decr.u16.low = insns_left;
1229 cpu->icount_extra = cpu->icount_budget - insns_left;
Alex Bennée05248382017-03-29 16:46:59 +01001230 }
1231}
1232
1233static void process_icount_data(CPUState *cpu)
1234{
1235 if (use_icount) {
Alex Bennéee4cd9652017-03-31 16:09:42 +01001236 /* Account for executed instructions */
Alex Bennée512d3c82017-04-05 12:32:37 +01001237 cpu_update_icount(cpu);
Alex Bennée05248382017-03-29 16:46:59 +01001238
1239 /* Reset the counters */
1240 cpu->icount_decr.u16.low = 0;
1241 cpu->icount_extra = 0;
Alex Bennéee4cd9652017-03-31 16:09:42 +01001242 cpu->icount_budget = 0;
1243
Alex Bennée05248382017-03-29 16:46:59 +01001244 replay_account_executed_instructions();
1245 }
1246}
1247
1248
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001249static int tcg_cpu_exec(CPUState *cpu)
1250{
1251 int ret;
1252#ifdef CONFIG_PROFILER
1253 int64_t ti;
1254#endif
1255
1256#ifdef CONFIG_PROFILER
1257 ti = profile_getclock();
1258#endif
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001259 qemu_mutex_unlock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001260 cpu_exec_start(cpu);
1261 ret = cpu_exec(cpu);
1262 cpu_exec_end(cpu);
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001263 qemu_mutex_lock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001264#ifdef CONFIG_PROFILER
1265 tcg_time += profile_getclock() - ti;
1266#endif
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001267 return ret;
1268}
1269
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001270/* Destroy any remaining vCPUs which have been unplugged and have
1271 * finished running
1272 */
1273static void deal_with_unplugged_cpus(void)
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001274{
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001275 CPUState *cpu;
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001276
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001277 CPU_FOREACH(cpu) {
1278 if (cpu->unplug && !cpu_can_run(cpu)) {
1279 qemu_tcg_destroy_vcpu(cpu);
1280 cpu->created = false;
1281 qemu_cond_signal(&qemu_cpu_cond);
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001282 break;
1283 }
1284 }
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001285}
Jan Kiszkabdb7ca62011-09-26 09:40:39 +02001286
Alex Bennée65467062017-02-23 18:29:09 +00001287/* Single-threaded TCG
1288 *
1289 * In the single-threaded case each vCPU is simulated in turn. If
1290 * there is more than a single vCPU we create a simple timer to kick
1291 * the vCPU and ensure we don't get stuck in a tight loop in one vCPU.
1292 * This is done explicitly rather than relying on side-effects
1293 * elsewhere.
1294 */
1295
Alex Bennée37257942017-02-23 18:29:14 +00001296static void *qemu_tcg_rr_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001297{
Andreas Färberc3586ba2012-05-03 01:41:24 +02001298 CPUState *cpu = arg;
Blue Swirl296af7c2010-03-29 19:23:50 +00001299
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001300 rcu_register_thread();
1301
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001302 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001303 qemu_thread_get_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001304
Andreas Färber38fcbd32013-07-07 19:50:23 +02001305 CPU_FOREACH(cpu) {
1306 cpu->thread_id = qemu_get_thread_id();
1307 cpu->created = true;
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001308 cpu->can_do_io = 1;
Andreas Färber38fcbd32013-07-07 19:50:23 +02001309 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001310 qemu_cond_signal(&qemu_cpu_cond);
1311
Jan Kiszkafa7d1862011-08-22 18:35:25 +02001312 /* wait for initial kick-off after machine start */
Emilio G. Cotac28e3992015-04-27 12:45:28 -04001313 while (first_cpu->stopped) {
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001314 qemu_cond_wait(first_cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001315
1316 /* process any pending work */
Andreas Färberbdc44642013-06-24 23:50:24 +02001317 CPU_FOREACH(cpu) {
Alex Bennée37257942017-02-23 18:29:14 +00001318 current_cpu = cpu;
Andreas Färber182735e2013-05-29 22:29:20 +02001319 qemu_wait_io_event_common(cpu);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001320 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001321 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001322
Alex Bennée65467062017-02-23 18:29:09 +00001323 start_tcg_kick_timer();
1324
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001325 cpu = first_cpu;
1326
Alex Bennéee5143e32017-02-23 18:29:12 +00001327 /* process any pending work */
1328 cpu->exit_request = 1;
1329
Blue Swirl296af7c2010-03-29 19:23:50 +00001330 while (1) {
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001331 /* Account partial waits to QEMU_CLOCK_VIRTUAL. */
1332 qemu_account_warp_timer();
1333
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001334 /* Run the timers here. This is much more efficient than
1335 * waking up the I/O thread and waiting for completion.
1336 */
1337 handle_icount_deadline();
1338
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001339 if (!cpu) {
1340 cpu = first_cpu;
1341 }
1342
Alex Bennéee5143e32017-02-23 18:29:12 +00001343 while (cpu && !cpu->queued_work_first && !cpu->exit_request) {
1344
Alex Bennée791158d2017-02-23 18:29:10 +00001345 atomic_mb_set(&tcg_current_rr_cpu, cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001346 current_cpu = cpu;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001347
1348 qemu_clock_enable(QEMU_CLOCK_VIRTUAL,
1349 (cpu->singlestep_enabled & SSTEP_NOTIMER) == 0);
1350
1351 if (cpu_can_run(cpu)) {
1352 int r;
Alex Bennée05248382017-03-29 16:46:59 +01001353
1354 prepare_icount_for_run(cpu);
1355
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001356 r = tcg_cpu_exec(cpu);
Alex Bennée05248382017-03-29 16:46:59 +01001357
1358 process_icount_data(cpu);
1359
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001360 if (r == EXCP_DEBUG) {
1361 cpu_handle_guest_debug(cpu);
1362 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001363 } else if (r == EXCP_ATOMIC) {
1364 qemu_mutex_unlock_iothread();
1365 cpu_exec_step_atomic(cpu);
1366 qemu_mutex_lock_iothread();
1367 break;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001368 }
Alex Bennée37257942017-02-23 18:29:14 +00001369 } else if (cpu->stop) {
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001370 if (cpu->unplug) {
1371 cpu = CPU_NEXT(cpu);
1372 }
1373 break;
1374 }
1375
Alex Bennéee5143e32017-02-23 18:29:12 +00001376 cpu = CPU_NEXT(cpu);
1377 } /* while (cpu && !cpu->exit_request).. */
1378
Alex Bennée791158d2017-02-23 18:29:10 +00001379 /* Does not need atomic_mb_set because a spurious wakeup is okay. */
1380 atomic_set(&tcg_current_rr_cpu, NULL);
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001381
Alex Bennéee5143e32017-02-23 18:29:12 +00001382 if (cpu && cpu->exit_request) {
1383 atomic_mb_set(&cpu->exit_request, 0);
1384 }
Alex Blighac70aaf2013-08-21 16:02:57 +01001385
Alex Bennée37257942017-02-23 18:29:14 +00001386 qemu_tcg_wait_io_event(cpu ? cpu : QTAILQ_FIRST(&cpus));
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001387 deal_with_unplugged_cpus();
Blue Swirl296af7c2010-03-29 19:23:50 +00001388 }
1389
1390 return NULL;
1391}
1392
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001393static void *qemu_hax_cpu_thread_fn(void *arg)
1394{
1395 CPUState *cpu = arg;
1396 int r;
Vincent Palatinb3d3a422017-03-20 11:15:49 +01001397
1398 qemu_mutex_lock_iothread();
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001399 qemu_thread_get_self(cpu->thread);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001400
1401 cpu->thread_id = qemu_get_thread_id();
1402 cpu->created = true;
1403 cpu->halted = 0;
1404 current_cpu = cpu;
1405
1406 hax_init_vcpu(cpu);
1407 qemu_cond_signal(&qemu_cpu_cond);
1408
1409 while (1) {
1410 if (cpu_can_run(cpu)) {
1411 r = hax_smp_cpu_exec(cpu);
1412 if (r == EXCP_DEBUG) {
1413 cpu_handle_guest_debug(cpu);
1414 }
1415 }
1416
1417 while (cpu_thread_is_idle(cpu)) {
1418 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
1419 }
1420#ifdef _WIN32
1421 SleepEx(0, TRUE);
1422#endif
1423 qemu_wait_io_event_common(cpu);
1424 }
1425 return NULL;
1426}
1427
1428#ifdef _WIN32
1429static void CALLBACK dummy_apc_func(ULONG_PTR unused)
1430{
1431}
1432#endif
1433
Alex Bennée37257942017-02-23 18:29:14 +00001434/* Multi-threaded TCG
1435 *
1436 * In the multi-threaded case each vCPU has its own thread. The TLS
1437 * variable current_cpu can be used deep in the code to find the
1438 * current CPUState for a given thread.
1439 */
1440
1441static void *qemu_tcg_cpu_thread_fn(void *arg)
1442{
1443 CPUState *cpu = arg;
1444
Alex Bennéebf51c722017-03-30 18:32:29 +01001445 g_assert(!use_icount);
1446
Alex Bennée37257942017-02-23 18:29:14 +00001447 rcu_register_thread();
1448
1449 qemu_mutex_lock_iothread();
1450 qemu_thread_get_self(cpu->thread);
1451
1452 cpu->thread_id = qemu_get_thread_id();
1453 cpu->created = true;
1454 cpu->can_do_io = 1;
1455 current_cpu = cpu;
1456 qemu_cond_signal(&qemu_cpu_cond);
1457
1458 /* process any pending work */
1459 cpu->exit_request = 1;
1460
1461 while (1) {
1462 if (cpu_can_run(cpu)) {
1463 int r;
1464 r = tcg_cpu_exec(cpu);
1465 switch (r) {
1466 case EXCP_DEBUG:
1467 cpu_handle_guest_debug(cpu);
1468 break;
1469 case EXCP_HALTED:
1470 /* during start-up the vCPU is reset and the thread is
1471 * kicked several times. If we don't ensure we go back
1472 * to sleep in the halted state we won't cleanly
1473 * start-up when the vCPU is enabled.
1474 *
1475 * cpu->halted should ensure we sleep in wait_io_event
1476 */
1477 g_assert(cpu->halted);
1478 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001479 case EXCP_ATOMIC:
1480 qemu_mutex_unlock_iothread();
1481 cpu_exec_step_atomic(cpu);
1482 qemu_mutex_lock_iothread();
Alex Bennée37257942017-02-23 18:29:14 +00001483 default:
1484 /* Ignore everything else? */
1485 break;
1486 }
Bharata B Raoa3e53272017-04-27 10:48:22 +05301487 } else if (cpu->unplug) {
1488 qemu_tcg_destroy_vcpu(cpu);
1489 cpu->created = false;
1490 qemu_cond_signal(&qemu_cpu_cond);
1491 qemu_mutex_unlock_iothread();
1492 return NULL;
Alex Bennée37257942017-02-23 18:29:14 +00001493 }
1494
Alex Bennée37257942017-02-23 18:29:14 +00001495 atomic_mb_set(&cpu->exit_request, 0);
1496 qemu_tcg_wait_io_event(cpu);
1497 }
1498
1499 return NULL;
1500}
1501
Andreas Färber2ff09a42012-05-03 00:23:30 +02001502static void qemu_cpu_kick_thread(CPUState *cpu)
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001503{
1504#ifndef _WIN32
1505 int err;
1506
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001507 if (cpu->thread_kicked) {
1508 return;
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001509 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001510 cpu->thread_kicked = true;
Andreas Färber814e6122012-05-02 17:00:37 +02001511 err = pthread_kill(cpu->thread->thread, SIG_IPI);
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001512 if (err) {
1513 fprintf(stderr, "qemu:%s: %s", __func__, strerror(err));
1514 exit(1);
1515 }
1516#else /* _WIN32 */
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001517 if (!qemu_cpu_is_self(cpu)) {
1518 if (!QueueUserAPC(dummy_apc_func, cpu->hThread, 0)) {
1519 fprintf(stderr, "%s: QueueUserAPC failed with error %lu\n",
1520 __func__, GetLastError());
1521 exit(1);
1522 }
1523 }
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001524#endif
1525}
1526
Andreas Färberc08d7422012-05-03 04:34:15 +02001527void qemu_cpu_kick(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001528{
Andreas Färberf5c121b2012-05-03 01:22:49 +02001529 qemu_cond_broadcast(cpu->halt_cond);
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001530 if (tcg_enabled()) {
Alex Bennée791158d2017-02-23 18:29:10 +00001531 cpu_exit(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001532 /* NOP unless doing single-thread RR */
Alex Bennée791158d2017-02-23 18:29:10 +00001533 qemu_cpu_kick_rr_cpu();
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001534 } else {
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001535 if (hax_enabled()) {
1536 /*
1537 * FIXME: race condition with the exit_request check in
1538 * hax_vcpu_hax_exec
1539 */
1540 cpu->exit_request = 1;
1541 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001542 qemu_cpu_kick_thread(cpu);
1543 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001544}
1545
Jan Kiszka46d62fa2011-02-01 22:15:59 +01001546void qemu_cpu_kick_self(void)
1547{
Andreas Färber4917cf42013-05-27 05:17:50 +02001548 assert(current_cpu);
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001549 qemu_cpu_kick_thread(current_cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001550}
1551
Andreas Färber60e82572012-05-02 22:23:49 +02001552bool qemu_cpu_is_self(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001553{
Andreas Färber814e6122012-05-02 17:00:37 +02001554 return qemu_thread_is_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001555}
1556
Paolo Bonzini79e2b9a2015-01-21 12:09:14 +01001557bool qemu_in_vcpu_thread(void)
Juan Quintelaaa723c22012-09-18 16:30:11 +02001558{
Andreas Färber4917cf42013-05-27 05:17:50 +02001559 return current_cpu && qemu_cpu_is_self(current_cpu);
Juan Quintelaaa723c22012-09-18 16:30:11 +02001560}
1561
/*
 * Per-thread flag maintained by qemu_mutex_lock_iothread() and
 * qemu_mutex_unlock_iothread().  Static storage starts out zeroed, so the
 * flag is false until the thread takes the lock through those helpers.
 */
static __thread bool iothread_locked;

/* Report whether the calling thread took the iothread lock via the helpers. */
bool qemu_mutex_iothread_locked(void)
{
    return iothread_locked;
}
1568
Blue Swirl296af7c2010-03-29 19:23:50 +00001569void qemu_mutex_lock_iothread(void)
1570{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001571 g_assert(!qemu_mutex_iothread_locked());
1572 qemu_mutex_lock(&qemu_global_mutex);
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001573 iothread_locked = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001574}
1575
1576void qemu_mutex_unlock_iothread(void)
1577{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001578 g_assert(qemu_mutex_iothread_locked());
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001579 iothread_locked = false;
Blue Swirl296af7c2010-03-29 19:23:50 +00001580 qemu_mutex_unlock(&qemu_global_mutex);
1581}
1582
Alex Bennéee8faee02016-10-27 16:09:58 +01001583static bool all_vcpus_paused(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001584{
Andreas Färberbdc44642013-06-24 23:50:24 +02001585 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001586
Andreas Färberbdc44642013-06-24 23:50:24 +02001587 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001588 if (!cpu->stopped) {
Alex Bennéee8faee02016-10-27 16:09:58 +01001589 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001590 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001591 }
1592
Alex Bennéee8faee02016-10-27 16:09:58 +01001593 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001594}
1595
1596void pause_all_vcpus(void)
1597{
Andreas Färberbdc44642013-06-24 23:50:24 +02001598 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001599
Alex Bligh40daca52013-08-21 16:03:02 +01001600 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, false);
Andreas Färberbdc44642013-06-24 23:50:24 +02001601 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001602 cpu->stop = true;
1603 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001604 }
1605
Juan Quintelaaa723c22012-09-18 16:30:11 +02001606 if (qemu_in_vcpu_thread()) {
Jan Kiszkad798e972012-02-17 18:31:16 +01001607 cpu_stop_current();
Jan Kiszkad798e972012-02-17 18:31:16 +01001608 }
1609
Blue Swirl296af7c2010-03-29 19:23:50 +00001610 while (!all_vcpus_paused()) {
Paolo Bonzinibe7d6c52011-03-12 17:44:02 +01001611 qemu_cond_wait(&qemu_pause_cond, &qemu_global_mutex);
Andreas Färberbdc44642013-06-24 23:50:24 +02001612 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001613 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001614 }
1615 }
1616}
1617
Igor Mammedov29936832013-04-23 10:29:37 +02001618void cpu_resume(CPUState *cpu)
1619{
1620 cpu->stop = false;
1621 cpu->stopped = false;
1622 qemu_cpu_kick(cpu);
1623}
1624
Blue Swirl296af7c2010-03-29 19:23:50 +00001625void resume_all_vcpus(void)
1626{
Andreas Färberbdc44642013-06-24 23:50:24 +02001627 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001628
Alex Bligh40daca52013-08-21 16:03:02 +01001629 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, true);
Andreas Färberbdc44642013-06-24 23:50:24 +02001630 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001631 cpu_resume(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001632 }
1633}
1634
Gu Zheng4c055ab2016-05-12 09:18:13 +05301635void cpu_remove(CPUState *cpu)
1636{
1637 cpu->stop = true;
1638 cpu->unplug = true;
1639 qemu_cpu_kick(cpu);
1640}
1641
Bharata B Rao2c579042016-05-12 09:18:14 +05301642void cpu_remove_sync(CPUState *cpu)
1643{
1644 cpu_remove(cpu);
1645 while (cpu->created) {
1646 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1647 }
1648}
1649
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001650/* For temporary buffers for forming a name */
1651#define VCPU_THREAD_NAME_SIZE 16
1652
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001653static void qemu_tcg_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001654{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001655 char thread_name[VCPU_THREAD_NAME_SIZE];
Alex Bennée37257942017-02-23 18:29:14 +00001656 static QemuCond *single_tcg_halt_cond;
1657 static QemuThread *single_tcg_cpu_thread;
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001658
Alex Bennée37257942017-02-23 18:29:14 +00001659 if (qemu_tcg_mttcg_enabled() || !single_tcg_cpu_thread) {
Andreas Färber814e6122012-05-02 17:00:37 +02001660 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001661 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1662 qemu_cond_init(cpu->halt_cond);
Alex Bennée37257942017-02-23 18:29:14 +00001663
1664 if (qemu_tcg_mttcg_enabled()) {
1665 /* create a thread per vCPU with TCG (MTTCG) */
1666 parallel_cpus = true;
1667 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/TCG",
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001668 cpu->cpu_index);
Alex Bennée37257942017-02-23 18:29:14 +00001669
1670 qemu_thread_create(cpu->thread, thread_name, qemu_tcg_cpu_thread_fn,
1671 cpu, QEMU_THREAD_JOINABLE);
1672
1673 } else {
1674 /* share a single thread for all cpus with TCG */
1675 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "ALL CPUs/TCG");
1676 qemu_thread_create(cpu->thread, thread_name,
1677 qemu_tcg_rr_cpu_thread_fn,
1678 cpu, QEMU_THREAD_JOINABLE);
1679
1680 single_tcg_halt_cond = cpu->halt_cond;
1681 single_tcg_cpu_thread = cpu->thread;
1682 }
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001683#ifdef _WIN32
Andreas Färber814e6122012-05-02 17:00:37 +02001684 cpu->hThread = qemu_thread_get_handle(cpu->thread);
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001685#endif
Andreas Färber61a46212012-05-02 22:49:36 +02001686 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001687 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001688 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001689 } else {
Alex Bennée37257942017-02-23 18:29:14 +00001690 /* For non-MTTCG cases we share the thread */
1691 cpu->thread = single_tcg_cpu_thread;
1692 cpu->halt_cond = single_tcg_halt_cond;
Blue Swirl296af7c2010-03-29 19:23:50 +00001693 }
1694}
1695
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001696static void qemu_hax_start_vcpu(CPUState *cpu)
1697{
1698 char thread_name[VCPU_THREAD_NAME_SIZE];
1699
1700 cpu->thread = g_malloc0(sizeof(QemuThread));
1701 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1702 qemu_cond_init(cpu->halt_cond);
1703
1704 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/HAX",
1705 cpu->cpu_index);
1706 qemu_thread_create(cpu->thread, thread_name, qemu_hax_cpu_thread_fn,
1707 cpu, QEMU_THREAD_JOINABLE);
1708#ifdef _WIN32
1709 cpu->hThread = qemu_thread_get_handle(cpu->thread);
1710#endif
1711 while (!cpu->created) {
1712 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1713 }
1714}
1715
Andreas Färber48a106b2013-05-27 02:20:39 +02001716static void qemu_kvm_start_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001717{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001718 char thread_name[VCPU_THREAD_NAME_SIZE];
1719
Andreas Färber814e6122012-05-02 17:00:37 +02001720 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001721 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1722 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001723 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/KVM",
1724 cpu->cpu_index);
1725 qemu_thread_create(cpu->thread, thread_name, qemu_kvm_cpu_thread_fn,
1726 cpu, QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001727 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001728 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001729 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001730}
1731
Andreas Färber10a90212013-05-27 02:24:35 +02001732static void qemu_dummy_start_vcpu(CPUState *cpu)
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001733{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001734 char thread_name[VCPU_THREAD_NAME_SIZE];
1735
Andreas Färber814e6122012-05-02 17:00:37 +02001736 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001737 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1738 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001739 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/DUMMY",
1740 cpu->cpu_index);
1741 qemu_thread_create(cpu->thread, thread_name, qemu_dummy_cpu_thread_fn, cpu,
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001742 QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001743 while (!cpu->created) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001744 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1745 }
1746}
1747
Andreas Färberc643bed2013-05-27 03:23:24 +02001748void qemu_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001749{
Andreas Färberce3960e2012-12-17 03:27:07 +01001750 cpu->nr_cores = smp_cores;
1751 cpu->nr_threads = smp_threads;
Andreas Färberf324e762012-05-02 23:26:21 +02001752 cpu->stopped = true;
Peter Maydell56943e82016-01-21 14:15:04 +00001753
1754 if (!cpu->as) {
1755 /* If the target cpu hasn't set up any address spaces itself,
1756 * give it the default one.
1757 */
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001758 AddressSpace *as = address_space_init_shareable(cpu->memory,
1759 "cpu-memory");
Peter Maydell12ebc9a2016-01-21 14:15:04 +00001760 cpu->num_ases = 1;
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001761 cpu_address_space_init(cpu, as, 0);
Peter Maydell56943e82016-01-21 14:15:04 +00001762 }
1763
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001764 if (kvm_enabled()) {
Andreas Färber48a106b2013-05-27 02:20:39 +02001765 qemu_kvm_start_vcpu(cpu);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001766 } else if (hax_enabled()) {
1767 qemu_hax_start_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001768 } else if (tcg_enabled()) {
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001769 qemu_tcg_init_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001770 } else {
Andreas Färber10a90212013-05-27 02:24:35 +02001771 qemu_dummy_start_vcpu(cpu);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001772 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001773}
1774
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001775void cpu_stop_current(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001776{
Andreas Färber4917cf42013-05-27 05:17:50 +02001777 if (current_cpu) {
1778 current_cpu->stop = false;
1779 current_cpu->stopped = true;
1780 cpu_exit(current_cpu);
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001781 qemu_cond_broadcast(&qemu_pause_cond);
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001782 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001783}
1784
Kevin Wolf56983462013-07-05 13:49:54 +02001785int vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +00001786{
Juan Quintelaaa723c22012-09-18 16:30:11 +02001787 if (qemu_in_vcpu_thread()) {
Paolo Bonzini74892d22014-06-05 14:53:58 +02001788 qemu_system_vmstop_request_prepare();
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -03001789 qemu_system_vmstop_request(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001790 /*
1791 * FIXME: should not return to device code in case
1792 * vm_stop() has been requested.
1793 */
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001794 cpu_stop_current();
Kevin Wolf56983462013-07-05 13:49:54 +02001795 return 0;
Blue Swirl296af7c2010-03-29 19:23:50 +00001796 }
Kevin Wolf56983462013-07-05 13:49:54 +02001797
1798 return do_vm_stop(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001799}
1800
Claudio Imbrenda2d76e822017-02-14 18:07:47 +01001801/**
1802 * Prepare for (re)starting the VM.
1803 * Returns -1 if the vCPUs are not to be restarted (e.g. if they are already
1804 * running or in case of an error condition), 0 otherwise.
1805 */
1806int vm_prepare_start(void)
1807{
1808 RunState requested;
1809 int res = 0;
1810
1811 qemu_vmstop_requested(&requested);
1812 if (runstate_is_running() && requested == RUN_STATE__MAX) {
1813 return -1;
1814 }
1815
1816 /* Ensure that a STOP/RESUME pair of events is emitted if a
1817 * vmstop request was pending. The BLOCK_IO_ERROR event, for
1818 * example, according to documentation is always followed by
1819 * the STOP event.
1820 */
1821 if (runstate_is_running()) {
1822 qapi_event_send_stop(&error_abort);
1823 res = -1;
1824 } else {
1825 replay_enable_events();
1826 cpu_enable_ticks();
1827 runstate_set(RUN_STATE_RUNNING);
1828 vm_state_notify(1, RUN_STATE_RUNNING);
1829 }
1830
1831 /* We are sending this now, but the CPUs will be resumed shortly later */
1832 qapi_event_send_resume(&error_abort);
1833 return res;
1834}
1835
/* Start the VM: resume all vCPUs when vm_prepare_start() returns 0. */
void vm_start(void)
{
    if (vm_prepare_start() == 0) {
        resume_all_vcpus();
    }
}
1842
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001843/* does a state transition even if the VM is already stopped,
1844 current state is forgotten forever */
Kevin Wolf56983462013-07-05 13:49:54 +02001845int vm_stop_force_state(RunState state)
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001846{
1847 if (runstate_is_running()) {
Kevin Wolf56983462013-07-05 13:49:54 +02001848 return vm_stop(state);
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001849 } else {
1850 runstate_set(state);
Wen Congyangb2780d32015-11-20 17:34:38 +08001851
1852 bdrv_drain_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +02001853 /* Make sure to return an error if the flush in a previous vm_stop()
1854 * failed. */
John Snow22af08e2016-09-22 21:45:51 -04001855 return bdrv_flush_all();
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001856 }
1857}
1858
Stefan Weil9a78eea2010-10-22 23:03:33 +02001859void list_cpus(FILE *f, fprintf_function cpu_fprintf, const char *optarg)
Blue Swirl262353c2010-05-04 19:55:35 +00001860{
1861 /* XXX: implement xxx_cpu_list for targets that still miss it */
Peter Maydelle916cbf2012-09-05 17:41:08 -03001862#if defined(cpu_list)
1863 cpu_list(f, cpu_fprintf);
Blue Swirl262353c2010-05-04 19:55:35 +00001864#endif
1865}
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001866
1867CpuInfoList *qmp_query_cpus(Error **errp)
1868{
Igor Mammedovafed5a52017-05-10 13:29:55 +02001869 MachineState *ms = MACHINE(qdev_get_machine());
1870 MachineClass *mc = MACHINE_GET_CLASS(ms);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001871 CpuInfoList *head = NULL, *cur_item = NULL;
Andreas Färber182735e2013-05-29 22:29:20 +02001872 CPUState *cpu;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001873
Andreas Färberbdc44642013-06-24 23:50:24 +02001874 CPU_FOREACH(cpu) {
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001875 CpuInfoList *info;
Andreas Färber182735e2013-05-29 22:29:20 +02001876#if defined(TARGET_I386)
1877 X86CPU *x86_cpu = X86_CPU(cpu);
1878 CPUX86State *env = &x86_cpu->env;
1879#elif defined(TARGET_PPC)
1880 PowerPCCPU *ppc_cpu = POWERPC_CPU(cpu);
1881 CPUPPCState *env = &ppc_cpu->env;
1882#elif defined(TARGET_SPARC)
1883 SPARCCPU *sparc_cpu = SPARC_CPU(cpu);
1884 CPUSPARCState *env = &sparc_cpu->env;
1885#elif defined(TARGET_MIPS)
1886 MIPSCPU *mips_cpu = MIPS_CPU(cpu);
1887 CPUMIPSState *env = &mips_cpu->env;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001888#elif defined(TARGET_TRICORE)
1889 TriCoreCPU *tricore_cpu = TRICORE_CPU(cpu);
1890 CPUTriCoreState *env = &tricore_cpu->env;
Andreas Färber182735e2013-05-29 22:29:20 +02001891#endif
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001892
Andreas Färbercb446ec2013-05-01 14:24:52 +02001893 cpu_synchronize_state(cpu);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001894
1895 info = g_malloc0(sizeof(*info));
1896 info->value = g_malloc0(sizeof(*info->value));
Andreas Färber55e5c282012-12-17 06:18:02 +01001897 info->value->CPU = cpu->cpu_index;
Andreas Färber182735e2013-05-29 22:29:20 +02001898 info->value->current = (cpu == first_cpu);
Andreas Färber259186a2013-01-17 18:51:17 +01001899 info->value->halted = cpu->halted;
Eduardo Habkost58f88d42015-05-08 16:04:22 -03001900 info->value->qom_path = object_get_canonical_path(OBJECT(cpu));
Andreas Färber9f09e182012-05-03 06:59:07 +02001901 info->value->thread_id = cpu->thread_id;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001902#if defined(TARGET_I386)
Eric Blake86f4b682015-11-18 01:52:59 -07001903 info->value->arch = CPU_INFO_ARCH_X86;
Eric Blake544a3732016-02-17 23:48:27 -07001904 info->value->u.x86.pc = env->eip + env->segs[R_CS].base;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001905#elif defined(TARGET_PPC)
Eric Blake86f4b682015-11-18 01:52:59 -07001906 info->value->arch = CPU_INFO_ARCH_PPC;
Eric Blake544a3732016-02-17 23:48:27 -07001907 info->value->u.ppc.nip = env->nip;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001908#elif defined(TARGET_SPARC)
Eric Blake86f4b682015-11-18 01:52:59 -07001909 info->value->arch = CPU_INFO_ARCH_SPARC;
Eric Blake544a3732016-02-17 23:48:27 -07001910 info->value->u.q_sparc.pc = env->pc;
1911 info->value->u.q_sparc.npc = env->npc;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001912#elif defined(TARGET_MIPS)
Eric Blake86f4b682015-11-18 01:52:59 -07001913 info->value->arch = CPU_INFO_ARCH_MIPS;
Eric Blake544a3732016-02-17 23:48:27 -07001914 info->value->u.q_mips.PC = env->active_tc.PC;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001915#elif defined(TARGET_TRICORE)
Eric Blake86f4b682015-11-18 01:52:59 -07001916 info->value->arch = CPU_INFO_ARCH_TRICORE;
Eric Blake544a3732016-02-17 23:48:27 -07001917 info->value->u.tricore.PC = env->PC;
Eric Blake86f4b682015-11-18 01:52:59 -07001918#else
1919 info->value->arch = CPU_INFO_ARCH_OTHER;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001920#endif
Igor Mammedovafed5a52017-05-10 13:29:55 +02001921 info->value->has_props = !!mc->cpu_index_to_instance_props;
1922 if (info->value->has_props) {
1923 CpuInstanceProperties *props;
1924 props = g_malloc0(sizeof(*props));
1925 *props = mc->cpu_index_to_instance_props(ms, cpu->cpu_index);
1926 info->value->props = props;
1927 }
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001928
1929 /* XXX: waiting for the qapi to support GSList */
1930 if (!cur_item) {
1931 head = cur_item = info;
1932 } else {
1933 cur_item->next = info;
1934 cur_item = info;
1935 }
1936 }
1937
1938 return head;
1939}
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001940
1941void qmp_memsave(int64_t addr, int64_t size, const char *filename,
1942 bool has_cpu, int64_t cpu_index, Error **errp)
1943{
1944 FILE *f;
1945 uint32_t l;
Andreas Färber55e5c282012-12-17 06:18:02 +01001946 CPUState *cpu;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001947 uint8_t buf[1024];
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001948 int64_t orig_addr = addr, orig_size = size;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001949
1950 if (!has_cpu) {
1951 cpu_index = 0;
1952 }
1953
Andreas Färber151d1322013-02-15 15:41:49 +01001954 cpu = qemu_get_cpu(cpu_index);
1955 if (cpu == NULL) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001956 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "cpu-index",
1957 "a CPU number");
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001958 return;
1959 }
1960
1961 f = fopen(filename, "wb");
1962 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001963 error_setg_file_open(errp, errno, filename);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001964 return;
1965 }
1966
1967 while (size != 0) {
1968 l = sizeof(buf);
1969 if (l > size)
1970 l = size;
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301971 if (cpu_memory_rw_debug(cpu, addr, buf, l, 0) != 0) {
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001972 error_setg(errp, "Invalid addr 0x%016" PRIx64 "/size %" PRId64
1973 " specified", orig_addr, orig_size);
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301974 goto exit;
1975 }
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001976 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001977 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001978 goto exit;
1979 }
1980 addr += l;
1981 size -= l;
1982 }
1983
1984exit:
1985 fclose(f);
1986}
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001987
1988void qmp_pmemsave(int64_t addr, int64_t size, const char *filename,
1989 Error **errp)
1990{
1991 FILE *f;
1992 uint32_t l;
1993 uint8_t buf[1024];
1994
1995 f = fopen(filename, "wb");
1996 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001997 error_setg_file_open(errp, errno, filename);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001998 return;
1999 }
2000
2001 while (size != 0) {
2002 l = sizeof(buf);
2003 if (l > size)
2004 l = size;
Stefan Weileb6282f2014-04-07 20:28:23 +02002005 cpu_physical_memory_read(addr, buf, l);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02002006 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01002007 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02002008 goto exit;
2009 }
2010 addr += l;
2011 size -= l;
2012 }
2013
2014exit:
2015 fclose(f);
2016}
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02002017
2018void qmp_inject_nmi(Error **errp)
2019{
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +10002020 nmi_monitor_handle(monitor_get_cpu_index(), errp);
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02002021}
Sebastian Tanase27498be2014-07-25 11:56:33 +02002022
2023void dump_drift_info(FILE *f, fprintf_function cpu_fprintf)
2024{
2025 if (!use_icount) {
2026 return;
2027 }
2028
2029 cpu_fprintf(f, "Host - Guest clock %"PRIi64" ms\n",
2030 (cpu_get_clock() - cpu_get_icount())/SCALE_MS);
2031 if (icount_align_option) {
2032 cpu_fprintf(f, "Max guest delay %"PRIi64" ms\n", -max_delay/SCALE_MS);
2033 cpu_fprintf(f, "Max guest advance %"PRIi64" ms\n", max_advance/SCALE_MS);
2034 } else {
2035 cpu_fprintf(f, "Max guest delay NA\n");
2036 cpu_fprintf(f, "Max guest advance NA\n");
2037 }
2038}