blob: 4f91d2551368e6dc6d73f28c72e5eab372eb2ece [file] [log] [blame]
Blue Swirl296af7c2010-03-29 19:23:50 +00001/*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24
25/* Needed early for CONFIG_BSD etc. */
Peter Maydell7b31bbc2016-01-26 18:16:56 +000026#include "qemu/osdep.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010027#include "qemu-common.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000028#include "qemu/config-file.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010029#include "cpu.h"
Paolo Bonzini83c90892012-12-17 18:19:49 +010030#include "monitor/monitor.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020031#include "qapi/qmp/qerror.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010032#include "qemu/error-report.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010033#include "sysemu/sysemu.h"
Max Reitzda31d592016-03-16 19:54:32 +010034#include "sysemu/block-backend.h"
Paolo Bonzini022c62c2012-12-17 18:19:49 +010035#include "exec/gdbstub.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010036#include "sysemu/dma.h"
Vincent Palatinb3946622017-01-10 11:59:55 +010037#include "sysemu/hw_accel.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010038#include "sysemu/kvm.h"
Vincent Palatinb0cb0a62017-01-10 11:59:57 +010039#include "sysemu/hax.h"
Luiz Capitulinode0b36b2011-09-21 16:38:35 -030040#include "qmp-commands.h"
Paolo Bonzini63c91552016-03-15 13:18:37 +010041#include "exec/exec-all.h"
Blue Swirl296af7c2010-03-29 19:23:50 +000042
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010043#include "qemu/thread.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010044#include "sysemu/cpus.h"
45#include "sysemu/qtest.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010046#include "qemu/main-loop.h"
47#include "qemu/bitmap.h"
Liu Ping Fancb365642013-09-25 14:20:58 +080048#include "qemu/seqlock.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000049#include "tcg.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020050#include "qapi-event.h"
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +100051#include "hw/nmi.h"
Pavel Dovgalyuk8b427042015-09-17 19:24:05 +030052#include "sysemu/replay.h"
Igor Mammedovafed5a52017-05-10 13:29:55 +020053#include "hw/boards.h"
Jan Kiszka0ff0fc12011-06-23 10:15:55 +020054
#ifdef CONFIG_LINUX

#include <sys/prctl.h>

/*
 * Fallback values for the PR_MCE_KILL* prctl() constants; each one is only
 * defined here when <sys/prctl.h> did not already provide it.
 */
#if !defined(PR_MCE_KILL)
#define PR_MCE_KILL 33
#endif

#if !defined(PR_MCE_KILL_SET)
#define PR_MCE_KILL_SET 1
#endif

#if !defined(PR_MCE_KILL_EARLY)
#define PR_MCE_KILL_EARLY 1
#endif

#endif /* CONFIG_LINUX */
72
Sebastian Tanase27498be2014-07-25 11:56:33 +020073int64_t max_delay;
74int64_t max_advance;
Blue Swirl296af7c2010-03-29 19:23:50 +000075
Jason J. Herne2adcc852015-09-08 13:12:33 -040076/* vcpu throttling controls */
77static QEMUTimer *throttle_timer;
78static unsigned int throttle_percentage;
79
80#define CPU_THROTTLE_PCT_MIN 1
81#define CPU_THROTTLE_PCT_MAX 99
82#define CPU_THROTTLE_TIMESLICE_NS 10000000
83
Tiejun Chen321bc0b2013-08-02 09:43:09 +080084bool cpu_is_stopped(CPUState *cpu)
85{
86 return cpu->stopped || !runstate_is_running();
87}
88
Andreas Färbera98ae1d2013-05-26 23:21:08 +020089static bool cpu_thread_is_idle(CPUState *cpu)
Peter Maydellac873f12012-07-19 16:52:27 +010090{
Andreas Färberc64ca812012-05-03 02:11:45 +020091 if (cpu->stop || cpu->queued_work_first) {
Peter Maydellac873f12012-07-19 16:52:27 +010092 return false;
93 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +080094 if (cpu_is_stopped(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +010095 return true;
96 }
Andreas Färber8c2e1b02013-08-25 18:53:55 +020097 if (!cpu->halted || cpu_has_work(cpu) ||
Alexander Graf215e79c2013-04-24 22:24:12 +020098 kvm_halt_in_kernel()) {
Peter Maydellac873f12012-07-19 16:52:27 +010099 return false;
100 }
101 return true;
102}
103
104static bool all_cpu_threads_idle(void)
105{
Andreas Färber182735e2013-05-29 22:29:20 +0200106 CPUState *cpu;
Peter Maydellac873f12012-07-19 16:52:27 +0100107
Andreas Färberbdc44642013-06-24 23:50:24 +0200108 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200109 if (!cpu_thread_is_idle(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +0100110 return false;
111 }
112 }
113 return true;
114}
115
Blue Swirl296af7c2010-03-29 19:23:50 +0000116/***********************************************************/
Paolo Bonzini946fb272011-09-12 13:57:37 +0200117/* guest cycle counter */
118
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200119/* Protected by TimersState seqlock */
120
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200121static bool icount_sleep = true;
Sebastian Tanase71468392014-07-23 11:47:50 +0200122static int64_t vm_clock_warp_start = -1;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200123/* Conversion factor from emulated instructions to virtual clock ticks. */
124static int icount_time_shift;
125/* Arbitrarily pick 1MIPS as the minimum allowable speed. */
126#define MAX_ICOUNT_SHIFT 10
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200127
Paolo Bonzini946fb272011-09-12 13:57:37 +0200128static QEMUTimer *icount_rt_timer;
129static QEMUTimer *icount_vm_timer;
130static QEMUTimer *icount_warp_timer;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200131
132typedef struct TimersState {
Liu Ping Fancb365642013-09-25 14:20:58 +0800133 /* Protected by BQL. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200134 int64_t cpu_ticks_prev;
135 int64_t cpu_ticks_offset;
Liu Ping Fancb365642013-09-25 14:20:58 +0800136
137 /* cpu_clock_offset can be read out of BQL, so protect it with
138 * this lock.
139 */
140 QemuSeqLock vm_clock_seqlock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200141 int64_t cpu_clock_offset;
142 int32_t cpu_ticks_enabled;
143 int64_t dummy;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200144
145 /* Compensate for varying guest execution speed. */
146 int64_t qemu_icount_bias;
147 /* Only written by TCG thread */
148 int64_t qemu_icount;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200149} TimersState;
150
Liu Ping Fand9cd4002013-07-21 08:43:00 +0000151static TimersState timers_state;
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000152bool mttcg_enabled;
153
/*
 * We default to false if we know other options have been enabled
 * which are currently incompatible with MTTCG. Otherwise when each
 * guest (target) has been updated to support:
 *   - atomic instructions
 *   - memory ordering primitives (barriers)
 * they can set the appropriate CONFIG flags in ${target}-softmmu.mak
 *
 * Once a guest architecture has been converted to the new primitives
 * there are two remaining limitations to check.
 *
 * - The guest can't be oversized (e.g. 64 bit guest on 32 bit host)
 * - The host's memory order must be at least as strong as the guest's
 *
 * It may be possible in future to support strong guests on weak hosts
 * but that will require tagging all load/stores in a guest with their
 * implicit memory order requirements which would likely slow things
 * down a lot.
 */
173
/*
 * Return true when every ordering bit in TCG_GUEST_DEFAULT_MO is also set in
 * TCG_TARGET_DEFAULT_MO.  When either macro is undefined the answer is
 * always false.
 */
static bool check_tcg_memory_orders_compatible(void)
{
    bool compatible = false;

#if defined(TCG_GUEST_DEFAULT_MO) && defined(TCG_TARGET_DEFAULT_MO)
    compatible = (TCG_GUEST_DEFAULT_MO & ~TCG_TARGET_DEFAULT_MO) == 0;
#endif
    return compatible;
}
182
/*
 * Default for mttcg_enabled when no "thread" option was given: true only if
 * the target defines TARGET_SUPPORTS_MTTCG, icount is off, the guest is not
 * oversized, and the memory-order check passes.
 */
static bool default_mttcg_enabled(void)
{
#ifdef TARGET_SUPPORTS_MTTCG
    if (!use_icount && !TCG_OVERSIZED_GUEST) {
        return check_tcg_memory_orders_compatible();
    }
#endif
    return false;
}
195
196void qemu_tcg_configure(QemuOpts *opts, Error **errp)
197{
198 const char *t = qemu_opt_get(opts, "thread");
199 if (t) {
200 if (strcmp(t, "multi") == 0) {
201 if (TCG_OVERSIZED_GUEST) {
202 error_setg(errp, "No MTTCG when guest word size > hosts");
Alex Bennée83fd9622017-02-27 17:09:01 +0000203 } else if (use_icount) {
204 error_setg(errp, "No MTTCG when icount is enabled");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000205 } else {
Nikunj A Dadhania86953502017-04-10 11:36:55 +0530206#ifndef TARGET_SUPPORTS_MTTCG
Alex Bennéec34c7622017-02-28 14:40:17 +0000207 error_report("Guest not yet converted to MTTCG - "
208 "you may get unexpected results");
209#endif
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000210 if (!check_tcg_memory_orders_compatible()) {
211 error_report("Guest expects a stronger memory ordering "
212 "than the host provides");
Pranith Kumar8cfef892017-03-25 16:19:23 -0400213 error_printf("This may cause strange/hard to debug errors\n");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000214 }
215 mttcg_enabled = true;
216 }
217 } else if (strcmp(t, "single") == 0) {
218 mttcg_enabled = false;
219 } else {
220 error_setg(errp, "Invalid 'thread' setting %s", t);
221 }
222 } else {
223 mttcg_enabled = default_mttcg_enabled();
224 }
225}
Paolo Bonzini946fb272011-09-12 13:57:37 +0200226
Alex Bennéee4cd9652017-03-31 16:09:42 +0100227/* The current number of executed instructions is based on what we
228 * originally budgeted minus the current state of the decrementing
229 * icount counters in extra/u16.low.
230 */
231static int64_t cpu_get_icount_executed(CPUState *cpu)
232{
233 return cpu->icount_budget - (cpu->icount_decr.u16.low + cpu->icount_extra);
234}
235
Alex Bennée512d3c82017-04-05 12:32:37 +0100236/*
237 * Update the global shared timer_state.qemu_icount to take into
238 * account executed instructions. This is done by the TCG vCPU
239 * thread so the main-loop can see time has moved forward.
240 */
241void cpu_update_icount(CPUState *cpu)
242{
243 int64_t executed = cpu_get_icount_executed(cpu);
244 cpu->icount_budget -= executed;
245
246#ifdef CONFIG_ATOMIC64
247 atomic_set__nocheck(&timers_state.qemu_icount,
248 atomic_read__nocheck(&timers_state.qemu_icount) +
249 executed);
250#else /* FIXME: we need 64bit atomics to do this safely */
251 timers_state.qemu_icount += executed;
252#endif
253}
254
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300255int64_t cpu_get_icount_raw(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200256{
Andreas Färber4917cf42013-05-27 05:17:50 +0200257 CPUState *cpu = current_cpu;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200258
Alex Bennée243c5f72017-03-30 18:49:22 +0100259 if (cpu && cpu->running) {
Paolo Bonzini414b15c2015-06-24 14:16:26 +0200260 if (!cpu->can_do_io) {
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300261 fprintf(stderr, "Bad icount read\n");
262 exit(1);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200263 }
Alex Bennéee4cd9652017-03-31 16:09:42 +0100264 /* Take into account what has run */
Alex Bennée1d059062017-04-05 10:53:47 +0100265 cpu_update_icount(cpu);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200266 }
Alex Bennée1d059062017-04-05 10:53:47 +0100267#ifdef CONFIG_ATOMIC64
268 return atomic_read__nocheck(&timers_state.qemu_icount);
269#else /* FIXME: we need 64bit atomics to do this safely */
270 return timers_state.qemu_icount;
271#endif
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300272}
273
274/* Return the virtual CPU time, based on the instruction counter. */
275static int64_t cpu_get_icount_locked(void)
276{
277 int64_t icount = cpu_get_icount_raw();
KONRAD Frederic3f031312014-08-01 01:37:15 +0200278 return timers_state.qemu_icount_bias + cpu_icount_to_ns(icount);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200279}
280
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200281int64_t cpu_get_icount(void)
282{
283 int64_t icount;
284 unsigned start;
285
286 do {
287 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
288 icount = cpu_get_icount_locked();
289 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
290
291 return icount;
292}
293
KONRAD Frederic3f031312014-08-01 01:37:15 +0200294int64_t cpu_icount_to_ns(int64_t icount)
295{
296 return icount << icount_time_shift;
297}
298
Cao jind90f3cc2016-07-29 19:05:38 +0800299/* return the time elapsed in VM between vm_start and vm_stop. Unless
300 * icount is active, cpu_get_ticks() uses units of the host CPU cycle
301 * counter.
302 *
303 * Caller must hold the BQL
304 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200305int64_t cpu_get_ticks(void)
306{
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100307 int64_t ticks;
308
Paolo Bonzini946fb272011-09-12 13:57:37 +0200309 if (use_icount) {
310 return cpu_get_icount();
311 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100312
313 ticks = timers_state.cpu_ticks_offset;
314 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400315 ticks += cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200316 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100317
318 if (timers_state.cpu_ticks_prev > ticks) {
319 /* Note: non increasing ticks may happen if the host uses
320 software suspend */
321 timers_state.cpu_ticks_offset += timers_state.cpu_ticks_prev - ticks;
322 ticks = timers_state.cpu_ticks_prev;
323 }
324
325 timers_state.cpu_ticks_prev = ticks;
326 return ticks;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200327}
328
Liu Ping Fancb365642013-09-25 14:20:58 +0800329static int64_t cpu_get_clock_locked(void)
330{
Cao jin1d45cea2016-07-29 19:05:37 +0800331 int64_t time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800332
Cao jin1d45cea2016-07-29 19:05:37 +0800333 time = timers_state.cpu_clock_offset;
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100334 if (timers_state.cpu_ticks_enabled) {
Cao jin1d45cea2016-07-29 19:05:37 +0800335 time += get_clock();
Liu Ping Fancb365642013-09-25 14:20:58 +0800336 }
337
Cao jin1d45cea2016-07-29 19:05:37 +0800338 return time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800339}
340
Cao jind90f3cc2016-07-29 19:05:38 +0800341/* Return the monotonic time elapsed in VM, i.e.,
Peter Maydell8212ff82016-09-15 10:24:22 +0100342 * the time between vm_start and vm_stop
343 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200344int64_t cpu_get_clock(void)
345{
346 int64_t ti;
Liu Ping Fancb365642013-09-25 14:20:58 +0800347 unsigned start;
348
349 do {
350 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
351 ti = cpu_get_clock_locked();
352 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
353
354 return ti;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200355}
356
Liu Ping Fancb365642013-09-25 14:20:58 +0800357/* enable cpu_get_ticks()
Cao jin3224e872016-07-08 18:31:37 +0800358 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800359 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200360void cpu_enable_ticks(void)
361{
Liu Ping Fancb365642013-09-25 14:20:58 +0800362 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400363 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200364 if (!timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400365 timers_state.cpu_ticks_offset -= cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200366 timers_state.cpu_clock_offset -= get_clock();
367 timers_state.cpu_ticks_enabled = 1;
368 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400369 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200370}
371
372/* disable cpu_get_ticks() : the clock is stopped. You must not call
Liu Ping Fancb365642013-09-25 14:20:58 +0800373 * cpu_get_ticks() after that.
Cao jin3224e872016-07-08 18:31:37 +0800374 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800375 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200376void cpu_disable_ticks(void)
377{
Liu Ping Fancb365642013-09-25 14:20:58 +0800378 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400379 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200380 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400381 timers_state.cpu_ticks_offset += cpu_get_host_ticks();
Liu Ping Fancb365642013-09-25 14:20:58 +0800382 timers_state.cpu_clock_offset = cpu_get_clock_locked();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200383 timers_state.cpu_ticks_enabled = 0;
384 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400385 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200386}
387
388/* Correlation between real and virtual time is always going to be
389 fairly approximate, so ignore small variation.
390 When the guest is idle real and virtual time will be aligned in
391 the IO wait loop. */
Rutuja Shah73bcb242016-03-21 21:32:30 +0530392#define ICOUNT_WOBBLE (NANOSECONDS_PER_SECOND / 10)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200393
394static void icount_adjust(void)
395{
396 int64_t cur_time;
397 int64_t cur_icount;
398 int64_t delta;
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200399
400 /* Protected by TimersState mutex. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200401 static int64_t last_delta;
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200402
Paolo Bonzini946fb272011-09-12 13:57:37 +0200403 /* If the VM is not running, then do nothing. */
404 if (!runstate_is_running()) {
405 return;
406 }
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200407
Emilio G. Cota03719e42016-06-08 14:55:21 -0400408 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200409 cur_time = cpu_get_clock_locked();
410 cur_icount = cpu_get_icount_locked();
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200411
Paolo Bonzini946fb272011-09-12 13:57:37 +0200412 delta = cur_icount - cur_time;
413 /* FIXME: This is a very crude algorithm, somewhat prone to oscillation. */
414 if (delta > 0
415 && last_delta + ICOUNT_WOBBLE < delta * 2
416 && icount_time_shift > 0) {
417 /* The guest is getting too far ahead. Slow time down. */
418 icount_time_shift--;
419 }
420 if (delta < 0
421 && last_delta - ICOUNT_WOBBLE > delta * 2
422 && icount_time_shift < MAX_ICOUNT_SHIFT) {
423 /* The guest is getting too far behind. Speed time up. */
424 icount_time_shift++;
425 }
426 last_delta = delta;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200427 timers_state.qemu_icount_bias = cur_icount
428 - (timers_state.qemu_icount << icount_time_shift);
Emilio G. Cota03719e42016-06-08 14:55:21 -0400429 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200430}
431
432static void icount_adjust_rt(void *opaque)
433{
Alex Bligh40daca52013-08-21 16:03:02 +0100434 timer_mod(icount_rt_timer,
Pavel Dovgalyuk1979b902015-01-12 15:00:43 +0300435 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200436 icount_adjust();
437}
438
439static void icount_adjust_vm(void *opaque)
440{
Alex Bligh40daca52013-08-21 16:03:02 +0100441 timer_mod(icount_vm_timer,
442 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530443 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200444 icount_adjust();
445}
446
447static int64_t qemu_icount_round(int64_t count)
448{
449 return (count + (1 << icount_time_shift) - 1) >> icount_time_shift;
450}
451
Pavel Dovgalyukefab87c2015-09-17 19:24:39 +0300452static void icount_warp_rt(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200453{
Alex Bennéeccffff42016-04-04 15:35:48 +0100454 unsigned seq;
455 int64_t warp_start;
456
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200457 /* The icount_warp_timer is rescheduled soon after vm_clock_warp_start
458 * changes from -1 to another value, so the race here is okay.
459 */
Alex Bennéeccffff42016-04-04 15:35:48 +0100460 do {
461 seq = seqlock_read_begin(&timers_state.vm_clock_seqlock);
462 warp_start = vm_clock_warp_start;
463 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, seq));
464
465 if (warp_start == -1) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200466 return;
467 }
468
Emilio G. Cota03719e42016-06-08 14:55:21 -0400469 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200470 if (runstate_is_running()) {
Pavel Dovgalyuk8eda2062015-09-17 19:24:28 +0300471 int64_t clock = REPLAY_CLOCK(REPLAY_CLOCK_VIRTUAL_RT,
472 cpu_get_clock_locked());
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200473 int64_t warp_delta;
474
475 warp_delta = clock - vm_clock_warp_start;
476 if (use_icount == 2) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200477 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100478 * In adaptive mode, do not let QEMU_CLOCK_VIRTUAL run too
Paolo Bonzini946fb272011-09-12 13:57:37 +0200479 * far ahead of real time.
480 */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200481 int64_t cur_icount = cpu_get_icount_locked();
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300482 int64_t delta = clock - cur_icount;
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200483 warp_delta = MIN(warp_delta, delta);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200484 }
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200485 timers_state.qemu_icount_bias += warp_delta;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200486 }
487 vm_clock_warp_start = -1;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400488 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200489
490 if (qemu_clock_expired(QEMU_CLOCK_VIRTUAL)) {
491 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
492 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200493}
494
/* Timer callback that simply runs icount_warp_rt(); @opaque is unused. */
static void icount_timer_cb(void *opaque)
{
    /* No need for a checkpoint because the timer already synchronizes
     * with CHECKPOINT_CLOCK_VIRTUAL_RT.
     */
    (void)opaque;
    icount_warp_rt();
}
502
Paolo Bonzini8156be52012-03-28 15:42:04 +0200503void qtest_clock_warp(int64_t dest)
504{
Alex Bligh40daca52013-08-21 16:03:02 +0100505 int64_t clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800506 AioContext *aio_context;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200507 assert(qtest_enabled());
Fam Zhengefef88b2015-01-19 17:51:43 +0800508 aio_context = qemu_get_aio_context();
Paolo Bonzini8156be52012-03-28 15:42:04 +0200509 while (clock < dest) {
Alex Bligh40daca52013-08-21 16:03:02 +0100510 int64_t deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Sergey Fedorovc9299e22014-06-10 13:10:28 +0400511 int64_t warp = qemu_soonest_timeout(dest - clock, deadline);
Fam Zhengefef88b2015-01-19 17:51:43 +0800512
Emilio G. Cota03719e42016-06-08 14:55:21 -0400513 seqlock_write_begin(&timers_state.vm_clock_seqlock);
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200514 timers_state.qemu_icount_bias += warp;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400515 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200516
Alex Bligh40daca52013-08-21 16:03:02 +0100517 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800518 timerlist_run_timers(aio_context->tlg.tl[QEMU_CLOCK_VIRTUAL]);
Alex Bligh40daca52013-08-21 16:03:02 +0100519 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200520 }
Alex Bligh40daca52013-08-21 16:03:02 +0100521 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200522}
523
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300524void qemu_start_warp_timer(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200525{
Paolo Bonzinice78d182013-10-07 17:30:02 +0200526 int64_t clock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200527 int64_t deadline;
528
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300529 if (!use_icount) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200530 return;
531 }
532
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300533 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
534 * do not fire, so computing the deadline does not make sense.
535 */
536 if (!runstate_is_running()) {
537 return;
538 }
539
540 /* warp clock deterministically in record/replay mode */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300541 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_START)) {
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300542 return;
543 }
544
Paolo Bonzinice78d182013-10-07 17:30:02 +0200545 if (!all_cpu_threads_idle()) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200546 return;
547 }
548
Paolo Bonzini8156be52012-03-28 15:42:04 +0200549 if (qtest_enabled()) {
550 /* When testing, qtest commands advance icount. */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300551 return;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200552 }
553
Alex Blighac70aaf2013-08-21 16:02:57 +0100554 /* We want to use the earliest deadline from ALL vm_clocks */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300555 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT);
Alex Bligh40daca52013-08-21 16:03:02 +0100556 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200557 if (deadline < 0) {
Victor CLEMENTd7a0f712015-05-29 17:14:06 +0200558 static bool notified;
559 if (!icount_sleep && !notified) {
560 error_report("WARNING: icount sleep disabled and no active timers");
561 notified = true;
562 }
Paolo Bonzinice78d182013-10-07 17:30:02 +0200563 return;
Alex Blighac70aaf2013-08-21 16:02:57 +0100564 }
565
Paolo Bonzini946fb272011-09-12 13:57:37 +0200566 if (deadline > 0) {
567 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100568 * Ensure QEMU_CLOCK_VIRTUAL proceeds even when the virtual CPU goes to
Paolo Bonzini946fb272011-09-12 13:57:37 +0200569 * sleep. Otherwise, the CPU might be waiting for a future timer
570 * interrupt to wake it up, but the interrupt never comes because
571 * the vCPU isn't running any insns and thus doesn't advance the
Alex Bligh40daca52013-08-21 16:03:02 +0100572 * QEMU_CLOCK_VIRTUAL.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200573 */
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200574 if (!icount_sleep) {
575 /*
576 * We never let VCPUs sleep in no sleep icount mode.
577 * If there is a pending QEMU_CLOCK_VIRTUAL timer we just advance
578 * to the next QEMU_CLOCK_VIRTUAL event and notify it.
579 * It is useful when we want a deterministic execution time,
580 * isolated from host latencies.
581 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400582 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200583 timers_state.qemu_icount_bias += deadline;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400584 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200585 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
586 } else {
587 /*
588 * We do stop VCPUs and only advance QEMU_CLOCK_VIRTUAL after some
589 * "real" time, (related to the time left until the next event) has
590 * passed. The QEMU_CLOCK_VIRTUAL_RT clock will do this.
591 * This avoids that the warps are visible externally; for example,
592 * you will not be sending network packets continuously instead of
593 * every 100ms.
594 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400595 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200596 if (vm_clock_warp_start == -1 || vm_clock_warp_start > clock) {
597 vm_clock_warp_start = clock;
598 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400599 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200600 timer_mod_anticipate(icount_warp_timer, clock + deadline);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200601 }
Alex Blighac70aaf2013-08-21 16:02:57 +0100602 } else if (deadline == 0) {
Alex Bligh40daca52013-08-21 16:03:02 +0100603 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200604 }
605}
606
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300607static void qemu_account_warp_timer(void)
608{
609 if (!use_icount || !icount_sleep) {
610 return;
611 }
612
613 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
614 * do not fire, so computing the deadline does not make sense.
615 */
616 if (!runstate_is_running()) {
617 return;
618 }
619
620 /* warp clock deterministically in record/replay mode */
621 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_ACCOUNT)) {
622 return;
623 }
624
625 timer_del(icount_warp_timer);
626 icount_warp_rt();
627}
628
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200629static bool icount_state_needed(void *opaque)
630{
631 return use_icount;
632}
633
634/*
635 * This is a subsection for icount migration.
636 */
637static const VMStateDescription icount_vmstate_timers = {
638 .name = "timer/icount",
639 .version_id = 1,
640 .minimum_version_id = 1,
Juan Quintela5cd8cad2014-09-23 14:09:54 +0200641 .needed = icount_state_needed,
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200642 .fields = (VMStateField[]) {
643 VMSTATE_INT64(qemu_icount_bias, TimersState),
644 VMSTATE_INT64(qemu_icount, TimersState),
645 VMSTATE_END_OF_LIST()
646 }
647};
648
Paolo Bonzini946fb272011-09-12 13:57:37 +0200649static const VMStateDescription vmstate_timers = {
650 .name = "timer",
651 .version_id = 2,
652 .minimum_version_id = 1,
Juan Quintela35d08452014-04-16 16:01:33 +0200653 .fields = (VMStateField[]) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200654 VMSTATE_INT64(cpu_ticks_offset, TimersState),
655 VMSTATE_INT64(dummy, TimersState),
656 VMSTATE_INT64_V(cpu_clock_offset, TimersState, 2),
657 VMSTATE_END_OF_LIST()
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200658 },
Juan Quintela5cd8cad2014-09-23 14:09:54 +0200659 .subsections = (const VMStateDescription*[]) {
660 &icount_vmstate_timers,
661 NULL
Paolo Bonzini946fb272011-09-12 13:57:37 +0200662 }
663};
664
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100665static void cpu_throttle_thread(CPUState *cpu, run_on_cpu_data opaque)
Jason J. Herne2adcc852015-09-08 13:12:33 -0400666{
Jason J. Herne2adcc852015-09-08 13:12:33 -0400667 double pct;
668 double throttle_ratio;
669 long sleeptime_ns;
670
671 if (!cpu_throttle_get_percentage()) {
672 return;
673 }
674
675 pct = (double)cpu_throttle_get_percentage()/100;
676 throttle_ratio = pct / (1 - pct);
677 sleeptime_ns = (long)(throttle_ratio * CPU_THROTTLE_TIMESLICE_NS);
678
679 qemu_mutex_unlock_iothread();
680 atomic_set(&cpu->throttle_thread_scheduled, 0);
681 g_usleep(sleeptime_ns / 1000); /* Convert ns to us for usleep call */
682 qemu_mutex_lock_iothread();
683}
684
685static void cpu_throttle_timer_tick(void *opaque)
686{
687 CPUState *cpu;
688 double pct;
689
690 /* Stop the timer if needed */
691 if (!cpu_throttle_get_percentage()) {
692 return;
693 }
694 CPU_FOREACH(cpu) {
695 if (!atomic_xchg(&cpu->throttle_thread_scheduled, 1)) {
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100696 async_run_on_cpu(cpu, cpu_throttle_thread,
697 RUN_ON_CPU_NULL);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400698 }
699 }
700
701 pct = (double)cpu_throttle_get_percentage()/100;
702 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
703 CPU_THROTTLE_TIMESLICE_NS / (1-pct));
704}
705
706void cpu_throttle_set(int new_throttle_pct)
707{
708 /* Ensure throttle percentage is within valid range */
709 new_throttle_pct = MIN(new_throttle_pct, CPU_THROTTLE_PCT_MAX);
710 new_throttle_pct = MAX(new_throttle_pct, CPU_THROTTLE_PCT_MIN);
711
712 atomic_set(&throttle_percentage, new_throttle_pct);
713
714 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
715 CPU_THROTTLE_TIMESLICE_NS);
716}
717
/*
 * Turn throttling off by resetting the percentage to zero.  The timer is
 * not touched here; cpu_throttle_timer_tick() stops re-arming itself once
 * it reads a zero percentage.
 */
void cpu_throttle_stop(void)
{
    atomic_set(&throttle_percentage, 0);
}
722
/* Return true while a non-zero throttle percentage is in effect. */
bool cpu_throttle_active(void)
{
    int pct = cpu_throttle_get_percentage();

    return pct != 0;
}
727
/* Return the current throttle percentage (0 means throttling is off). */
int cpu_throttle_get_percentage(void)
{
    return atomic_read(&throttle_percentage);
}
732
/*
 * One-time set-up of the timer state: initialise the seqlock inside
 * timers_state, register timers_state for migration through
 * vmstate_timers, and create (but do not arm) the throttle timer.
 */
void cpu_ticks_init(void)
{
    seqlock_init(&timers_state.vm_clock_seqlock);
    vmstate_register(NULL, 0, &vmstate_timers, &timers_state);
    /* Armed later by cpu_throttle_set(). */
    throttle_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
                                  cpu_throttle_timer_tick, NULL);
}
740
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200741void configure_icount(QemuOpts *opts, Error **errp)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200742{
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200743 const char *option;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200744 char *rem_str = NULL;
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200745
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200746 option = qemu_opt_get(opts, "shift");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200747 if (!option) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200748 if (qemu_opt_get(opts, "align") != NULL) {
749 error_setg(errp, "Please specify shift option when using align");
750 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200751 return;
752 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200753
754 icount_sleep = qemu_opt_get_bool(opts, "sleep", true);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200755 if (icount_sleep) {
756 icount_warp_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300757 icount_timer_cb, NULL);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200758 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200759
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200760 icount_align_option = qemu_opt_get_bool(opts, "align", false);
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200761
762 if (icount_align_option && !icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500763 error_setg(errp, "align=on and sleep=off are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200764 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200765 if (strcmp(option, "auto") != 0) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200766 errno = 0;
767 icount_time_shift = strtol(option, &rem_str, 0);
768 if (errno != 0 || *rem_str != '\0' || !strlen(option)) {
769 error_setg(errp, "icount: Invalid shift value");
770 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200771 use_icount = 1;
772 return;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200773 } else if (icount_align_option) {
774 error_setg(errp, "shift=auto and align=on are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200775 } else if (!icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500776 error_setg(errp, "shift=auto and sleep=off are incompatible");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200777 }
778
779 use_icount = 2;
780
781 /* 125MIPS seems a reasonable initial guess at the guest speed.
782 It will be corrected fairly quickly anyway. */
783 icount_time_shift = 3;
784
785 /* Have both realtime and virtual time triggers for speed adjustment.
786 The realtime trigger catches emulated time passing too slowly,
787 the virtual time trigger catches emulated time passing too fast.
788 Realtime triggers occur even when idle, so use them less frequently
789 than VM triggers. */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300790 icount_rt_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL_RT,
791 icount_adjust_rt, NULL);
Alex Bligh40daca52013-08-21 16:03:02 +0100792 timer_mod(icount_rt_timer,
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300793 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Alex Bligh40daca52013-08-21 16:03:02 +0100794 icount_vm_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
795 icount_adjust_vm, NULL);
796 timer_mod(icount_vm_timer,
797 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530798 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200799}
800
801/***********************************************************/
Alex Bennée65467062017-02-23 18:29:09 +0000802/* TCG vCPU kick timer
803 *
804 * The kick timer is responsible for moving single threaded vCPU
805 * emulation on to the next vCPU. If more than one vCPU is running a
 * timer event will force a cpu->exit so the next vCPU can get
807 * scheduled.
808 *
809 * The timer is removed if all vCPUs are idle and restarted again once
810 * idleness is complete.
811 */
812
/* Kick timer; NULL whenever no timer is currently set up. */
static QEMUTimer *tcg_kick_vcpu_timer;
/* vCPU currently being run by the round-robin loop, NULL otherwise. */
static CPUState *tcg_current_rr_cpu;

/* Interval between two kicks, in nanoseconds (a tenth of a second). */
#define TCG_KICK_PERIOD (NANOSECONDS_PER_SECOND / 10)
817
818static inline int64_t qemu_tcg_next_kick(void)
819{
820 return qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + TCG_KICK_PERIOD;
821}
822
Alex Bennée791158d2017-02-23 18:29:10 +0000823/* Kick the currently round-robin scheduled vCPU */
824static void qemu_cpu_kick_rr_cpu(void)
825{
826 CPUState *cpu;
Alex Bennée791158d2017-02-23 18:29:10 +0000827 do {
828 cpu = atomic_mb_read(&tcg_current_rr_cpu);
829 if (cpu) {
830 cpu_exit(cpu);
831 }
832 } while (cpu != atomic_mb_read(&tcg_current_rr_cpu));
833}
834
/*
 * Empty work item.  qemu_timer_notify_cb() queues it with
 * async_run_on_cpu() purely so that the target vCPU has pending work.
 */
static void do_nothing(CPUState *cpu, run_on_cpu_data unused)
{
}
838
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100839void qemu_timer_notify_cb(void *opaque, QEMUClockType type)
840{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100841 if (!use_icount || type != QEMU_CLOCK_VIRTUAL) {
842 qemu_notify_event();
843 return;
844 }
845
846 if (!qemu_in_vcpu_thread() && first_cpu) {
847 /* qemu_cpu_kick is not enough to kick a halted CPU out of
848 * qemu_tcg_wait_io_event. async_run_on_cpu, instead,
849 * causes cpu_thread_is_idle to return false. This way,
850 * handle_icount_deadline can run.
851 */
852 async_run_on_cpu(first_cpu, do_nothing, RUN_ON_CPU_NULL);
853 }
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100854}
855
/*
 * Callback of tcg_kick_vcpu_timer: re-arm the timer for the next period,
 * then kick the vCPU that the round-robin loop is currently running.
 *
 * @opaque: unused
 */
static void kick_tcg_thread(void *opaque)
{
    timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
    qemu_cpu_kick_rr_cpu();
}
861
862static void start_tcg_kick_timer(void)
863{
Alex Bennée37257942017-02-23 18:29:14 +0000864 if (!mttcg_enabled && !tcg_kick_vcpu_timer && CPU_NEXT(first_cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +0000865 tcg_kick_vcpu_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
866 kick_tcg_thread, NULL);
867 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
868 }
869}
870
871static void stop_tcg_kick_timer(void)
872{
873 if (tcg_kick_vcpu_timer) {
874 timer_del(tcg_kick_vcpu_timer);
875 tcg_kick_vcpu_timer = NULL;
876 }
877}
878
Alex Bennée65467062017-02-23 18:29:09 +0000879/***********************************************************/
Blue Swirl296af7c2010-03-29 19:23:50 +0000880void hw_error(const char *fmt, ...)
881{
882 va_list ap;
Andreas Färber55e5c282012-12-17 06:18:02 +0100883 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000884
885 va_start(ap, fmt);
886 fprintf(stderr, "qemu: hardware error: ");
887 vfprintf(stderr, fmt, ap);
888 fprintf(stderr, "\n");
Andreas Färberbdc44642013-06-24 23:50:24 +0200889 CPU_FOREACH(cpu) {
Andreas Färber55e5c282012-12-17 06:18:02 +0100890 fprintf(stderr, "CPU #%d:\n", cpu->cpu_index);
Andreas Färber878096e2013-05-27 01:33:50 +0200891 cpu_dump_state(cpu, stderr, fprintf, CPU_DUMP_FPU);
Blue Swirl296af7c2010-03-29 19:23:50 +0000892 }
893 va_end(ap);
894 abort();
895}
896
897void cpu_synchronize_all_states(void)
898{
Andreas Färber182735e2013-05-29 22:29:20 +0200899 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000900
Andreas Färberbdc44642013-06-24 23:50:24 +0200901 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200902 cpu_synchronize_state(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000903 }
904}
905
906void cpu_synchronize_all_post_reset(void)
907{
Andreas Färber182735e2013-05-29 22:29:20 +0200908 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000909
Andreas Färberbdc44642013-06-24 23:50:24 +0200910 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200911 cpu_synchronize_post_reset(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000912 }
913}
914
915void cpu_synchronize_all_post_init(void)
916{
Andreas Färber182735e2013-05-29 22:29:20 +0200917 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000918
Andreas Färberbdc44642013-06-24 23:50:24 +0200919 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200920 cpu_synchronize_post_init(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000921 }
922}
923
Kevin Wolf56983462013-07-05 13:49:54 +0200924static int do_vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +0000925{
Kevin Wolf56983462013-07-05 13:49:54 +0200926 int ret = 0;
927
Luiz Capitulino13548692011-07-29 15:36:43 -0300928 if (runstate_is_running()) {
Blue Swirl296af7c2010-03-29 19:23:50 +0000929 cpu_disable_ticks();
Blue Swirl296af7c2010-03-29 19:23:50 +0000930 pause_all_vcpus();
Luiz Capitulinof5bbfba2011-07-29 15:04:45 -0300931 runstate_set(state);
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -0300932 vm_state_notify(0, state);
Wenchao Xiaa4e15de2014-06-18 08:43:36 +0200933 qapi_event_send_stop(&error_abort);
Blue Swirl296af7c2010-03-29 19:23:50 +0000934 }
Kevin Wolf56983462013-07-05 13:49:54 +0200935
Kevin Wolf594a45c2013-07-18 14:52:19 +0200936 bdrv_drain_all();
Pavel Dovgalyuk6d0ceb82016-09-26 11:08:16 +0300937 replay_disable_events();
John Snow22af08e2016-09-22 21:45:51 -0400938 ret = bdrv_flush_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +0200939
Kevin Wolf56983462013-07-05 13:49:54 +0200940 return ret;
Blue Swirl296af7c2010-03-29 19:23:50 +0000941}
942
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200943static bool cpu_can_run(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +0000944{
Andreas Färber4fdeee72012-05-02 23:10:09 +0200945 if (cpu->stop) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200946 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100947 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +0800948 if (cpu_is_stopped(cpu)) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200949 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100950 }
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200951 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +0000952}
953
/*
 * Handle a debug exit from @cpu: record it as the CPU gdb should report,
 * raise a system debug request, and mark the vCPU as stopped.
 */
static void cpu_handle_guest_debug(CPUState *cpu)
{
    gdb_set_stop_cpu(cpu);
    qemu_system_debug_request();
    cpu->stopped = true;
}
960
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100961#ifdef CONFIG_LINUX
962static void sigbus_reraise(void)
963{
964 sigset_t set;
965 struct sigaction action;
966
967 memset(&action, 0, sizeof(action));
968 action.sa_handler = SIG_DFL;
969 if (!sigaction(SIGBUS, &action, NULL)) {
970 raise(SIGBUS);
971 sigemptyset(&set);
972 sigaddset(&set, SIGBUS);
Peter Maydella2d17612016-05-16 18:33:59 +0100973 pthread_sigmask(SIG_UNBLOCK, &set, NULL);
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100974 }
975 perror("Failed to re-raise SIGBUS!\n");
976 abort();
977}
978
Paolo Bonzinid98d4072017-02-08 13:22:12 +0100979static void sigbus_handler(int n, siginfo_t *siginfo, void *ctx)
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100980{
Paolo Bonzinia16fc072017-02-09 09:50:02 +0100981 if (siginfo->si_code != BUS_MCEERR_AO && siginfo->si_code != BUS_MCEERR_AR) {
982 sigbus_reraise();
983 }
984
Paolo Bonzini2ae41db2017-02-08 12:48:54 +0100985 if (current_cpu) {
986 /* Called asynchronously in VCPU thread. */
987 if (kvm_on_sigbus_vcpu(current_cpu, siginfo->si_code, siginfo->si_addr)) {
988 sigbus_reraise();
989 }
990 } else {
991 /* Called synchronously (via signalfd) in main thread. */
992 if (kvm_on_sigbus(siginfo->si_code, siginfo->si_addr)) {
993 sigbus_reraise();
994 }
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100995 }
996}
997
998static void qemu_init_sigbus(void)
999{
1000 struct sigaction action;
1001
1002 memset(&action, 0, sizeof(action));
1003 action.sa_flags = SA_SIGINFO;
Paolo Bonzinid98d4072017-02-08 13:22:12 +01001004 action.sa_sigaction = sigbus_handler;
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001005 sigaction(SIGBUS, &action, NULL);
1006
1007 prctl(PR_MCE_KILL, PR_MCE_KILL_SET, PR_MCE_KILL_EARLY, 0, 0);
1008}
Paolo Bonzinia16fc072017-02-09 09:50:02 +01001009#else /* !CONFIG_LINUX */
/* Without CONFIG_LINUX no SIGBUS handling is set up. */
static void qemu_init_sigbus(void)
{
}
Paolo Bonzinia16fc072017-02-09 09:50:02 +01001013#endif /* !CONFIG_LINUX */
Blue Swirl296af7c2010-03-29 19:23:50 +00001014
/* Mutex paired with the condition variables waited on in this file. */
static QemuMutex qemu_global_mutex;

/* Thread that called qemu_init_cpu_loop(). */
static QemuThread io_thread;

/* cpu creation: signalled when a vCPU thread changes cpu->created */
static QemuCond qemu_cpu_cond;
/* system init; also broadcast when a vCPU enters the stopped state */
static QemuCond qemu_pause_cond;
1023
Paolo Bonzinid3b12f52011-09-13 10:30:52 +02001024void qemu_init_cpu_loop(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001025{
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001026 qemu_init_sigbus();
Anthony Liguoried945922011-02-08 18:18:18 +01001027 qemu_cond_init(&qemu_cpu_cond);
Anthony Liguoried945922011-02-08 18:18:18 +01001028 qemu_cond_init(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001029 qemu_mutex_init(&qemu_global_mutex);
Blue Swirl296af7c2010-03-29 19:23:50 +00001030
Jan Kiszkab7680cb2011-03-12 17:43:51 +01001031 qemu_thread_get_self(&io_thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001032}
1033
/*
 * Run @func with @data on @cpu.  Thin wrapper around do_run_on_cpu()
 * that supplies qemu_global_mutex as the mutex argument.
 */
void run_on_cpu(CPUState *cpu, run_on_cpu_func func, run_on_cpu_data data)
{
    do_run_on_cpu(cpu, func, data, &qemu_global_mutex);
}
1038
Gu Zheng4c055ab2016-05-12 09:18:13 +05301039static void qemu_kvm_destroy_vcpu(CPUState *cpu)
1040{
1041 if (kvm_destroy_vcpu(cpu) < 0) {
1042 error_report("kvm_destroy_vcpu failed");
1043 exit(EXIT_FAILURE);
1044 }
1045}
1046
/* TCG counterpart of qemu_kvm_destroy_vcpu(); currently does nothing. */
static void qemu_tcg_destroy_vcpu(CPUState *cpu)
{
}
1050
/*
 * Housekeeping shared by all vCPU thread loops after a wake-up:
 * clear the "kicked" flag, turn a pending stop request into the stopped
 * state (waking anyone waiting on qemu_pause_cond), and run the work
 * items queued for @cpu.
 */
static void qemu_wait_io_event_common(CPUState *cpu)
{
    atomic_mb_set(&cpu->thread_kicked, false);
    if (cpu->stop) {
        cpu->stop = false;
        cpu->stopped = true;
        qemu_cond_broadcast(&qemu_pause_cond);
    }
    process_queued_cpu_work(cpu);
}
1061
1062static bool qemu_tcg_should_sleep(CPUState *cpu)
1063{
1064 if (mttcg_enabled) {
1065 return cpu_thread_is_idle(cpu);
1066 } else {
1067 return all_cpu_threads_idle();
1068 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001069}
1070
/*
 * Sleep on @cpu's halt condition for as long as qemu_tcg_should_sleep()
 * says so, with the kick timer stopped while asleep.  On wake-up the
 * kick timer is started again and the common post-wake-up work is done.
 */
static void qemu_tcg_wait_io_event(CPUState *cpu)
{
    while (qemu_tcg_should_sleep(cpu)) {
        stop_tcg_kick_timer();
        qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
    }

    start_tcg_kick_timer();

    qemu_wait_io_event_common(cpu);
}
1082
/*
 * Sleep on @cpu's halt condition while the vCPU thread is idle, then do
 * the common post-wake-up work.
 */
static void qemu_kvm_wait_io_event(CPUState *cpu)
{
    while (cpu_thread_is_idle(cpu)) {
        qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
    }

    qemu_wait_io_event_common(cpu);
}
1091
Jan Kiszka7e97cd82011-02-07 12:19:12 +01001092static void *qemu_kvm_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001093{
Andreas Färber48a106b2013-05-27 02:20:39 +02001094 CPUState *cpu = arg;
Jan Kiszka84b49152011-02-01 22:15:50 +01001095 int r;
Blue Swirl296af7c2010-03-29 19:23:50 +00001096
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001097 rcu_register_thread();
1098
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001099 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001100 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001101 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001102 cpu->can_do_io = 1;
Andreas Färber4917cf42013-05-27 05:17:50 +02001103 current_cpu = cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001104
Andreas Färber504134d2012-12-17 06:38:45 +01001105 r = kvm_init_vcpu(cpu);
Jan Kiszka84b49152011-02-01 22:15:50 +01001106 if (r < 0) {
1107 fprintf(stderr, "kvm_init_vcpu failed: %s\n", strerror(-r));
1108 exit(1);
1109 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001110
Paolo Bonzini18268b62017-02-09 09:41:14 +01001111 kvm_init_cpu_signals(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001112
1113 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001114 cpu->created = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001115 qemu_cond_signal(&qemu_cpu_cond);
1116
Gu Zheng4c055ab2016-05-12 09:18:13 +05301117 do {
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001118 if (cpu_can_run(cpu)) {
Andreas Färber1458c362013-05-26 23:46:55 +02001119 r = kvm_cpu_exec(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001120 if (r == EXCP_DEBUG) {
Andreas Färber91325042013-05-27 02:07:49 +02001121 cpu_handle_guest_debug(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001122 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001123 }
Andreas Färberfd529e82013-05-26 23:24:55 +02001124 qemu_kvm_wait_io_event(cpu);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301125 } while (!cpu->unplug || cpu_can_run(cpu));
Blue Swirl296af7c2010-03-29 19:23:50 +00001126
Gu Zheng4c055ab2016-05-12 09:18:13 +05301127 qemu_kvm_destroy_vcpu(cpu);
Bharata B Rao2c579042016-05-12 09:18:14 +05301128 cpu->created = false;
1129 qemu_cond_signal(&qemu_cpu_cond);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301130 qemu_mutex_unlock_iothread();
Blue Swirl296af7c2010-03-29 19:23:50 +00001131 return NULL;
1132}
1133
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001134static void *qemu_dummy_cpu_thread_fn(void *arg)
1135{
1136#ifdef _WIN32
1137 fprintf(stderr, "qtest is not supported under Windows\n");
1138 exit(1);
1139#else
Andreas Färber10a90212013-05-27 02:24:35 +02001140 CPUState *cpu = arg;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001141 sigset_t waitset;
1142 int r;
1143
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001144 rcu_register_thread();
1145
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001146 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001147 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001148 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001149 cpu->can_do_io = 1;
Alex Bennée37257942017-02-23 18:29:14 +00001150 current_cpu = cpu;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001151
1152 sigemptyset(&waitset);
1153 sigaddset(&waitset, SIG_IPI);
1154
1155 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001156 cpu->created = true;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001157 qemu_cond_signal(&qemu_cpu_cond);
1158
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001159 while (1) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001160 qemu_mutex_unlock_iothread();
1161 do {
1162 int sig;
1163 r = sigwait(&waitset, &sig);
1164 } while (r == -1 && (errno == EAGAIN || errno == EINTR));
1165 if (r == -1) {
1166 perror("sigwait");
1167 exit(1);
1168 }
1169 qemu_mutex_lock_iothread();
Andreas Färber509a0d72012-05-03 02:18:09 +02001170 qemu_wait_io_event_common(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001171 }
1172
1173 return NULL;
1174#endif
1175}
1176
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001177static int64_t tcg_get_icount_limit(void)
1178{
1179 int64_t deadline;
1180
1181 if (replay_mode != REPLAY_MODE_PLAY) {
1182 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1183
1184 /* Maintain prior (possibly buggy) behaviour where if no deadline
1185 * was set (as there is no QEMU_CLOCK_VIRTUAL timer) or it is more than
1186 * INT32_MAX nanoseconds ahead, we still use INT32_MAX
1187 * nanoseconds.
1188 */
1189 if ((deadline < 0) || (deadline > INT32_MAX)) {
1190 deadline = INT32_MAX;
1191 }
1192
1193 return qemu_icount_round(deadline);
1194 } else {
1195 return replay_get_instructions();
1196 }
1197}
1198
Alex Bennée12e97002016-10-27 16:10:14 +01001199static void handle_icount_deadline(void)
1200{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001201 assert(qemu_in_vcpu_thread());
Alex Bennée12e97002016-10-27 16:10:14 +01001202 if (use_icount) {
1203 int64_t deadline =
1204 qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1205
1206 if (deadline == 0) {
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001207 /* Wake up other AioContexts. */
Alex Bennée12e97002016-10-27 16:10:14 +01001208 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001209 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Alex Bennée12e97002016-10-27 16:10:14 +01001210 }
1211 }
1212}
1213
Alex Bennée05248382017-03-29 16:46:59 +01001214static void prepare_icount_for_run(CPUState *cpu)
1215{
1216 if (use_icount) {
Alex Bennéeeda5f7c2017-04-05 12:35:48 +01001217 int insns_left;
Alex Bennée05248382017-03-29 16:46:59 +01001218
1219 /* These should always be cleared by process_icount_data after
1220 * each vCPU execution. However u16.high can be raised
1221 * asynchronously by cpu_exit/cpu_interrupt/tcg_handle_interrupt
1222 */
1223 g_assert(cpu->icount_decr.u16.low == 0);
1224 g_assert(cpu->icount_extra == 0);
1225
Alex Bennéeeda5f7c2017-04-05 12:35:48 +01001226 cpu->icount_budget = tcg_get_icount_limit();
1227 insns_left = MIN(0xffff, cpu->icount_budget);
1228 cpu->icount_decr.u16.low = insns_left;
1229 cpu->icount_extra = cpu->icount_budget - insns_left;
Alex Bennée05248382017-03-29 16:46:59 +01001230 }
1231}
1232
1233static void process_icount_data(CPUState *cpu)
1234{
1235 if (use_icount) {
Alex Bennéee4cd9652017-03-31 16:09:42 +01001236 /* Account for executed instructions */
Alex Bennée512d3c82017-04-05 12:32:37 +01001237 cpu_update_icount(cpu);
Alex Bennée05248382017-03-29 16:46:59 +01001238
1239 /* Reset the counters */
1240 cpu->icount_decr.u16.low = 0;
1241 cpu->icount_extra = 0;
Alex Bennéee4cd9652017-03-31 16:09:42 +01001242 cpu->icount_budget = 0;
1243
Alex Bennée05248382017-03-29 16:46:59 +01001244 replay_account_executed_instructions();
1245 }
1246}
1247
1248
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001249static int tcg_cpu_exec(CPUState *cpu)
1250{
1251 int ret;
1252#ifdef CONFIG_PROFILER
1253 int64_t ti;
1254#endif
1255
1256#ifdef CONFIG_PROFILER
1257 ti = profile_getclock();
1258#endif
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001259 qemu_mutex_unlock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001260 cpu_exec_start(cpu);
1261 ret = cpu_exec(cpu);
1262 cpu_exec_end(cpu);
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001263 qemu_mutex_lock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001264#ifdef CONFIG_PROFILER
1265 tcg_time += profile_getclock() - ti;
1266#endif
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001267 return ret;
1268}
1269
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001270/* Destroy any remaining vCPUs which have been unplugged and have
1271 * finished running
1272 */
1273static void deal_with_unplugged_cpus(void)
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001274{
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001275 CPUState *cpu;
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001276
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001277 CPU_FOREACH(cpu) {
1278 if (cpu->unplug && !cpu_can_run(cpu)) {
1279 qemu_tcg_destroy_vcpu(cpu);
1280 cpu->created = false;
1281 qemu_cond_signal(&qemu_cpu_cond);
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001282 break;
1283 }
1284 }
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001285}
Jan Kiszkabdb7ca62011-09-26 09:40:39 +02001286
Alex Bennée65467062017-02-23 18:29:09 +00001287/* Single-threaded TCG
1288 *
1289 * In the single-threaded case each vCPU is simulated in turn. If
1290 * there is more than a single vCPU we create a simple timer to kick
1291 * the vCPU and ensure we don't get stuck in a tight loop in one vCPU.
1292 * This is done explicitly rather than relying on side-effects
1293 * elsewhere.
1294 */
1295
/*
 * Thread function of the single TCG thread that runs all vCPUs in turn.
 *
 * @arg: the CPUState the thread was created for
 *
 * Marks every vCPU as created, waits until the first vCPU leaves the
 * stopped state, then loops forever: each outer iteration runs vCPUs one
 * after another until one of them has queued work or an exit request (or
 * a debug/atomic/stop condition breaks out), then waits for events and
 * reaps unplugged vCPUs.  Never returns in practice.
 */
static void *qemu_tcg_rr_cpu_thread_fn(void *arg)
{
    CPUState *cpu = arg;

    rcu_register_thread();

    qemu_mutex_lock_iothread();
    qemu_thread_get_self(cpu->thread);

    /* All vCPUs share this thread, so they all get its thread id. */
    CPU_FOREACH(cpu) {
        cpu->thread_id = qemu_get_thread_id();
        cpu->created = true;
        cpu->can_do_io = 1;
    }
    qemu_cond_signal(&qemu_cpu_cond);

    /* wait for initial kick-off after machine start */
    while (first_cpu->stopped) {
        qemu_cond_wait(first_cpu->halt_cond, &qemu_global_mutex);

        /* process any pending work */
        CPU_FOREACH(cpu) {
            current_cpu = cpu;
            qemu_wait_io_event_common(cpu);
        }
    }

    start_tcg_kick_timer();

    cpu = first_cpu;

    /* process any pending work */
    cpu->exit_request = 1;

    while (1) {
        /* Account partial waits to QEMU_CLOCK_VIRTUAL.  */
        qemu_account_warp_timer();

        /* Run the timers here.  This is much more efficient than
         * waking up the I/O thread and waiting for completion.
         */
        handle_icount_deadline();

        /* Wrap around once the end of the vCPU list has been reached. */
        if (!cpu) {
            cpu = first_cpu;
        }

        while (cpu && !cpu->queued_work_first && !cpu->exit_request) {

            /* Publish the running vCPU so the kick timer can find it. */
            atomic_mb_set(&tcg_current_rr_cpu, cpu);
            current_cpu = cpu;

            /* The virtual clock is disabled while SSTEP_NOTIMER is set. */
            qemu_clock_enable(QEMU_CLOCK_VIRTUAL,
                              (cpu->singlestep_enabled & SSTEP_NOTIMER) == 0);

            if (cpu_can_run(cpu)) {
                int r;

                prepare_icount_for_run(cpu);

                r = tcg_cpu_exec(cpu);

                process_icount_data(cpu);

                if (r == EXCP_DEBUG) {
                    cpu_handle_guest_debug(cpu);
                    break;
                } else if (r == EXCP_ATOMIC) {
                    /* The atomic step runs without the iothread lock. */
                    qemu_mutex_unlock_iothread();
                    cpu_exec_step_atomic(cpu);
                    qemu_mutex_lock_iothread();
                    break;
                }
            } else if (cpu->stop) {
                /* Move past an unplugged vCPU before leaving the loop. */
                if (cpu->unplug) {
                    cpu = CPU_NEXT(cpu);
                }
                break;
            }

            cpu = CPU_NEXT(cpu);
        } /* while (cpu && !cpu->exit_request).. */

        /* Does not need atomic_mb_set because a spurious wakeup is okay.  */
        atomic_set(&tcg_current_rr_cpu, NULL);

        if (cpu && cpu->exit_request) {
            atomic_mb_set(&cpu->exit_request, 0);
        }

        /* With no current vCPU, wait on the first one in the list. */
        qemu_tcg_wait_io_event(cpu ? cpu : QTAILQ_FIRST(&cpus));
        deal_with_unplugged_cpus();
    }

    return NULL;
}
1392
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001393static void *qemu_hax_cpu_thread_fn(void *arg)
1394{
1395 CPUState *cpu = arg;
1396 int r;
Vincent Palatinb3d3a422017-03-20 11:15:49 +01001397
1398 qemu_mutex_lock_iothread();
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001399 qemu_thread_get_self(cpu->thread);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001400
1401 cpu->thread_id = qemu_get_thread_id();
1402 cpu->created = true;
1403 cpu->halted = 0;
1404 current_cpu = cpu;
1405
1406 hax_init_vcpu(cpu);
1407 qemu_cond_signal(&qemu_cpu_cond);
1408
1409 while (1) {
1410 if (cpu_can_run(cpu)) {
1411 r = hax_smp_cpu_exec(cpu);
1412 if (r == EXCP_DEBUG) {
1413 cpu_handle_guest_debug(cpu);
1414 }
1415 }
1416
1417 while (cpu_thread_is_idle(cpu)) {
1418 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
1419 }
1420#ifdef _WIN32
1421 SleepEx(0, TRUE);
1422#endif
1423 qemu_wait_io_event_common(cpu);
1424 }
1425 return NULL;
1426}
1427
1428#ifdef _WIN32
/* APC routine that intentionally does nothing. */
static void CALLBACK dummy_apc_func(ULONG_PTR unused)
{
}
1432#endif
1433
Alex Bennée37257942017-02-23 18:29:14 +00001434/* Multi-threaded TCG
1435 *
1436 * In the multi-threaded case each vCPU has its own thread. The TLS
1437 * variable current_cpu can be used deep in the code to find the
1438 * current CPUState for a given thread.
1439 */
1440
1441static void *qemu_tcg_cpu_thread_fn(void *arg)
1442{
1443 CPUState *cpu = arg;
1444
Alex Bennéebf51c722017-03-30 18:32:29 +01001445 g_assert(!use_icount);
1446
Alex Bennée37257942017-02-23 18:29:14 +00001447 rcu_register_thread();
1448
1449 qemu_mutex_lock_iothread();
1450 qemu_thread_get_self(cpu->thread);
1451
1452 cpu->thread_id = qemu_get_thread_id();
1453 cpu->created = true;
1454 cpu->can_do_io = 1;
1455 current_cpu = cpu;
1456 qemu_cond_signal(&qemu_cpu_cond);
1457
1458 /* process any pending work */
1459 cpu->exit_request = 1;
1460
1461 while (1) {
1462 if (cpu_can_run(cpu)) {
1463 int r;
1464 r = tcg_cpu_exec(cpu);
1465 switch (r) {
1466 case EXCP_DEBUG:
1467 cpu_handle_guest_debug(cpu);
1468 break;
1469 case EXCP_HALTED:
1470 /* during start-up the vCPU is reset and the thread is
1471 * kicked several times. If we don't ensure we go back
1472 * to sleep in the halted state we won't cleanly
1473 * start-up when the vCPU is enabled.
1474 *
1475 * cpu->halted should ensure we sleep in wait_io_event
1476 */
1477 g_assert(cpu->halted);
1478 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001479 case EXCP_ATOMIC:
1480 qemu_mutex_unlock_iothread();
1481 cpu_exec_step_atomic(cpu);
1482 qemu_mutex_lock_iothread();
Alex Bennée37257942017-02-23 18:29:14 +00001483 default:
1484 /* Ignore everything else? */
1485 break;
1486 }
1487 }
1488
Alex Bennée37257942017-02-23 18:29:14 +00001489 atomic_mb_set(&cpu->exit_request, 0);
1490 qemu_tcg_wait_io_event(cpu);
1491 }
1492
1493 return NULL;
1494}
1495
Andreas Färber2ff09a42012-05-03 00:23:30 +02001496static void qemu_cpu_kick_thread(CPUState *cpu)
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001497{
1498#ifndef _WIN32
1499 int err;
1500
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001501 if (cpu->thread_kicked) {
1502 return;
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001503 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001504 cpu->thread_kicked = true;
Andreas Färber814e6122012-05-02 17:00:37 +02001505 err = pthread_kill(cpu->thread->thread, SIG_IPI);
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001506 if (err) {
1507 fprintf(stderr, "qemu:%s: %s", __func__, strerror(err));
1508 exit(1);
1509 }
1510#else /* _WIN32 */
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001511 if (!qemu_cpu_is_self(cpu)) {
1512 if (!QueueUserAPC(dummy_apc_func, cpu->hThread, 0)) {
1513 fprintf(stderr, "%s: QueueUserAPC failed with error %lu\n",
1514 __func__, GetLastError());
1515 exit(1);
1516 }
1517 }
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001518#endif
1519}
1520
Andreas Färberc08d7422012-05-03 04:34:15 +02001521void qemu_cpu_kick(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001522{
Andreas Färberf5c121b2012-05-03 01:22:49 +02001523 qemu_cond_broadcast(cpu->halt_cond);
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001524 if (tcg_enabled()) {
Alex Bennée791158d2017-02-23 18:29:10 +00001525 cpu_exit(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001526 /* NOP unless doing single-thread RR */
Alex Bennée791158d2017-02-23 18:29:10 +00001527 qemu_cpu_kick_rr_cpu();
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001528 } else {
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001529 if (hax_enabled()) {
1530 /*
1531 * FIXME: race condition with the exit_request check in
1532 * hax_vcpu_hax_exec
1533 */
1534 cpu->exit_request = 1;
1535 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001536 qemu_cpu_kick_thread(cpu);
1537 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001538}
1539
Jan Kiszka46d62fa2011-02-01 22:15:59 +01001540void qemu_cpu_kick_self(void)
1541{
Andreas Färber4917cf42013-05-27 05:17:50 +02001542 assert(current_cpu);
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001543 qemu_cpu_kick_thread(current_cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001544}
1545
Andreas Färber60e82572012-05-02 22:23:49 +02001546bool qemu_cpu_is_self(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001547{
Andreas Färber814e6122012-05-02 17:00:37 +02001548 return qemu_thread_is_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001549}
1550
Paolo Bonzini79e2b9a2015-01-21 12:09:14 +01001551bool qemu_in_vcpu_thread(void)
Juan Quintelaaa723c22012-09-18 16:30:11 +02001552{
Andreas Färber4917cf42013-05-27 05:17:50 +02001553 return current_cpu && qemu_cpu_is_self(current_cpu);
Juan Quintelaaa723c22012-09-18 16:30:11 +02001554}
1555
/* Per-thread flag: does the current thread hold the iothread lock?
 * Static storage, so it starts out false in every thread.
 */
static __thread bool iothread_locked;

/* Report whether the calling thread currently holds the iothread lock. */
bool qemu_mutex_iothread_locked(void)
{
    return iothread_locked;
}
1562
Blue Swirl296af7c2010-03-29 19:23:50 +00001563void qemu_mutex_lock_iothread(void)
1564{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001565 g_assert(!qemu_mutex_iothread_locked());
1566 qemu_mutex_lock(&qemu_global_mutex);
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001567 iothread_locked = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001568}
1569
1570void qemu_mutex_unlock_iothread(void)
1571{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001572 g_assert(qemu_mutex_iothread_locked());
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001573 iothread_locked = false;
Blue Swirl296af7c2010-03-29 19:23:50 +00001574 qemu_mutex_unlock(&qemu_global_mutex);
1575}
1576
Alex Bennéee8faee02016-10-27 16:09:58 +01001577static bool all_vcpus_paused(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001578{
Andreas Färberbdc44642013-06-24 23:50:24 +02001579 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001580
Andreas Färberbdc44642013-06-24 23:50:24 +02001581 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001582 if (!cpu->stopped) {
Alex Bennéee8faee02016-10-27 16:09:58 +01001583 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001584 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001585 }
1586
Alex Bennéee8faee02016-10-27 16:09:58 +01001587 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001588}
1589
1590void pause_all_vcpus(void)
1591{
Andreas Färberbdc44642013-06-24 23:50:24 +02001592 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001593
Alex Bligh40daca52013-08-21 16:03:02 +01001594 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, false);
Andreas Färberbdc44642013-06-24 23:50:24 +02001595 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001596 cpu->stop = true;
1597 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001598 }
1599
Juan Quintelaaa723c22012-09-18 16:30:11 +02001600 if (qemu_in_vcpu_thread()) {
Jan Kiszkad798e972012-02-17 18:31:16 +01001601 cpu_stop_current();
Jan Kiszkad798e972012-02-17 18:31:16 +01001602 }
1603
Blue Swirl296af7c2010-03-29 19:23:50 +00001604 while (!all_vcpus_paused()) {
Paolo Bonzinibe7d6c52011-03-12 17:44:02 +01001605 qemu_cond_wait(&qemu_pause_cond, &qemu_global_mutex);
Andreas Färberbdc44642013-06-24 23:50:24 +02001606 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001607 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001608 }
1609 }
1610}
1611
Igor Mammedov29936832013-04-23 10:29:37 +02001612void cpu_resume(CPUState *cpu)
1613{
1614 cpu->stop = false;
1615 cpu->stopped = false;
1616 qemu_cpu_kick(cpu);
1617}
1618
Blue Swirl296af7c2010-03-29 19:23:50 +00001619void resume_all_vcpus(void)
1620{
Andreas Färberbdc44642013-06-24 23:50:24 +02001621 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001622
Alex Bligh40daca52013-08-21 16:03:02 +01001623 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, true);
Andreas Färberbdc44642013-06-24 23:50:24 +02001624 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001625 cpu_resume(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001626 }
1627}
1628
Gu Zheng4c055ab2016-05-12 09:18:13 +05301629void cpu_remove(CPUState *cpu)
1630{
1631 cpu->stop = true;
1632 cpu->unplug = true;
1633 qemu_cpu_kick(cpu);
1634}
1635
Bharata B Rao2c579042016-05-12 09:18:14 +05301636void cpu_remove_sync(CPUState *cpu)
1637{
1638 cpu_remove(cpu);
1639 while (cpu->created) {
1640 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1641 }
1642}
1643
/* Size in bytes of the temporary buffers in which thread names are formatted */
#define VCPU_THREAD_NAME_SIZE 16
1646
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001647static void qemu_tcg_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001648{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001649 char thread_name[VCPU_THREAD_NAME_SIZE];
Alex Bennée37257942017-02-23 18:29:14 +00001650 static QemuCond *single_tcg_halt_cond;
1651 static QemuThread *single_tcg_cpu_thread;
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001652
Alex Bennée37257942017-02-23 18:29:14 +00001653 if (qemu_tcg_mttcg_enabled() || !single_tcg_cpu_thread) {
Andreas Färber814e6122012-05-02 17:00:37 +02001654 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001655 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1656 qemu_cond_init(cpu->halt_cond);
Alex Bennée37257942017-02-23 18:29:14 +00001657
1658 if (qemu_tcg_mttcg_enabled()) {
1659 /* create a thread per vCPU with TCG (MTTCG) */
1660 parallel_cpus = true;
1661 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/TCG",
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001662 cpu->cpu_index);
Alex Bennée37257942017-02-23 18:29:14 +00001663
1664 qemu_thread_create(cpu->thread, thread_name, qemu_tcg_cpu_thread_fn,
1665 cpu, QEMU_THREAD_JOINABLE);
1666
1667 } else {
1668 /* share a single thread for all cpus with TCG */
1669 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "ALL CPUs/TCG");
1670 qemu_thread_create(cpu->thread, thread_name,
1671 qemu_tcg_rr_cpu_thread_fn,
1672 cpu, QEMU_THREAD_JOINABLE);
1673
1674 single_tcg_halt_cond = cpu->halt_cond;
1675 single_tcg_cpu_thread = cpu->thread;
1676 }
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001677#ifdef _WIN32
Andreas Färber814e6122012-05-02 17:00:37 +02001678 cpu->hThread = qemu_thread_get_handle(cpu->thread);
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001679#endif
Andreas Färber61a46212012-05-02 22:49:36 +02001680 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001681 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001682 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001683 } else {
Alex Bennée37257942017-02-23 18:29:14 +00001684 /* For non-MTTCG cases we share the thread */
1685 cpu->thread = single_tcg_cpu_thread;
1686 cpu->halt_cond = single_tcg_halt_cond;
Blue Swirl296af7c2010-03-29 19:23:50 +00001687 }
1688}
1689
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001690static void qemu_hax_start_vcpu(CPUState *cpu)
1691{
1692 char thread_name[VCPU_THREAD_NAME_SIZE];
1693
1694 cpu->thread = g_malloc0(sizeof(QemuThread));
1695 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1696 qemu_cond_init(cpu->halt_cond);
1697
1698 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/HAX",
1699 cpu->cpu_index);
1700 qemu_thread_create(cpu->thread, thread_name, qemu_hax_cpu_thread_fn,
1701 cpu, QEMU_THREAD_JOINABLE);
1702#ifdef _WIN32
1703 cpu->hThread = qemu_thread_get_handle(cpu->thread);
1704#endif
1705 while (!cpu->created) {
1706 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1707 }
1708}
1709
Andreas Färber48a106b2013-05-27 02:20:39 +02001710static void qemu_kvm_start_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001711{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001712 char thread_name[VCPU_THREAD_NAME_SIZE];
1713
Andreas Färber814e6122012-05-02 17:00:37 +02001714 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001715 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1716 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001717 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/KVM",
1718 cpu->cpu_index);
1719 qemu_thread_create(cpu->thread, thread_name, qemu_kvm_cpu_thread_fn,
1720 cpu, QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001721 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001722 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001723 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001724}
1725
Andreas Färber10a90212013-05-27 02:24:35 +02001726static void qemu_dummy_start_vcpu(CPUState *cpu)
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001727{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001728 char thread_name[VCPU_THREAD_NAME_SIZE];
1729
Andreas Färber814e6122012-05-02 17:00:37 +02001730 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001731 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1732 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001733 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/DUMMY",
1734 cpu->cpu_index);
1735 qemu_thread_create(cpu->thread, thread_name, qemu_dummy_cpu_thread_fn, cpu,
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001736 QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001737 while (!cpu->created) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001738 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1739 }
1740}
1741
Andreas Färberc643bed2013-05-27 03:23:24 +02001742void qemu_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001743{
Andreas Färberce3960e2012-12-17 03:27:07 +01001744 cpu->nr_cores = smp_cores;
1745 cpu->nr_threads = smp_threads;
Andreas Färberf324e762012-05-02 23:26:21 +02001746 cpu->stopped = true;
Peter Maydell56943e82016-01-21 14:15:04 +00001747
1748 if (!cpu->as) {
1749 /* If the target cpu hasn't set up any address spaces itself,
1750 * give it the default one.
1751 */
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001752 AddressSpace *as = address_space_init_shareable(cpu->memory,
1753 "cpu-memory");
Peter Maydell12ebc9a2016-01-21 14:15:04 +00001754 cpu->num_ases = 1;
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001755 cpu_address_space_init(cpu, as, 0);
Peter Maydell56943e82016-01-21 14:15:04 +00001756 }
1757
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001758 if (kvm_enabled()) {
Andreas Färber48a106b2013-05-27 02:20:39 +02001759 qemu_kvm_start_vcpu(cpu);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001760 } else if (hax_enabled()) {
1761 qemu_hax_start_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001762 } else if (tcg_enabled()) {
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001763 qemu_tcg_init_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001764 } else {
Andreas Färber10a90212013-05-27 02:24:35 +02001765 qemu_dummy_start_vcpu(cpu);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001766 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001767}
1768
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001769void cpu_stop_current(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001770{
Andreas Färber4917cf42013-05-27 05:17:50 +02001771 if (current_cpu) {
1772 current_cpu->stop = false;
1773 current_cpu->stopped = true;
1774 cpu_exit(current_cpu);
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001775 qemu_cond_broadcast(&qemu_pause_cond);
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001776 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001777}
1778
Kevin Wolf56983462013-07-05 13:49:54 +02001779int vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +00001780{
Juan Quintelaaa723c22012-09-18 16:30:11 +02001781 if (qemu_in_vcpu_thread()) {
Paolo Bonzini74892d22014-06-05 14:53:58 +02001782 qemu_system_vmstop_request_prepare();
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -03001783 qemu_system_vmstop_request(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001784 /*
1785 * FIXME: should not return to device code in case
1786 * vm_stop() has been requested.
1787 */
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001788 cpu_stop_current();
Kevin Wolf56983462013-07-05 13:49:54 +02001789 return 0;
Blue Swirl296af7c2010-03-29 19:23:50 +00001790 }
Kevin Wolf56983462013-07-05 13:49:54 +02001791
1792 return do_vm_stop(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001793}
1794
Claudio Imbrenda2d76e822017-02-14 18:07:47 +01001795/**
1796 * Prepare for (re)starting the VM.
1797 * Returns -1 if the vCPUs are not to be restarted (e.g. if they are already
1798 * running or in case of an error condition), 0 otherwise.
1799 */
1800int vm_prepare_start(void)
1801{
1802 RunState requested;
1803 int res = 0;
1804
1805 qemu_vmstop_requested(&requested);
1806 if (runstate_is_running() && requested == RUN_STATE__MAX) {
1807 return -1;
1808 }
1809
1810 /* Ensure that a STOP/RESUME pair of events is emitted if a
1811 * vmstop request was pending. The BLOCK_IO_ERROR event, for
1812 * example, according to documentation is always followed by
1813 * the STOP event.
1814 */
1815 if (runstate_is_running()) {
1816 qapi_event_send_stop(&error_abort);
1817 res = -1;
1818 } else {
1819 replay_enable_events();
1820 cpu_enable_ticks();
1821 runstate_set(RUN_STATE_RUNNING);
1822 vm_state_notify(1, RUN_STATE_RUNNING);
1823 }
1824
1825 /* We are sending this now, but the CPUs will be resumed shortly later */
1826 qapi_event_send_resume(&error_abort);
1827 return res;
1828}
1829
/* Start the VM: resume all vCPUs when vm_prepare_start() returns 0. */
void vm_start(void)
{
    if (vm_prepare_start() == 0) {
        resume_all_vcpus();
    }
}
1836
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001837/* does a state transition even if the VM is already stopped,
1838 current state is forgotten forever */
Kevin Wolf56983462013-07-05 13:49:54 +02001839int vm_stop_force_state(RunState state)
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001840{
1841 if (runstate_is_running()) {
Kevin Wolf56983462013-07-05 13:49:54 +02001842 return vm_stop(state);
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001843 } else {
1844 runstate_set(state);
Wen Congyangb2780d32015-11-20 17:34:38 +08001845
1846 bdrv_drain_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +02001847 /* Make sure to return an error if the flush in a previous vm_stop()
1848 * failed. */
John Snow22af08e2016-09-22 21:45:51 -04001849 return bdrv_flush_all();
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001850 }
1851}
1852
Stefan Weil9a78eea2010-10-22 23:03:33 +02001853void list_cpus(FILE *f, fprintf_function cpu_fprintf, const char *optarg)
Blue Swirl262353c2010-05-04 19:55:35 +00001854{
1855 /* XXX: implement xxx_cpu_list for targets that still miss it */
Peter Maydelle916cbf2012-09-05 17:41:08 -03001856#if defined(cpu_list)
1857 cpu_list(f, cpu_fprintf);
Blue Swirl262353c2010-05-04 19:55:35 +00001858#endif
1859}
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001860
1861CpuInfoList *qmp_query_cpus(Error **errp)
1862{
Igor Mammedovafed5a52017-05-10 13:29:55 +02001863 MachineState *ms = MACHINE(qdev_get_machine());
1864 MachineClass *mc = MACHINE_GET_CLASS(ms);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001865 CpuInfoList *head = NULL, *cur_item = NULL;
Andreas Färber182735e2013-05-29 22:29:20 +02001866 CPUState *cpu;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001867
Andreas Färberbdc44642013-06-24 23:50:24 +02001868 CPU_FOREACH(cpu) {
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001869 CpuInfoList *info;
Andreas Färber182735e2013-05-29 22:29:20 +02001870#if defined(TARGET_I386)
1871 X86CPU *x86_cpu = X86_CPU(cpu);
1872 CPUX86State *env = &x86_cpu->env;
1873#elif defined(TARGET_PPC)
1874 PowerPCCPU *ppc_cpu = POWERPC_CPU(cpu);
1875 CPUPPCState *env = &ppc_cpu->env;
1876#elif defined(TARGET_SPARC)
1877 SPARCCPU *sparc_cpu = SPARC_CPU(cpu);
1878 CPUSPARCState *env = &sparc_cpu->env;
1879#elif defined(TARGET_MIPS)
1880 MIPSCPU *mips_cpu = MIPS_CPU(cpu);
1881 CPUMIPSState *env = &mips_cpu->env;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001882#elif defined(TARGET_TRICORE)
1883 TriCoreCPU *tricore_cpu = TRICORE_CPU(cpu);
1884 CPUTriCoreState *env = &tricore_cpu->env;
Andreas Färber182735e2013-05-29 22:29:20 +02001885#endif
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001886
Andreas Färbercb446ec2013-05-01 14:24:52 +02001887 cpu_synchronize_state(cpu);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001888
1889 info = g_malloc0(sizeof(*info));
1890 info->value = g_malloc0(sizeof(*info->value));
Andreas Färber55e5c282012-12-17 06:18:02 +01001891 info->value->CPU = cpu->cpu_index;
Andreas Färber182735e2013-05-29 22:29:20 +02001892 info->value->current = (cpu == first_cpu);
Andreas Färber259186a2013-01-17 18:51:17 +01001893 info->value->halted = cpu->halted;
Eduardo Habkost58f88d42015-05-08 16:04:22 -03001894 info->value->qom_path = object_get_canonical_path(OBJECT(cpu));
Andreas Färber9f09e182012-05-03 06:59:07 +02001895 info->value->thread_id = cpu->thread_id;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001896#if defined(TARGET_I386)
Eric Blake86f4b682015-11-18 01:52:59 -07001897 info->value->arch = CPU_INFO_ARCH_X86;
Eric Blake544a3732016-02-17 23:48:27 -07001898 info->value->u.x86.pc = env->eip + env->segs[R_CS].base;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001899#elif defined(TARGET_PPC)
Eric Blake86f4b682015-11-18 01:52:59 -07001900 info->value->arch = CPU_INFO_ARCH_PPC;
Eric Blake544a3732016-02-17 23:48:27 -07001901 info->value->u.ppc.nip = env->nip;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001902#elif defined(TARGET_SPARC)
Eric Blake86f4b682015-11-18 01:52:59 -07001903 info->value->arch = CPU_INFO_ARCH_SPARC;
Eric Blake544a3732016-02-17 23:48:27 -07001904 info->value->u.q_sparc.pc = env->pc;
1905 info->value->u.q_sparc.npc = env->npc;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001906#elif defined(TARGET_MIPS)
Eric Blake86f4b682015-11-18 01:52:59 -07001907 info->value->arch = CPU_INFO_ARCH_MIPS;
Eric Blake544a3732016-02-17 23:48:27 -07001908 info->value->u.q_mips.PC = env->active_tc.PC;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001909#elif defined(TARGET_TRICORE)
Eric Blake86f4b682015-11-18 01:52:59 -07001910 info->value->arch = CPU_INFO_ARCH_TRICORE;
Eric Blake544a3732016-02-17 23:48:27 -07001911 info->value->u.tricore.PC = env->PC;
Eric Blake86f4b682015-11-18 01:52:59 -07001912#else
1913 info->value->arch = CPU_INFO_ARCH_OTHER;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001914#endif
Igor Mammedovafed5a52017-05-10 13:29:55 +02001915 info->value->has_props = !!mc->cpu_index_to_instance_props;
1916 if (info->value->has_props) {
1917 CpuInstanceProperties *props;
1918 props = g_malloc0(sizeof(*props));
1919 *props = mc->cpu_index_to_instance_props(ms, cpu->cpu_index);
1920 info->value->props = props;
1921 }
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001922
1923 /* XXX: waiting for the qapi to support GSList */
1924 if (!cur_item) {
1925 head = cur_item = info;
1926 } else {
1927 cur_item->next = info;
1928 cur_item = info;
1929 }
1930 }
1931
1932 return head;
1933}
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001934
1935void qmp_memsave(int64_t addr, int64_t size, const char *filename,
1936 bool has_cpu, int64_t cpu_index, Error **errp)
1937{
1938 FILE *f;
1939 uint32_t l;
Andreas Färber55e5c282012-12-17 06:18:02 +01001940 CPUState *cpu;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001941 uint8_t buf[1024];
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001942 int64_t orig_addr = addr, orig_size = size;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001943
1944 if (!has_cpu) {
1945 cpu_index = 0;
1946 }
1947
Andreas Färber151d1322013-02-15 15:41:49 +01001948 cpu = qemu_get_cpu(cpu_index);
1949 if (cpu == NULL) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001950 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "cpu-index",
1951 "a CPU number");
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001952 return;
1953 }
1954
1955 f = fopen(filename, "wb");
1956 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001957 error_setg_file_open(errp, errno, filename);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001958 return;
1959 }
1960
1961 while (size != 0) {
1962 l = sizeof(buf);
1963 if (l > size)
1964 l = size;
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301965 if (cpu_memory_rw_debug(cpu, addr, buf, l, 0) != 0) {
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001966 error_setg(errp, "Invalid addr 0x%016" PRIx64 "/size %" PRId64
1967 " specified", orig_addr, orig_size);
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301968 goto exit;
1969 }
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001970 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001971 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001972 goto exit;
1973 }
1974 addr += l;
1975 size -= l;
1976 }
1977
1978exit:
1979 fclose(f);
1980}
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001981
1982void qmp_pmemsave(int64_t addr, int64_t size, const char *filename,
1983 Error **errp)
1984{
1985 FILE *f;
1986 uint32_t l;
1987 uint8_t buf[1024];
1988
1989 f = fopen(filename, "wb");
1990 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001991 error_setg_file_open(errp, errno, filename);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001992 return;
1993 }
1994
1995 while (size != 0) {
1996 l = sizeof(buf);
1997 if (l > size)
1998 l = size;
Stefan Weileb6282f2014-04-07 20:28:23 +02001999 cpu_physical_memory_read(addr, buf, l);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02002000 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01002001 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02002002 goto exit;
2003 }
2004 addr += l;
2005 size -= l;
2006 }
2007
2008exit:
2009 fclose(f);
2010}
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02002011
2012void qmp_inject_nmi(Error **errp)
2013{
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +10002014 nmi_monitor_handle(monitor_get_cpu_index(), errp);
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02002015}
Sebastian Tanase27498be2014-07-25 11:56:33 +02002016
2017void dump_drift_info(FILE *f, fprintf_function cpu_fprintf)
2018{
2019 if (!use_icount) {
2020 return;
2021 }
2022
2023 cpu_fprintf(f, "Host - Guest clock %"PRIi64" ms\n",
2024 (cpu_get_clock() - cpu_get_icount())/SCALE_MS);
2025 if (icount_align_option) {
2026 cpu_fprintf(f, "Max guest delay %"PRIi64" ms\n", -max_delay/SCALE_MS);
2027 cpu_fprintf(f, "Max guest advance %"PRIi64" ms\n", max_advance/SCALE_MS);
2028 } else {
2029 cpu_fprintf(f, "Max guest delay NA\n");
2030 cpu_fprintf(f, "Max guest advance NA\n");
2031 }
2032}