blob: a5125d7167881ae84bae518ee68475de6e7ec344 [file] [log] [blame]
Blue Swirl296af7c2010-03-29 19:23:50 +00001/*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24
25/* Needed early for CONFIG_BSD etc. */
Peter Maydell7b31bbc2016-01-26 18:16:56 +000026#include "qemu/osdep.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010027#include "qemu-common.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000028#include "qemu/config-file.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010029#include "cpu.h"
Paolo Bonzini83c90892012-12-17 18:19:49 +010030#include "monitor/monitor.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020031#include "qapi/qmp/qerror.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010032#include "qemu/error-report.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010033#include "sysemu/sysemu.h"
Max Reitzda31d592016-03-16 19:54:32 +010034#include "sysemu/block-backend.h"
Paolo Bonzini022c62c2012-12-17 18:19:49 +010035#include "exec/gdbstub.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010036#include "sysemu/dma.h"
Vincent Palatinb3946622017-01-10 11:59:55 +010037#include "sysemu/hw_accel.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010038#include "sysemu/kvm.h"
Vincent Palatinb0cb0a62017-01-10 11:59:57 +010039#include "sysemu/hax.h"
Luiz Capitulinode0b36b2011-09-21 16:38:35 -030040#include "qmp-commands.h"
Paolo Bonzini63c91552016-03-15 13:18:37 +010041#include "exec/exec-all.h"
Blue Swirl296af7c2010-03-29 19:23:50 +000042
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010043#include "qemu/thread.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010044#include "sysemu/cpus.h"
45#include "sysemu/qtest.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010046#include "qemu/main-loop.h"
47#include "qemu/bitmap.h"
Liu Ping Fancb365642013-09-25 14:20:58 +080048#include "qemu/seqlock.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000049#include "tcg.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020050#include "qapi-event.h"
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +100051#include "hw/nmi.h"
Pavel Dovgalyuk8b427042015-09-17 19:24:05 +030052#include "sysemu/replay.h"
Jan Kiszka0ff0fc12011-06-23 10:15:55 +020053
#ifdef CONFIG_LINUX

#include <sys/prctl.h>

/*
 * Fallback values for the PR_MCE_KILL* prctl() constants; each one is
 * only defined here when <sys/prctl.h> did not already provide it.
 */
#ifndef PR_MCE_KILL
#define PR_MCE_KILL 33
#endif

#ifndef PR_MCE_KILL_SET
#define PR_MCE_KILL_SET 1
#endif

#ifndef PR_MCE_KILL_EARLY
#define PR_MCE_KILL_EARLY 1
#endif

#endif /* CONFIG_LINUX */
71
Sebastian Tanase27498be2014-07-25 11:56:33 +020072int64_t max_delay;
73int64_t max_advance;
Blue Swirl296af7c2010-03-29 19:23:50 +000074
Jason J. Herne2adcc852015-09-08 13:12:33 -040075/* vcpu throttling controls */
76static QEMUTimer *throttle_timer;
77static unsigned int throttle_percentage;
78
79#define CPU_THROTTLE_PCT_MIN 1
80#define CPU_THROTTLE_PCT_MAX 99
81#define CPU_THROTTLE_TIMESLICE_NS 10000000
82
Tiejun Chen321bc0b2013-08-02 09:43:09 +080083bool cpu_is_stopped(CPUState *cpu)
84{
85 return cpu->stopped || !runstate_is_running();
86}
87
Andreas Färbera98ae1d2013-05-26 23:21:08 +020088static bool cpu_thread_is_idle(CPUState *cpu)
Peter Maydellac873f12012-07-19 16:52:27 +010089{
Andreas Färberc64ca812012-05-03 02:11:45 +020090 if (cpu->stop || cpu->queued_work_first) {
Peter Maydellac873f12012-07-19 16:52:27 +010091 return false;
92 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +080093 if (cpu_is_stopped(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +010094 return true;
95 }
Andreas Färber8c2e1b02013-08-25 18:53:55 +020096 if (!cpu->halted || cpu_has_work(cpu) ||
Alexander Graf215e79c2013-04-24 22:24:12 +020097 kvm_halt_in_kernel()) {
Peter Maydellac873f12012-07-19 16:52:27 +010098 return false;
99 }
100 return true;
101}
102
103static bool all_cpu_threads_idle(void)
104{
Andreas Färber182735e2013-05-29 22:29:20 +0200105 CPUState *cpu;
Peter Maydellac873f12012-07-19 16:52:27 +0100106
Andreas Färberbdc44642013-06-24 23:50:24 +0200107 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200108 if (!cpu_thread_is_idle(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +0100109 return false;
110 }
111 }
112 return true;
113}
114
Blue Swirl296af7c2010-03-29 19:23:50 +0000115/***********************************************************/
Paolo Bonzini946fb272011-09-12 13:57:37 +0200116/* guest cycle counter */
117
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200118/* Protected by TimersState seqlock */
119
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200120static bool icount_sleep = true;
Sebastian Tanase71468392014-07-23 11:47:50 +0200121static int64_t vm_clock_warp_start = -1;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200122/* Conversion factor from emulated instructions to virtual clock ticks. */
123static int icount_time_shift;
124/* Arbitrarily pick 1MIPS as the minimum allowable speed. */
125#define MAX_ICOUNT_SHIFT 10
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200126
Paolo Bonzini946fb272011-09-12 13:57:37 +0200127static QEMUTimer *icount_rt_timer;
128static QEMUTimer *icount_vm_timer;
129static QEMUTimer *icount_warp_timer;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200130
131typedef struct TimersState {
Liu Ping Fancb365642013-09-25 14:20:58 +0800132 /* Protected by BQL. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200133 int64_t cpu_ticks_prev;
134 int64_t cpu_ticks_offset;
Liu Ping Fancb365642013-09-25 14:20:58 +0800135
136 /* cpu_clock_offset can be read out of BQL, so protect it with
137 * this lock.
138 */
139 QemuSeqLock vm_clock_seqlock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200140 int64_t cpu_clock_offset;
141 int32_t cpu_ticks_enabled;
142 int64_t dummy;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200143
144 /* Compensate for varying guest execution speed. */
145 int64_t qemu_icount_bias;
146 /* Only written by TCG thread */
147 int64_t qemu_icount;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200148} TimersState;
149
Liu Ping Fand9cd4002013-07-21 08:43:00 +0000150static TimersState timers_state;
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000151bool mttcg_enabled;
152
/*
 * We default to false if we know other options have been enabled
 * which are currently incompatible with MTTCG. Otherwise when each
 * guest (target) has been updated to support:
 *   - atomic instructions
 *   - memory ordering primitives (barriers)
 * they can set the appropriate CONFIG flags in ${target}-softmmu.mak
 *
 * Once a guest architecture has been converted to the new primitives
 * there are two remaining limitations to check.
 *
 * - The guest can't be oversized (e.g. 64 bit guest on 32 bit host)
 * - The host must have a stronger memory order than the guest
 *
 * It may be possible in future to support strong guests on weak hosts
 * but that will require tagging all load/stores in a guest with their
 * implicit memory order requirements which would likely slow things
 * down a lot.
 */

/*
 * Return true when every ordering bit in TCG_GUEST_DEFAULT_MO is also
 * set in TCG_TARGET_DEFAULT_MO. If either macro is not defined the
 * answer is false.
 */
static bool check_tcg_memory_orders_compatible(void)
{
#if defined(TCG_GUEST_DEFAULT_MO) && defined(TCG_TARGET_DEFAULT_MO)
    return !(TCG_GUEST_DEFAULT_MO & ~TCG_TARGET_DEFAULT_MO);
#else
    return false;
#endif
}
181
182static bool default_mttcg_enabled(void)
183{
Alex Bennée83fd9622017-02-27 17:09:01 +0000184 if (use_icount || TCG_OVERSIZED_GUEST) {
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000185 return false;
186 } else {
187#ifdef TARGET_SUPPORTS_MTTCG
188 return check_tcg_memory_orders_compatible();
189#else
190 return false;
191#endif
192 }
193}
194
195void qemu_tcg_configure(QemuOpts *opts, Error **errp)
196{
197 const char *t = qemu_opt_get(opts, "thread");
198 if (t) {
199 if (strcmp(t, "multi") == 0) {
200 if (TCG_OVERSIZED_GUEST) {
201 error_setg(errp, "No MTTCG when guest word size > hosts");
Alex Bennée83fd9622017-02-27 17:09:01 +0000202 } else if (use_icount) {
203 error_setg(errp, "No MTTCG when icount is enabled");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000204 } else {
Nikunj A Dadhania86953502017-04-10 11:36:55 +0530205#ifndef TARGET_SUPPORTS_MTTCG
Alex Bennéec34c7622017-02-28 14:40:17 +0000206 error_report("Guest not yet converted to MTTCG - "
207 "you may get unexpected results");
208#endif
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000209 if (!check_tcg_memory_orders_compatible()) {
210 error_report("Guest expects a stronger memory ordering "
211 "than the host provides");
Pranith Kumar8cfef892017-03-25 16:19:23 -0400212 error_printf("This may cause strange/hard to debug errors\n");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000213 }
214 mttcg_enabled = true;
215 }
216 } else if (strcmp(t, "single") == 0) {
217 mttcg_enabled = false;
218 } else {
219 error_setg(errp, "Invalid 'thread' setting %s", t);
220 }
221 } else {
222 mttcg_enabled = default_mttcg_enabled();
223 }
224}
Paolo Bonzini946fb272011-09-12 13:57:37 +0200225
Alex Bennéee4cd9652017-03-31 16:09:42 +0100226/* The current number of executed instructions is based on what we
227 * originally budgeted minus the current state of the decrementing
228 * icount counters in extra/u16.low.
229 */
230static int64_t cpu_get_icount_executed(CPUState *cpu)
231{
232 return cpu->icount_budget - (cpu->icount_decr.u16.low + cpu->icount_extra);
233}
234
Alex Bennée512d3c82017-04-05 12:32:37 +0100235/*
236 * Update the global shared timer_state.qemu_icount to take into
237 * account executed instructions. This is done by the TCG vCPU
238 * thread so the main-loop can see time has moved forward.
239 */
240void cpu_update_icount(CPUState *cpu)
241{
242 int64_t executed = cpu_get_icount_executed(cpu);
243 cpu->icount_budget -= executed;
244
245#ifdef CONFIG_ATOMIC64
246 atomic_set__nocheck(&timers_state.qemu_icount,
247 atomic_read__nocheck(&timers_state.qemu_icount) +
248 executed);
249#else /* FIXME: we need 64bit atomics to do this safely */
250 timers_state.qemu_icount += executed;
251#endif
252}
253
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300254int64_t cpu_get_icount_raw(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200255{
256 int64_t icount;
Andreas Färber4917cf42013-05-27 05:17:50 +0200257 CPUState *cpu = current_cpu;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200258
Alex Bennée512d3c82017-04-05 12:32:37 +0100259 icount = atomic_read(&timers_state.qemu_icount);
Alex Bennée243c5f72017-03-30 18:49:22 +0100260 if (cpu && cpu->running) {
Paolo Bonzini414b15c2015-06-24 14:16:26 +0200261 if (!cpu->can_do_io) {
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300262 fprintf(stderr, "Bad icount read\n");
263 exit(1);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200264 }
Alex Bennéee4cd9652017-03-31 16:09:42 +0100265 /* Take into account what has run */
266 icount += cpu_get_icount_executed(cpu);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200267 }
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300268 return icount;
269}
270
271/* Return the virtual CPU time, based on the instruction counter. */
272static int64_t cpu_get_icount_locked(void)
273{
274 int64_t icount = cpu_get_icount_raw();
KONRAD Frederic3f031312014-08-01 01:37:15 +0200275 return timers_state.qemu_icount_bias + cpu_icount_to_ns(icount);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200276}
277
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200278int64_t cpu_get_icount(void)
279{
280 int64_t icount;
281 unsigned start;
282
283 do {
284 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
285 icount = cpu_get_icount_locked();
286 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
287
288 return icount;
289}
290
KONRAD Frederic3f031312014-08-01 01:37:15 +0200291int64_t cpu_icount_to_ns(int64_t icount)
292{
293 return icount << icount_time_shift;
294}
295
Cao jind90f3cc2016-07-29 19:05:38 +0800296/* return the time elapsed in VM between vm_start and vm_stop. Unless
297 * icount is active, cpu_get_ticks() uses units of the host CPU cycle
298 * counter.
299 *
300 * Caller must hold the BQL
301 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200302int64_t cpu_get_ticks(void)
303{
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100304 int64_t ticks;
305
Paolo Bonzini946fb272011-09-12 13:57:37 +0200306 if (use_icount) {
307 return cpu_get_icount();
308 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100309
310 ticks = timers_state.cpu_ticks_offset;
311 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400312 ticks += cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200313 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100314
315 if (timers_state.cpu_ticks_prev > ticks) {
316 /* Note: non increasing ticks may happen if the host uses
317 software suspend */
318 timers_state.cpu_ticks_offset += timers_state.cpu_ticks_prev - ticks;
319 ticks = timers_state.cpu_ticks_prev;
320 }
321
322 timers_state.cpu_ticks_prev = ticks;
323 return ticks;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200324}
325
Liu Ping Fancb365642013-09-25 14:20:58 +0800326static int64_t cpu_get_clock_locked(void)
327{
Cao jin1d45cea2016-07-29 19:05:37 +0800328 int64_t time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800329
Cao jin1d45cea2016-07-29 19:05:37 +0800330 time = timers_state.cpu_clock_offset;
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100331 if (timers_state.cpu_ticks_enabled) {
Cao jin1d45cea2016-07-29 19:05:37 +0800332 time += get_clock();
Liu Ping Fancb365642013-09-25 14:20:58 +0800333 }
334
Cao jin1d45cea2016-07-29 19:05:37 +0800335 return time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800336}
337
Cao jind90f3cc2016-07-29 19:05:38 +0800338/* Return the monotonic time elapsed in VM, i.e.,
Peter Maydell8212ff82016-09-15 10:24:22 +0100339 * the time between vm_start and vm_stop
340 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200341int64_t cpu_get_clock(void)
342{
343 int64_t ti;
Liu Ping Fancb365642013-09-25 14:20:58 +0800344 unsigned start;
345
346 do {
347 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
348 ti = cpu_get_clock_locked();
349 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
350
351 return ti;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200352}
353
Liu Ping Fancb365642013-09-25 14:20:58 +0800354/* enable cpu_get_ticks()
Cao jin3224e872016-07-08 18:31:37 +0800355 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800356 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200357void cpu_enable_ticks(void)
358{
Liu Ping Fancb365642013-09-25 14:20:58 +0800359 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400360 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200361 if (!timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400362 timers_state.cpu_ticks_offset -= cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200363 timers_state.cpu_clock_offset -= get_clock();
364 timers_state.cpu_ticks_enabled = 1;
365 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400366 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200367}
368
369/* disable cpu_get_ticks() : the clock is stopped. You must not call
Liu Ping Fancb365642013-09-25 14:20:58 +0800370 * cpu_get_ticks() after that.
Cao jin3224e872016-07-08 18:31:37 +0800371 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800372 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200373void cpu_disable_ticks(void)
374{
Liu Ping Fancb365642013-09-25 14:20:58 +0800375 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400376 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200377 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400378 timers_state.cpu_ticks_offset += cpu_get_host_ticks();
Liu Ping Fancb365642013-09-25 14:20:58 +0800379 timers_state.cpu_clock_offset = cpu_get_clock_locked();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200380 timers_state.cpu_ticks_enabled = 0;
381 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400382 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200383}
384
/*
 * Correlation between real and virtual time is always going to be
 * fairly approximate, so ignore small variation.
 * When the guest is idle real and virtual time will be aligned in
 * the IO wait loop.
 *
 * The tolerance is a tenth of a second, expressed in nanoseconds.
 */
#define ICOUNT_WOBBLE (NANOSECONDS_PER_SECOND / 10)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200390
391static void icount_adjust(void)
392{
393 int64_t cur_time;
394 int64_t cur_icount;
395 int64_t delta;
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200396
397 /* Protected by TimersState mutex. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200398 static int64_t last_delta;
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200399
Paolo Bonzini946fb272011-09-12 13:57:37 +0200400 /* If the VM is not running, then do nothing. */
401 if (!runstate_is_running()) {
402 return;
403 }
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200404
Emilio G. Cota03719e42016-06-08 14:55:21 -0400405 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200406 cur_time = cpu_get_clock_locked();
407 cur_icount = cpu_get_icount_locked();
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200408
Paolo Bonzini946fb272011-09-12 13:57:37 +0200409 delta = cur_icount - cur_time;
410 /* FIXME: This is a very crude algorithm, somewhat prone to oscillation. */
411 if (delta > 0
412 && last_delta + ICOUNT_WOBBLE < delta * 2
413 && icount_time_shift > 0) {
414 /* The guest is getting too far ahead. Slow time down. */
415 icount_time_shift--;
416 }
417 if (delta < 0
418 && last_delta - ICOUNT_WOBBLE > delta * 2
419 && icount_time_shift < MAX_ICOUNT_SHIFT) {
420 /* The guest is getting too far behind. Speed time up. */
421 icount_time_shift++;
422 }
423 last_delta = delta;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200424 timers_state.qemu_icount_bias = cur_icount
425 - (timers_state.qemu_icount << icount_time_shift);
Emilio G. Cota03719e42016-06-08 14:55:21 -0400426 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200427}
428
429static void icount_adjust_rt(void *opaque)
430{
Alex Bligh40daca52013-08-21 16:03:02 +0100431 timer_mod(icount_rt_timer,
Pavel Dovgalyuk1979b902015-01-12 15:00:43 +0300432 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200433 icount_adjust();
434}
435
436static void icount_adjust_vm(void *opaque)
437{
Alex Bligh40daca52013-08-21 16:03:02 +0100438 timer_mod(icount_vm_timer,
439 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530440 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200441 icount_adjust();
442}
443
444static int64_t qemu_icount_round(int64_t count)
445{
446 return (count + (1 << icount_time_shift) - 1) >> icount_time_shift;
447}
448
Pavel Dovgalyukefab87c2015-09-17 19:24:39 +0300449static void icount_warp_rt(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200450{
Alex Bennéeccffff42016-04-04 15:35:48 +0100451 unsigned seq;
452 int64_t warp_start;
453
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200454 /* The icount_warp_timer is rescheduled soon after vm_clock_warp_start
455 * changes from -1 to another value, so the race here is okay.
456 */
Alex Bennéeccffff42016-04-04 15:35:48 +0100457 do {
458 seq = seqlock_read_begin(&timers_state.vm_clock_seqlock);
459 warp_start = vm_clock_warp_start;
460 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, seq));
461
462 if (warp_start == -1) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200463 return;
464 }
465
Emilio G. Cota03719e42016-06-08 14:55:21 -0400466 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200467 if (runstate_is_running()) {
Pavel Dovgalyuk8eda2062015-09-17 19:24:28 +0300468 int64_t clock = REPLAY_CLOCK(REPLAY_CLOCK_VIRTUAL_RT,
469 cpu_get_clock_locked());
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200470 int64_t warp_delta;
471
472 warp_delta = clock - vm_clock_warp_start;
473 if (use_icount == 2) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200474 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100475 * In adaptive mode, do not let QEMU_CLOCK_VIRTUAL run too
Paolo Bonzini946fb272011-09-12 13:57:37 +0200476 * far ahead of real time.
477 */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200478 int64_t cur_icount = cpu_get_icount_locked();
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300479 int64_t delta = clock - cur_icount;
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200480 warp_delta = MIN(warp_delta, delta);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200481 }
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200482 timers_state.qemu_icount_bias += warp_delta;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200483 }
484 vm_clock_warp_start = -1;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400485 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200486
487 if (qemu_clock_expired(QEMU_CLOCK_VIRTUAL)) {
488 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
489 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200490}
491
/* Timer callback that forwards to icount_warp_rt(). @opaque is unused. */
static void icount_timer_cb(void *opaque)
{
    /* No need for a checkpoint because the timer already synchronizes
     * with CHECKPOINT_CLOCK_VIRTUAL_RT.
     */
    icount_warp_rt();
}
499
Paolo Bonzini8156be52012-03-28 15:42:04 +0200500void qtest_clock_warp(int64_t dest)
501{
Alex Bligh40daca52013-08-21 16:03:02 +0100502 int64_t clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800503 AioContext *aio_context;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200504 assert(qtest_enabled());
Fam Zhengefef88b2015-01-19 17:51:43 +0800505 aio_context = qemu_get_aio_context();
Paolo Bonzini8156be52012-03-28 15:42:04 +0200506 while (clock < dest) {
Alex Bligh40daca52013-08-21 16:03:02 +0100507 int64_t deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Sergey Fedorovc9299e22014-06-10 13:10:28 +0400508 int64_t warp = qemu_soonest_timeout(dest - clock, deadline);
Fam Zhengefef88b2015-01-19 17:51:43 +0800509
Emilio G. Cota03719e42016-06-08 14:55:21 -0400510 seqlock_write_begin(&timers_state.vm_clock_seqlock);
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200511 timers_state.qemu_icount_bias += warp;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400512 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200513
Alex Bligh40daca52013-08-21 16:03:02 +0100514 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800515 timerlist_run_timers(aio_context->tlg.tl[QEMU_CLOCK_VIRTUAL]);
Alex Bligh40daca52013-08-21 16:03:02 +0100516 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200517 }
Alex Bligh40daca52013-08-21 16:03:02 +0100518 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200519}
520
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300521void qemu_start_warp_timer(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200522{
Paolo Bonzinice78d182013-10-07 17:30:02 +0200523 int64_t clock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200524 int64_t deadline;
525
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300526 if (!use_icount) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200527 return;
528 }
529
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300530 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
531 * do not fire, so computing the deadline does not make sense.
532 */
533 if (!runstate_is_running()) {
534 return;
535 }
536
537 /* warp clock deterministically in record/replay mode */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300538 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_START)) {
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300539 return;
540 }
541
Paolo Bonzinice78d182013-10-07 17:30:02 +0200542 if (!all_cpu_threads_idle()) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200543 return;
544 }
545
Paolo Bonzini8156be52012-03-28 15:42:04 +0200546 if (qtest_enabled()) {
547 /* When testing, qtest commands advance icount. */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300548 return;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200549 }
550
Alex Blighac70aaf2013-08-21 16:02:57 +0100551 /* We want to use the earliest deadline from ALL vm_clocks */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300552 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT);
Alex Bligh40daca52013-08-21 16:03:02 +0100553 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200554 if (deadline < 0) {
Victor CLEMENTd7a0f712015-05-29 17:14:06 +0200555 static bool notified;
556 if (!icount_sleep && !notified) {
557 error_report("WARNING: icount sleep disabled and no active timers");
558 notified = true;
559 }
Paolo Bonzinice78d182013-10-07 17:30:02 +0200560 return;
Alex Blighac70aaf2013-08-21 16:02:57 +0100561 }
562
Paolo Bonzini946fb272011-09-12 13:57:37 +0200563 if (deadline > 0) {
564 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100565 * Ensure QEMU_CLOCK_VIRTUAL proceeds even when the virtual CPU goes to
Paolo Bonzini946fb272011-09-12 13:57:37 +0200566 * sleep. Otherwise, the CPU might be waiting for a future timer
567 * interrupt to wake it up, but the interrupt never comes because
568 * the vCPU isn't running any insns and thus doesn't advance the
Alex Bligh40daca52013-08-21 16:03:02 +0100569 * QEMU_CLOCK_VIRTUAL.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200570 */
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200571 if (!icount_sleep) {
572 /*
573 * We never let VCPUs sleep in no sleep icount mode.
574 * If there is a pending QEMU_CLOCK_VIRTUAL timer we just advance
575 * to the next QEMU_CLOCK_VIRTUAL event and notify it.
576 * It is useful when we want a deterministic execution time,
577 * isolated from host latencies.
578 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400579 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200580 timers_state.qemu_icount_bias += deadline;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400581 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200582 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
583 } else {
584 /*
585 * We do stop VCPUs and only advance QEMU_CLOCK_VIRTUAL after some
586 * "real" time, (related to the time left until the next event) has
587 * passed. The QEMU_CLOCK_VIRTUAL_RT clock will do this.
588 * This avoids that the warps are visible externally; for example,
589 * you will not be sending network packets continuously instead of
590 * every 100ms.
591 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400592 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200593 if (vm_clock_warp_start == -1 || vm_clock_warp_start > clock) {
594 vm_clock_warp_start = clock;
595 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400596 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200597 timer_mod_anticipate(icount_warp_timer, clock + deadline);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200598 }
Alex Blighac70aaf2013-08-21 16:02:57 +0100599 } else if (deadline == 0) {
Alex Bligh40daca52013-08-21 16:03:02 +0100600 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200601 }
602}
603
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300604static void qemu_account_warp_timer(void)
605{
606 if (!use_icount || !icount_sleep) {
607 return;
608 }
609
610 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
611 * do not fire, so computing the deadline does not make sense.
612 */
613 if (!runstate_is_running()) {
614 return;
615 }
616
617 /* warp clock deterministically in record/replay mode */
618 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_ACCOUNT)) {
619 return;
620 }
621
622 timer_del(icount_warp_timer);
623 icount_warp_rt();
624}
625
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200626static bool icount_state_needed(void *opaque)
627{
628 return use_icount;
629}
630
631/*
632 * This is a subsection for icount migration.
633 */
634static const VMStateDescription icount_vmstate_timers = {
635 .name = "timer/icount",
636 .version_id = 1,
637 .minimum_version_id = 1,
Juan Quintela5cd8cad2014-09-23 14:09:54 +0200638 .needed = icount_state_needed,
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200639 .fields = (VMStateField[]) {
640 VMSTATE_INT64(qemu_icount_bias, TimersState),
641 VMSTATE_INT64(qemu_icount, TimersState),
642 VMSTATE_END_OF_LIST()
643 }
644};
645
Paolo Bonzini946fb272011-09-12 13:57:37 +0200646static const VMStateDescription vmstate_timers = {
647 .name = "timer",
648 .version_id = 2,
649 .minimum_version_id = 1,
Juan Quintela35d08452014-04-16 16:01:33 +0200650 .fields = (VMStateField[]) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200651 VMSTATE_INT64(cpu_ticks_offset, TimersState),
652 VMSTATE_INT64(dummy, TimersState),
653 VMSTATE_INT64_V(cpu_clock_offset, TimersState, 2),
654 VMSTATE_END_OF_LIST()
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200655 },
Juan Quintela5cd8cad2014-09-23 14:09:54 +0200656 .subsections = (const VMStateDescription*[]) {
657 &icount_vmstate_timers,
658 NULL
Paolo Bonzini946fb272011-09-12 13:57:37 +0200659 }
660};
661
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100662static void cpu_throttle_thread(CPUState *cpu, run_on_cpu_data opaque)
Jason J. Herne2adcc852015-09-08 13:12:33 -0400663{
Jason J. Herne2adcc852015-09-08 13:12:33 -0400664 double pct;
665 double throttle_ratio;
666 long sleeptime_ns;
667
668 if (!cpu_throttle_get_percentage()) {
669 return;
670 }
671
672 pct = (double)cpu_throttle_get_percentage()/100;
673 throttle_ratio = pct / (1 - pct);
674 sleeptime_ns = (long)(throttle_ratio * CPU_THROTTLE_TIMESLICE_NS);
675
676 qemu_mutex_unlock_iothread();
677 atomic_set(&cpu->throttle_thread_scheduled, 0);
678 g_usleep(sleeptime_ns / 1000); /* Convert ns to us for usleep call */
679 qemu_mutex_lock_iothread();
680}
681
682static void cpu_throttle_timer_tick(void *opaque)
683{
684 CPUState *cpu;
685 double pct;
686
687 /* Stop the timer if needed */
688 if (!cpu_throttle_get_percentage()) {
689 return;
690 }
691 CPU_FOREACH(cpu) {
692 if (!atomic_xchg(&cpu->throttle_thread_scheduled, 1)) {
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100693 async_run_on_cpu(cpu, cpu_throttle_thread,
694 RUN_ON_CPU_NULL);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400695 }
696 }
697
698 pct = (double)cpu_throttle_get_percentage()/100;
699 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
700 CPU_THROTTLE_TIMESLICE_NS / (1-pct));
701}
702
703void cpu_throttle_set(int new_throttle_pct)
704{
705 /* Ensure throttle percentage is within valid range */
706 new_throttle_pct = MIN(new_throttle_pct, CPU_THROTTLE_PCT_MAX);
707 new_throttle_pct = MAX(new_throttle_pct, CPU_THROTTLE_PCT_MIN);
708
709 atomic_set(&throttle_percentage, new_throttle_pct);
710
711 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
712 CPU_THROTTLE_TIMESLICE_NS);
713}
714
715void cpu_throttle_stop(void)
716{
717 atomic_set(&throttle_percentage, 0);
718}
719
/* Returns true while a non-zero throttle percentage is set. */
bool cpu_throttle_active(void)
{
    int pct = cpu_throttle_get_percentage();

    return pct != 0;
}
724
725int cpu_throttle_get_percentage(void)
726{
727 return atomic_read(&throttle_percentage);
728}
729
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400730void cpu_ticks_init(void)
731{
Emilio G. Cotaccdb3c12016-06-08 14:55:20 -0400732 seqlock_init(&timers_state.vm_clock_seqlock);
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400733 vmstate_register(NULL, 0, &vmstate_timers, &timers_state);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400734 throttle_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
735 cpu_throttle_timer_tick, NULL);
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400736}
737
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200738void configure_icount(QemuOpts *opts, Error **errp)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200739{
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200740 const char *option;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200741 char *rem_str = NULL;
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200742
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200743 option = qemu_opt_get(opts, "shift");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200744 if (!option) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200745 if (qemu_opt_get(opts, "align") != NULL) {
746 error_setg(errp, "Please specify shift option when using align");
747 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200748 return;
749 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200750
751 icount_sleep = qemu_opt_get_bool(opts, "sleep", true);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200752 if (icount_sleep) {
753 icount_warp_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300754 icount_timer_cb, NULL);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200755 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200756
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200757 icount_align_option = qemu_opt_get_bool(opts, "align", false);
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200758
759 if (icount_align_option && !icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500760 error_setg(errp, "align=on and sleep=off are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200761 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200762 if (strcmp(option, "auto") != 0) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200763 errno = 0;
764 icount_time_shift = strtol(option, &rem_str, 0);
765 if (errno != 0 || *rem_str != '\0' || !strlen(option)) {
766 error_setg(errp, "icount: Invalid shift value");
767 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200768 use_icount = 1;
769 return;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200770 } else if (icount_align_option) {
771 error_setg(errp, "shift=auto and align=on are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200772 } else if (!icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500773 error_setg(errp, "shift=auto and sleep=off are incompatible");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200774 }
775
776 use_icount = 2;
777
778 /* 125MIPS seems a reasonable initial guess at the guest speed.
779 It will be corrected fairly quickly anyway. */
780 icount_time_shift = 3;
781
782 /* Have both realtime and virtual time triggers for speed adjustment.
783 The realtime trigger catches emulated time passing too slowly,
784 the virtual time trigger catches emulated time passing too fast.
785 Realtime triggers occur even when idle, so use them less frequently
786 than VM triggers. */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300787 icount_rt_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL_RT,
788 icount_adjust_rt, NULL);
Alex Bligh40daca52013-08-21 16:03:02 +0100789 timer_mod(icount_rt_timer,
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300790 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Alex Bligh40daca52013-08-21 16:03:02 +0100791 icount_vm_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
792 icount_adjust_vm, NULL);
793 timer_mod(icount_vm_timer,
794 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530795 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200796}
797
798/***********************************************************/
/* TCG vCPU kick timer
 *
 * The kick timer is responsible for moving single threaded vCPU
 * emulation on to the next vCPU. If more than one vCPU is running, a
 * timer event will force a cpu->exit so the next vCPU can get
 * scheduled.
 *
 * The timer is removed if all vCPUs are idle and restarted again once
 * idleness is complete.
 */
809
810static QEMUTimer *tcg_kick_vcpu_timer;
Alex Bennée791158d2017-02-23 18:29:10 +0000811static CPUState *tcg_current_rr_cpu;
Alex Bennée65467062017-02-23 18:29:09 +0000812
813#define TCG_KICK_PERIOD (NANOSECONDS_PER_SECOND / 10)
814
815static inline int64_t qemu_tcg_next_kick(void)
816{
817 return qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + TCG_KICK_PERIOD;
818}
819
Alex Bennée791158d2017-02-23 18:29:10 +0000820/* Kick the currently round-robin scheduled vCPU */
821static void qemu_cpu_kick_rr_cpu(void)
822{
823 CPUState *cpu;
Alex Bennée791158d2017-02-23 18:29:10 +0000824 do {
825 cpu = atomic_mb_read(&tcg_current_rr_cpu);
826 if (cpu) {
827 cpu_exit(cpu);
828 }
829 } while (cpu != atomic_mb_read(&tcg_current_rr_cpu));
830}
831
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100832static void do_nothing(CPUState *cpu, run_on_cpu_data unused)
833{
834}
835
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100836void qemu_timer_notify_cb(void *opaque, QEMUClockType type)
837{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100838 if (!use_icount || type != QEMU_CLOCK_VIRTUAL) {
839 qemu_notify_event();
840 return;
841 }
842
843 if (!qemu_in_vcpu_thread() && first_cpu) {
844 /* qemu_cpu_kick is not enough to kick a halted CPU out of
845 * qemu_tcg_wait_io_event. async_run_on_cpu, instead,
846 * causes cpu_thread_is_idle to return false. This way,
847 * handle_icount_deadline can run.
848 */
849 async_run_on_cpu(first_cpu, do_nothing, RUN_ON_CPU_NULL);
850 }
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100851}
852
Alex Bennée65467062017-02-23 18:29:09 +0000853static void kick_tcg_thread(void *opaque)
854{
855 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
Alex Bennée791158d2017-02-23 18:29:10 +0000856 qemu_cpu_kick_rr_cpu();
Alex Bennée65467062017-02-23 18:29:09 +0000857}
858
859static void start_tcg_kick_timer(void)
860{
Alex Bennée37257942017-02-23 18:29:14 +0000861 if (!mttcg_enabled && !tcg_kick_vcpu_timer && CPU_NEXT(first_cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +0000862 tcg_kick_vcpu_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
863 kick_tcg_thread, NULL);
864 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
865 }
866}
867
868static void stop_tcg_kick_timer(void)
869{
870 if (tcg_kick_vcpu_timer) {
871 timer_del(tcg_kick_vcpu_timer);
872 tcg_kick_vcpu_timer = NULL;
873 }
874}
875
Alex Bennée65467062017-02-23 18:29:09 +0000876/***********************************************************/
Blue Swirl296af7c2010-03-29 19:23:50 +0000877void hw_error(const char *fmt, ...)
878{
879 va_list ap;
Andreas Färber55e5c282012-12-17 06:18:02 +0100880 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000881
882 va_start(ap, fmt);
883 fprintf(stderr, "qemu: hardware error: ");
884 vfprintf(stderr, fmt, ap);
885 fprintf(stderr, "\n");
Andreas Färberbdc44642013-06-24 23:50:24 +0200886 CPU_FOREACH(cpu) {
Andreas Färber55e5c282012-12-17 06:18:02 +0100887 fprintf(stderr, "CPU #%d:\n", cpu->cpu_index);
Andreas Färber878096e2013-05-27 01:33:50 +0200888 cpu_dump_state(cpu, stderr, fprintf, CPU_DUMP_FPU);
Blue Swirl296af7c2010-03-29 19:23:50 +0000889 }
890 va_end(ap);
891 abort();
892}
893
894void cpu_synchronize_all_states(void)
895{
Andreas Färber182735e2013-05-29 22:29:20 +0200896 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000897
Andreas Färberbdc44642013-06-24 23:50:24 +0200898 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200899 cpu_synchronize_state(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000900 }
901}
902
903void cpu_synchronize_all_post_reset(void)
904{
Andreas Färber182735e2013-05-29 22:29:20 +0200905 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000906
Andreas Färberbdc44642013-06-24 23:50:24 +0200907 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200908 cpu_synchronize_post_reset(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000909 }
910}
911
912void cpu_synchronize_all_post_init(void)
913{
Andreas Färber182735e2013-05-29 22:29:20 +0200914 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000915
Andreas Färberbdc44642013-06-24 23:50:24 +0200916 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200917 cpu_synchronize_post_init(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000918 }
919}
920
Kevin Wolf56983462013-07-05 13:49:54 +0200921static int do_vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +0000922{
Kevin Wolf56983462013-07-05 13:49:54 +0200923 int ret = 0;
924
Luiz Capitulino13548692011-07-29 15:36:43 -0300925 if (runstate_is_running()) {
Blue Swirl296af7c2010-03-29 19:23:50 +0000926 cpu_disable_ticks();
Blue Swirl296af7c2010-03-29 19:23:50 +0000927 pause_all_vcpus();
Luiz Capitulinof5bbfba2011-07-29 15:04:45 -0300928 runstate_set(state);
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -0300929 vm_state_notify(0, state);
Wenchao Xiaa4e15de2014-06-18 08:43:36 +0200930 qapi_event_send_stop(&error_abort);
Blue Swirl296af7c2010-03-29 19:23:50 +0000931 }
Kevin Wolf56983462013-07-05 13:49:54 +0200932
Kevin Wolf594a45c2013-07-18 14:52:19 +0200933 bdrv_drain_all();
Pavel Dovgalyuk6d0ceb82016-09-26 11:08:16 +0300934 replay_disable_events();
John Snow22af08e2016-09-22 21:45:51 -0400935 ret = bdrv_flush_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +0200936
Kevin Wolf56983462013-07-05 13:49:54 +0200937 return ret;
Blue Swirl296af7c2010-03-29 19:23:50 +0000938}
939
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200940static bool cpu_can_run(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +0000941{
Andreas Färber4fdeee72012-05-02 23:10:09 +0200942 if (cpu->stop) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200943 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100944 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +0800945 if (cpu_is_stopped(cpu)) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200946 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100947 }
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200948 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +0000949}
950
Andreas Färber91325042013-05-27 02:07:49 +0200951static void cpu_handle_guest_debug(CPUState *cpu)
Jan Kiszka3c638d02010-06-25 16:56:56 +0200952{
Andreas Färber64f6b342013-05-27 02:06:09 +0200953 gdb_set_stop_cpu(cpu);
Jan Kiszka8cf71712011-02-07 12:19:16 +0100954 qemu_system_debug_request();
Andreas Färberf324e762012-05-02 23:26:21 +0200955 cpu->stopped = true;
Jan Kiszka3c638d02010-06-25 16:56:56 +0200956}
957
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100958#ifdef CONFIG_LINUX
959static void sigbus_reraise(void)
960{
961 sigset_t set;
962 struct sigaction action;
963
964 memset(&action, 0, sizeof(action));
965 action.sa_handler = SIG_DFL;
966 if (!sigaction(SIGBUS, &action, NULL)) {
967 raise(SIGBUS);
968 sigemptyset(&set);
969 sigaddset(&set, SIGBUS);
Peter Maydella2d17612016-05-16 18:33:59 +0100970 pthread_sigmask(SIG_UNBLOCK, &set, NULL);
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100971 }
972 perror("Failed to re-raise SIGBUS!\n");
973 abort();
974}
975
Paolo Bonzinid98d4072017-02-08 13:22:12 +0100976static void sigbus_handler(int n, siginfo_t *siginfo, void *ctx)
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100977{
Paolo Bonzinia16fc072017-02-09 09:50:02 +0100978 if (siginfo->si_code != BUS_MCEERR_AO && siginfo->si_code != BUS_MCEERR_AR) {
979 sigbus_reraise();
980 }
981
Paolo Bonzini2ae41db2017-02-08 12:48:54 +0100982 if (current_cpu) {
983 /* Called asynchronously in VCPU thread. */
984 if (kvm_on_sigbus_vcpu(current_cpu, siginfo->si_code, siginfo->si_addr)) {
985 sigbus_reraise();
986 }
987 } else {
988 /* Called synchronously (via signalfd) in main thread. */
989 if (kvm_on_sigbus(siginfo->si_code, siginfo->si_addr)) {
990 sigbus_reraise();
991 }
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100992 }
993}
994
995static void qemu_init_sigbus(void)
996{
997 struct sigaction action;
998
999 memset(&action, 0, sizeof(action));
1000 action.sa_flags = SA_SIGINFO;
Paolo Bonzinid98d4072017-02-08 13:22:12 +01001001 action.sa_sigaction = sigbus_handler;
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001002 sigaction(SIGBUS, &action, NULL);
1003
1004 prctl(PR_MCE_KILL, PR_MCE_KILL_SET, PR_MCE_KILL_EARLY, 0, 0);
1005}
Paolo Bonzinia16fc072017-02-09 09:50:02 +01001006#else /* !CONFIG_LINUX */
/* Non-Linux build: no SIGBUS handling is set up. */
static void qemu_init_sigbus(void)
{
    /* nothing to do */
}
Paolo Bonzinia16fc072017-02-09 09:50:02 +01001010#endif /* !CONFIG_LINUX */
Blue Swirl296af7c2010-03-29 19:23:50 +00001011
Stefan Weilb2532d82012-09-27 07:41:42 +02001012static QemuMutex qemu_global_mutex;
Blue Swirl296af7c2010-03-29 19:23:50 +00001013
1014static QemuThread io_thread;
1015
Blue Swirl296af7c2010-03-29 19:23:50 +00001016/* cpu creation */
1017static QemuCond qemu_cpu_cond;
1018/* system init */
Blue Swirl296af7c2010-03-29 19:23:50 +00001019static QemuCond qemu_pause_cond;
1020
Paolo Bonzinid3b12f52011-09-13 10:30:52 +02001021void qemu_init_cpu_loop(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001022{
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001023 qemu_init_sigbus();
Anthony Liguoried945922011-02-08 18:18:18 +01001024 qemu_cond_init(&qemu_cpu_cond);
Anthony Liguoried945922011-02-08 18:18:18 +01001025 qemu_cond_init(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001026 qemu_mutex_init(&qemu_global_mutex);
Blue Swirl296af7c2010-03-29 19:23:50 +00001027
Jan Kiszkab7680cb2011-03-12 17:43:51 +01001028 qemu_thread_get_self(&io_thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001029}
1030
Paolo Bonzini14e6fe12016-10-31 10:36:08 +01001031void run_on_cpu(CPUState *cpu, run_on_cpu_func func, run_on_cpu_data data)
Marcelo Tosattie82bcec2010-05-04 09:45:22 -03001032{
Sergey Fedorovd148d902016-08-29 09:51:00 +02001033 do_run_on_cpu(cpu, func, data, &qemu_global_mutex);
Chegu Vinod3c022702013-06-24 03:49:41 -06001034}
1035
Gu Zheng4c055ab2016-05-12 09:18:13 +05301036static void qemu_kvm_destroy_vcpu(CPUState *cpu)
1037{
1038 if (kvm_destroy_vcpu(cpu) < 0) {
1039 error_report("kvm_destroy_vcpu failed");
1040 exit(EXIT_FAILURE);
1041 }
1042}
1043
1044static void qemu_tcg_destroy_vcpu(CPUState *cpu)
1045{
1046}
1047
Andreas Färber509a0d72012-05-03 02:18:09 +02001048static void qemu_wait_io_event_common(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001049{
Alex Bennée37257942017-02-23 18:29:14 +00001050 atomic_mb_set(&cpu->thread_kicked, false);
Andreas Färber4fdeee72012-05-02 23:10:09 +02001051 if (cpu->stop) {
1052 cpu->stop = false;
Andreas Färberf324e762012-05-02 23:26:21 +02001053 cpu->stopped = true;
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001054 qemu_cond_broadcast(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001055 }
Sergey Fedorova5403c62016-08-02 18:27:36 +01001056 process_queued_cpu_work(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001057}
1058
1059static bool qemu_tcg_should_sleep(CPUState *cpu)
1060{
1061 if (mttcg_enabled) {
1062 return cpu_thread_is_idle(cpu);
1063 } else {
1064 return all_cpu_threads_idle();
1065 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001066}
1067
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001068static void qemu_tcg_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001069{
Alex Bennée37257942017-02-23 18:29:14 +00001070 while (qemu_tcg_should_sleep(cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +00001071 stop_tcg_kick_timer();
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001072 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001073 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001074
Alex Bennée65467062017-02-23 18:29:09 +00001075 start_tcg_kick_timer();
1076
Alex Bennée37257942017-02-23 18:29:14 +00001077 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001078}
1079
Andreas Färberfd529e82013-05-26 23:24:55 +02001080static void qemu_kvm_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001081{
Andreas Färbera98ae1d2013-05-26 23:21:08 +02001082 while (cpu_thread_is_idle(cpu)) {
Andreas Färberf5c121b2012-05-03 01:22:49 +02001083 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001084 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001085
Andreas Färber509a0d72012-05-03 02:18:09 +02001086 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001087}
1088
Jan Kiszka7e97cd82011-02-07 12:19:12 +01001089static void *qemu_kvm_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001090{
Andreas Färber48a106b2013-05-27 02:20:39 +02001091 CPUState *cpu = arg;
Jan Kiszka84b49152011-02-01 22:15:50 +01001092 int r;
Blue Swirl296af7c2010-03-29 19:23:50 +00001093
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001094 rcu_register_thread();
1095
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001096 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001097 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001098 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001099 cpu->can_do_io = 1;
Andreas Färber4917cf42013-05-27 05:17:50 +02001100 current_cpu = cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001101
Andreas Färber504134d2012-12-17 06:38:45 +01001102 r = kvm_init_vcpu(cpu);
Jan Kiszka84b49152011-02-01 22:15:50 +01001103 if (r < 0) {
1104 fprintf(stderr, "kvm_init_vcpu failed: %s\n", strerror(-r));
1105 exit(1);
1106 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001107
Paolo Bonzini18268b62017-02-09 09:41:14 +01001108 kvm_init_cpu_signals(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001109
1110 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001111 cpu->created = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001112 qemu_cond_signal(&qemu_cpu_cond);
1113
Gu Zheng4c055ab2016-05-12 09:18:13 +05301114 do {
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001115 if (cpu_can_run(cpu)) {
Andreas Färber1458c362013-05-26 23:46:55 +02001116 r = kvm_cpu_exec(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001117 if (r == EXCP_DEBUG) {
Andreas Färber91325042013-05-27 02:07:49 +02001118 cpu_handle_guest_debug(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001119 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001120 }
Andreas Färberfd529e82013-05-26 23:24:55 +02001121 qemu_kvm_wait_io_event(cpu);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301122 } while (!cpu->unplug || cpu_can_run(cpu));
Blue Swirl296af7c2010-03-29 19:23:50 +00001123
Gu Zheng4c055ab2016-05-12 09:18:13 +05301124 qemu_kvm_destroy_vcpu(cpu);
Bharata B Rao2c579042016-05-12 09:18:14 +05301125 cpu->created = false;
1126 qemu_cond_signal(&qemu_cpu_cond);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301127 qemu_mutex_unlock_iothread();
Blue Swirl296af7c2010-03-29 19:23:50 +00001128 return NULL;
1129}
1130
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001131static void *qemu_dummy_cpu_thread_fn(void *arg)
1132{
1133#ifdef _WIN32
1134 fprintf(stderr, "qtest is not supported under Windows\n");
1135 exit(1);
1136#else
Andreas Färber10a90212013-05-27 02:24:35 +02001137 CPUState *cpu = arg;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001138 sigset_t waitset;
1139 int r;
1140
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001141 rcu_register_thread();
1142
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001143 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001144 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001145 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001146 cpu->can_do_io = 1;
Alex Bennée37257942017-02-23 18:29:14 +00001147 current_cpu = cpu;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001148
1149 sigemptyset(&waitset);
1150 sigaddset(&waitset, SIG_IPI);
1151
1152 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001153 cpu->created = true;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001154 qemu_cond_signal(&qemu_cpu_cond);
1155
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001156 while (1) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001157 qemu_mutex_unlock_iothread();
1158 do {
1159 int sig;
1160 r = sigwait(&waitset, &sig);
1161 } while (r == -1 && (errno == EAGAIN || errno == EINTR));
1162 if (r == -1) {
1163 perror("sigwait");
1164 exit(1);
1165 }
1166 qemu_mutex_lock_iothread();
Andreas Färber509a0d72012-05-03 02:18:09 +02001167 qemu_wait_io_event_common(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001168 }
1169
1170 return NULL;
1171#endif
1172}
1173
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001174static int64_t tcg_get_icount_limit(void)
1175{
1176 int64_t deadline;
1177
1178 if (replay_mode != REPLAY_MODE_PLAY) {
1179 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1180
1181 /* Maintain prior (possibly buggy) behaviour where if no deadline
1182 * was set (as there is no QEMU_CLOCK_VIRTUAL timer) or it is more than
1183 * INT32_MAX nanoseconds ahead, we still use INT32_MAX
1184 * nanoseconds.
1185 */
1186 if ((deadline < 0) || (deadline > INT32_MAX)) {
1187 deadline = INT32_MAX;
1188 }
1189
1190 return qemu_icount_round(deadline);
1191 } else {
1192 return replay_get_instructions();
1193 }
1194}
1195
Alex Bennée12e97002016-10-27 16:10:14 +01001196static void handle_icount_deadline(void)
1197{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001198 assert(qemu_in_vcpu_thread());
Alex Bennée12e97002016-10-27 16:10:14 +01001199 if (use_icount) {
1200 int64_t deadline =
1201 qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1202
1203 if (deadline == 0) {
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001204 /* Wake up other AioContexts. */
Alex Bennée12e97002016-10-27 16:10:14 +01001205 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001206 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Alex Bennée12e97002016-10-27 16:10:14 +01001207 }
1208 }
1209}
1210
Alex Bennée05248382017-03-29 16:46:59 +01001211static void prepare_icount_for_run(CPUState *cpu)
1212{
1213 if (use_icount) {
1214 int64_t count;
1215 int decr;
1216
1217 /* These should always be cleared by process_icount_data after
1218 * each vCPU execution. However u16.high can be raised
1219 * asynchronously by cpu_exit/cpu_interrupt/tcg_handle_interrupt
1220 */
1221 g_assert(cpu->icount_decr.u16.low == 0);
1222 g_assert(cpu->icount_extra == 0);
1223
1224
1225 count = tcg_get_icount_limit();
1226
Alex Bennéee4cd9652017-03-31 16:09:42 +01001227 /* To calculate what we have executed so far we need to know
1228 * what we originally budgeted to run this cycle */
1229 cpu->icount_budget = count;
1230
Alex Bennée05248382017-03-29 16:46:59 +01001231 decr = (count > 0xffff) ? 0xffff : count;
1232 count -= decr;
1233 cpu->icount_decr.u16.low = decr;
1234 cpu->icount_extra = count;
1235 }
1236}
1237
1238static void process_icount_data(CPUState *cpu)
1239{
1240 if (use_icount) {
Alex Bennéee4cd9652017-03-31 16:09:42 +01001241 /* Account for executed instructions */
Alex Bennée512d3c82017-04-05 12:32:37 +01001242 cpu_update_icount(cpu);
Alex Bennée05248382017-03-29 16:46:59 +01001243
1244 /* Reset the counters */
1245 cpu->icount_decr.u16.low = 0;
1246 cpu->icount_extra = 0;
Alex Bennéee4cd9652017-03-31 16:09:42 +01001247 cpu->icount_budget = 0;
1248
Alex Bennée05248382017-03-29 16:46:59 +01001249 replay_account_executed_instructions();
1250 }
1251}
1252
1253
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001254static int tcg_cpu_exec(CPUState *cpu)
1255{
1256 int ret;
1257#ifdef CONFIG_PROFILER
1258 int64_t ti;
1259#endif
1260
1261#ifdef CONFIG_PROFILER
1262 ti = profile_getclock();
1263#endif
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001264 qemu_mutex_unlock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001265 cpu_exec_start(cpu);
1266 ret = cpu_exec(cpu);
1267 cpu_exec_end(cpu);
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001268 qemu_mutex_lock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001269#ifdef CONFIG_PROFILER
1270 tcg_time += profile_getclock() - ti;
1271#endif
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001272 return ret;
1273}
1274
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001275/* Destroy any remaining vCPUs which have been unplugged and have
1276 * finished running
1277 */
1278static void deal_with_unplugged_cpus(void)
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001279{
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001280 CPUState *cpu;
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001281
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001282 CPU_FOREACH(cpu) {
1283 if (cpu->unplug && !cpu_can_run(cpu)) {
1284 qemu_tcg_destroy_vcpu(cpu);
1285 cpu->created = false;
1286 qemu_cond_signal(&qemu_cpu_cond);
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001287 break;
1288 }
1289 }
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001290}
Jan Kiszkabdb7ca62011-09-26 09:40:39 +02001291
Alex Bennée65467062017-02-23 18:29:09 +00001292/* Single-threaded TCG
1293 *
1294 * In the single-threaded case each vCPU is simulated in turn. If
1295 * there is more than a single vCPU we create a simple timer to kick
1296 * the vCPU and ensure we don't get stuck in a tight loop in one vCPU.
1297 * This is done explicitly rather than relying on side-effects
1298 * elsewhere.
1299 */
1300
Alex Bennée37257942017-02-23 18:29:14 +00001301static void *qemu_tcg_rr_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001302{
Andreas Färberc3586ba2012-05-03 01:41:24 +02001303 CPUState *cpu = arg;
Blue Swirl296af7c2010-03-29 19:23:50 +00001304
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001305 rcu_register_thread();
1306
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001307 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001308 qemu_thread_get_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001309
Andreas Färber38fcbd32013-07-07 19:50:23 +02001310 CPU_FOREACH(cpu) {
1311 cpu->thread_id = qemu_get_thread_id();
1312 cpu->created = true;
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001313 cpu->can_do_io = 1;
Andreas Färber38fcbd32013-07-07 19:50:23 +02001314 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001315 qemu_cond_signal(&qemu_cpu_cond);
1316
Jan Kiszkafa7d1862011-08-22 18:35:25 +02001317 /* wait for initial kick-off after machine start */
Emilio G. Cotac28e3992015-04-27 12:45:28 -04001318 while (first_cpu->stopped) {
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001319 qemu_cond_wait(first_cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001320
1321 /* process any pending work */
Andreas Färberbdc44642013-06-24 23:50:24 +02001322 CPU_FOREACH(cpu) {
Alex Bennée37257942017-02-23 18:29:14 +00001323 current_cpu = cpu;
Andreas Färber182735e2013-05-29 22:29:20 +02001324 qemu_wait_io_event_common(cpu);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001325 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001326 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001327
Alex Bennée65467062017-02-23 18:29:09 +00001328 start_tcg_kick_timer();
1329
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001330 cpu = first_cpu;
1331
Alex Bennéee5143e32017-02-23 18:29:12 +00001332 /* process any pending work */
1333 cpu->exit_request = 1;
1334
Blue Swirl296af7c2010-03-29 19:23:50 +00001335 while (1) {
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001336 /* Account partial waits to QEMU_CLOCK_VIRTUAL. */
1337 qemu_account_warp_timer();
1338
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001339 /* Run the timers here. This is much more efficient than
1340 * waking up the I/O thread and waiting for completion.
1341 */
1342 handle_icount_deadline();
1343
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001344 if (!cpu) {
1345 cpu = first_cpu;
1346 }
1347
Alex Bennéee5143e32017-02-23 18:29:12 +00001348 while (cpu && !cpu->queued_work_first && !cpu->exit_request) {
1349
Alex Bennée791158d2017-02-23 18:29:10 +00001350 atomic_mb_set(&tcg_current_rr_cpu, cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001351 current_cpu = cpu;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001352
1353 qemu_clock_enable(QEMU_CLOCK_VIRTUAL,
1354 (cpu->singlestep_enabled & SSTEP_NOTIMER) == 0);
1355
1356 if (cpu_can_run(cpu)) {
1357 int r;
Alex Bennée05248382017-03-29 16:46:59 +01001358
1359 prepare_icount_for_run(cpu);
1360
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001361 r = tcg_cpu_exec(cpu);
Alex Bennée05248382017-03-29 16:46:59 +01001362
1363 process_icount_data(cpu);
1364
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001365 if (r == EXCP_DEBUG) {
1366 cpu_handle_guest_debug(cpu);
1367 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001368 } else if (r == EXCP_ATOMIC) {
1369 qemu_mutex_unlock_iothread();
1370 cpu_exec_step_atomic(cpu);
1371 qemu_mutex_lock_iothread();
1372 break;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001373 }
Alex Bennée37257942017-02-23 18:29:14 +00001374 } else if (cpu->stop) {
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001375 if (cpu->unplug) {
1376 cpu = CPU_NEXT(cpu);
1377 }
1378 break;
1379 }
1380
Alex Bennéee5143e32017-02-23 18:29:12 +00001381 cpu = CPU_NEXT(cpu);
1382 } /* while (cpu && !cpu->exit_request).. */
1383
Alex Bennée791158d2017-02-23 18:29:10 +00001384 /* Does not need atomic_mb_set because a spurious wakeup is okay. */
1385 atomic_set(&tcg_current_rr_cpu, NULL);
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001386
Alex Bennéee5143e32017-02-23 18:29:12 +00001387 if (cpu && cpu->exit_request) {
1388 atomic_mb_set(&cpu->exit_request, 0);
1389 }
Alex Blighac70aaf2013-08-21 16:02:57 +01001390
Alex Bennée37257942017-02-23 18:29:14 +00001391 qemu_tcg_wait_io_event(cpu ? cpu : QTAILQ_FIRST(&cpus));
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001392 deal_with_unplugged_cpus();
Blue Swirl296af7c2010-03-29 19:23:50 +00001393 }
1394
1395 return NULL;
1396}
1397
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001398static void *qemu_hax_cpu_thread_fn(void *arg)
1399{
1400 CPUState *cpu = arg;
1401 int r;
Vincent Palatinb3d3a422017-03-20 11:15:49 +01001402
1403 qemu_mutex_lock_iothread();
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001404 qemu_thread_get_self(cpu->thread);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001405
1406 cpu->thread_id = qemu_get_thread_id();
1407 cpu->created = true;
1408 cpu->halted = 0;
1409 current_cpu = cpu;
1410
1411 hax_init_vcpu(cpu);
1412 qemu_cond_signal(&qemu_cpu_cond);
1413
1414 while (1) {
1415 if (cpu_can_run(cpu)) {
1416 r = hax_smp_cpu_exec(cpu);
1417 if (r == EXCP_DEBUG) {
1418 cpu_handle_guest_debug(cpu);
1419 }
1420 }
1421
1422 while (cpu_thread_is_idle(cpu)) {
1423 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
1424 }
1425#ifdef _WIN32
1426 SleepEx(0, TRUE);
1427#endif
1428 qemu_wait_io_event_common(cpu);
1429 }
1430 return NULL;
1431}
1432
1433#ifdef _WIN32
1434static void CALLBACK dummy_apc_func(ULONG_PTR unused)
1435{
1436}
1437#endif
1438
Alex Bennée37257942017-02-23 18:29:14 +00001439/* Multi-threaded TCG
1440 *
1441 * In the multi-threaded case each vCPU has its own thread. The TLS
1442 * variable current_cpu can be used deep in the code to find the
1443 * current CPUState for a given thread.
1444 */
1445
1446static void *qemu_tcg_cpu_thread_fn(void *arg)
1447{
1448 CPUState *cpu = arg;
1449
Alex Bennéebf51c722017-03-30 18:32:29 +01001450 g_assert(!use_icount);
1451
Alex Bennée37257942017-02-23 18:29:14 +00001452 rcu_register_thread();
1453
1454 qemu_mutex_lock_iothread();
1455 qemu_thread_get_self(cpu->thread);
1456
1457 cpu->thread_id = qemu_get_thread_id();
1458 cpu->created = true;
1459 cpu->can_do_io = 1;
1460 current_cpu = cpu;
1461 qemu_cond_signal(&qemu_cpu_cond);
1462
1463 /* process any pending work */
1464 cpu->exit_request = 1;
1465
1466 while (1) {
1467 if (cpu_can_run(cpu)) {
1468 int r;
1469 r = tcg_cpu_exec(cpu);
1470 switch (r) {
1471 case EXCP_DEBUG:
1472 cpu_handle_guest_debug(cpu);
1473 break;
1474 case EXCP_HALTED:
1475 /* during start-up the vCPU is reset and the thread is
1476 * kicked several times. If we don't ensure we go back
1477 * to sleep in the halted state we won't cleanly
1478 * start-up when the vCPU is enabled.
1479 *
1480 * cpu->halted should ensure we sleep in wait_io_event
1481 */
1482 g_assert(cpu->halted);
1483 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001484 case EXCP_ATOMIC:
1485 qemu_mutex_unlock_iothread();
1486 cpu_exec_step_atomic(cpu);
1487 qemu_mutex_lock_iothread();
Alex Bennée37257942017-02-23 18:29:14 +00001488 default:
1489 /* Ignore everything else? */
1490 break;
1491 }
1492 }
1493
Alex Bennée37257942017-02-23 18:29:14 +00001494 atomic_mb_set(&cpu->exit_request, 0);
1495 qemu_tcg_wait_io_event(cpu);
1496 }
1497
1498 return NULL;
1499}
1500
Andreas Färber2ff09a42012-05-03 00:23:30 +02001501static void qemu_cpu_kick_thread(CPUState *cpu)
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001502{
1503#ifndef _WIN32
1504 int err;
1505
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001506 if (cpu->thread_kicked) {
1507 return;
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001508 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001509 cpu->thread_kicked = true;
Andreas Färber814e6122012-05-02 17:00:37 +02001510 err = pthread_kill(cpu->thread->thread, SIG_IPI);
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001511 if (err) {
1512 fprintf(stderr, "qemu:%s: %s", __func__, strerror(err));
1513 exit(1);
1514 }
1515#else /* _WIN32 */
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001516 if (!qemu_cpu_is_self(cpu)) {
1517 if (!QueueUserAPC(dummy_apc_func, cpu->hThread, 0)) {
1518 fprintf(stderr, "%s: QueueUserAPC failed with error %lu\n",
1519 __func__, GetLastError());
1520 exit(1);
1521 }
1522 }
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001523#endif
1524}
1525
Andreas Färberc08d7422012-05-03 04:34:15 +02001526void qemu_cpu_kick(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001527{
Andreas Färberf5c121b2012-05-03 01:22:49 +02001528 qemu_cond_broadcast(cpu->halt_cond);
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001529 if (tcg_enabled()) {
Alex Bennée791158d2017-02-23 18:29:10 +00001530 cpu_exit(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001531 /* NOP unless doing single-thread RR */
Alex Bennée791158d2017-02-23 18:29:10 +00001532 qemu_cpu_kick_rr_cpu();
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001533 } else {
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001534 if (hax_enabled()) {
1535 /*
1536 * FIXME: race condition with the exit_request check in
1537 * hax_vcpu_hax_exec
1538 */
1539 cpu->exit_request = 1;
1540 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001541 qemu_cpu_kick_thread(cpu);
1542 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001543}
1544
Jan Kiszka46d62fa2011-02-01 22:15:59 +01001545void qemu_cpu_kick_self(void)
1546{
Andreas Färber4917cf42013-05-27 05:17:50 +02001547 assert(current_cpu);
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001548 qemu_cpu_kick_thread(current_cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001549}
1550
Andreas Färber60e82572012-05-02 22:23:49 +02001551bool qemu_cpu_is_self(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001552{
Andreas Färber814e6122012-05-02 17:00:37 +02001553 return qemu_thread_is_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001554}
1555
Paolo Bonzini79e2b9a2015-01-21 12:09:14 +01001556bool qemu_in_vcpu_thread(void)
Juan Quintelaaa723c22012-09-18 16:30:11 +02001557{
Andreas Färber4917cf42013-05-27 05:17:50 +02001558 return current_cpu && qemu_cpu_is_self(current_cpu);
Juan Quintelaaa723c22012-09-18 16:30:11 +02001559}
1560
/* Per-thread flag: true while this thread holds the iothread lock taken
 * through qemu_mutex_lock_iothread().  Static storage starts out false. */
static __thread bool iothread_locked;

/* Report whether the calling thread currently holds the iothread lock. */
bool qemu_mutex_iothread_locked(void)
{
    bool held = iothread_locked;

    return held;
}
1567
Blue Swirl296af7c2010-03-29 19:23:50 +00001568void qemu_mutex_lock_iothread(void)
1569{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001570 g_assert(!qemu_mutex_iothread_locked());
1571 qemu_mutex_lock(&qemu_global_mutex);
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001572 iothread_locked = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001573}
1574
1575void qemu_mutex_unlock_iothread(void)
1576{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001577 g_assert(qemu_mutex_iothread_locked());
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001578 iothread_locked = false;
Blue Swirl296af7c2010-03-29 19:23:50 +00001579 qemu_mutex_unlock(&qemu_global_mutex);
1580}
1581
Alex Bennéee8faee02016-10-27 16:09:58 +01001582static bool all_vcpus_paused(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001583{
Andreas Färberbdc44642013-06-24 23:50:24 +02001584 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001585
Andreas Färberbdc44642013-06-24 23:50:24 +02001586 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001587 if (!cpu->stopped) {
Alex Bennéee8faee02016-10-27 16:09:58 +01001588 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001589 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001590 }
1591
Alex Bennéee8faee02016-10-27 16:09:58 +01001592 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001593}
1594
1595void pause_all_vcpus(void)
1596{
Andreas Färberbdc44642013-06-24 23:50:24 +02001597 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001598
Alex Bligh40daca52013-08-21 16:03:02 +01001599 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, false);
Andreas Färberbdc44642013-06-24 23:50:24 +02001600 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001601 cpu->stop = true;
1602 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001603 }
1604
Juan Quintelaaa723c22012-09-18 16:30:11 +02001605 if (qemu_in_vcpu_thread()) {
Jan Kiszkad798e972012-02-17 18:31:16 +01001606 cpu_stop_current();
Jan Kiszkad798e972012-02-17 18:31:16 +01001607 }
1608
Blue Swirl296af7c2010-03-29 19:23:50 +00001609 while (!all_vcpus_paused()) {
Paolo Bonzinibe7d6c52011-03-12 17:44:02 +01001610 qemu_cond_wait(&qemu_pause_cond, &qemu_global_mutex);
Andreas Färberbdc44642013-06-24 23:50:24 +02001611 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001612 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001613 }
1614 }
1615}
1616
Igor Mammedov29936832013-04-23 10:29:37 +02001617void cpu_resume(CPUState *cpu)
1618{
1619 cpu->stop = false;
1620 cpu->stopped = false;
1621 qemu_cpu_kick(cpu);
1622}
1623
Blue Swirl296af7c2010-03-29 19:23:50 +00001624void resume_all_vcpus(void)
1625{
Andreas Färberbdc44642013-06-24 23:50:24 +02001626 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001627
Alex Bligh40daca52013-08-21 16:03:02 +01001628 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, true);
Andreas Färberbdc44642013-06-24 23:50:24 +02001629 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001630 cpu_resume(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001631 }
1632}
1633
Gu Zheng4c055ab2016-05-12 09:18:13 +05301634void cpu_remove(CPUState *cpu)
1635{
1636 cpu->stop = true;
1637 cpu->unplug = true;
1638 qemu_cpu_kick(cpu);
1639}
1640
Bharata B Rao2c579042016-05-12 09:18:14 +05301641void cpu_remove_sync(CPUState *cpu)
1642{
1643 cpu_remove(cpu);
1644 while (cpu->created) {
1645 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1646 }
1647}
1648
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001649/* For temporary buffers for forming a name */
1650#define VCPU_THREAD_NAME_SIZE 16
1651
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001652static void qemu_tcg_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001653{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001654 char thread_name[VCPU_THREAD_NAME_SIZE];
Alex Bennée37257942017-02-23 18:29:14 +00001655 static QemuCond *single_tcg_halt_cond;
1656 static QemuThread *single_tcg_cpu_thread;
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001657
Alex Bennée37257942017-02-23 18:29:14 +00001658 if (qemu_tcg_mttcg_enabled() || !single_tcg_cpu_thread) {
Andreas Färber814e6122012-05-02 17:00:37 +02001659 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001660 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1661 qemu_cond_init(cpu->halt_cond);
Alex Bennée37257942017-02-23 18:29:14 +00001662
1663 if (qemu_tcg_mttcg_enabled()) {
1664 /* create a thread per vCPU with TCG (MTTCG) */
1665 parallel_cpus = true;
1666 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/TCG",
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001667 cpu->cpu_index);
Alex Bennée37257942017-02-23 18:29:14 +00001668
1669 qemu_thread_create(cpu->thread, thread_name, qemu_tcg_cpu_thread_fn,
1670 cpu, QEMU_THREAD_JOINABLE);
1671
1672 } else {
1673 /* share a single thread for all cpus with TCG */
1674 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "ALL CPUs/TCG");
1675 qemu_thread_create(cpu->thread, thread_name,
1676 qemu_tcg_rr_cpu_thread_fn,
1677 cpu, QEMU_THREAD_JOINABLE);
1678
1679 single_tcg_halt_cond = cpu->halt_cond;
1680 single_tcg_cpu_thread = cpu->thread;
1681 }
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001682#ifdef _WIN32
Andreas Färber814e6122012-05-02 17:00:37 +02001683 cpu->hThread = qemu_thread_get_handle(cpu->thread);
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001684#endif
Andreas Färber61a46212012-05-02 22:49:36 +02001685 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001686 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001687 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001688 } else {
Alex Bennée37257942017-02-23 18:29:14 +00001689 /* For non-MTTCG cases we share the thread */
1690 cpu->thread = single_tcg_cpu_thread;
1691 cpu->halt_cond = single_tcg_halt_cond;
Blue Swirl296af7c2010-03-29 19:23:50 +00001692 }
1693}
1694
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001695static void qemu_hax_start_vcpu(CPUState *cpu)
1696{
1697 char thread_name[VCPU_THREAD_NAME_SIZE];
1698
1699 cpu->thread = g_malloc0(sizeof(QemuThread));
1700 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1701 qemu_cond_init(cpu->halt_cond);
1702
1703 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/HAX",
1704 cpu->cpu_index);
1705 qemu_thread_create(cpu->thread, thread_name, qemu_hax_cpu_thread_fn,
1706 cpu, QEMU_THREAD_JOINABLE);
1707#ifdef _WIN32
1708 cpu->hThread = qemu_thread_get_handle(cpu->thread);
1709#endif
1710 while (!cpu->created) {
1711 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1712 }
1713}
1714
Andreas Färber48a106b2013-05-27 02:20:39 +02001715static void qemu_kvm_start_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001716{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001717 char thread_name[VCPU_THREAD_NAME_SIZE];
1718
Andreas Färber814e6122012-05-02 17:00:37 +02001719 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001720 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1721 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001722 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/KVM",
1723 cpu->cpu_index);
1724 qemu_thread_create(cpu->thread, thread_name, qemu_kvm_cpu_thread_fn,
1725 cpu, QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001726 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001727 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001728 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001729}
1730
Andreas Färber10a90212013-05-27 02:24:35 +02001731static void qemu_dummy_start_vcpu(CPUState *cpu)
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001732{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001733 char thread_name[VCPU_THREAD_NAME_SIZE];
1734
Andreas Färber814e6122012-05-02 17:00:37 +02001735 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001736 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1737 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001738 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/DUMMY",
1739 cpu->cpu_index);
1740 qemu_thread_create(cpu->thread, thread_name, qemu_dummy_cpu_thread_fn, cpu,
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001741 QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001742 while (!cpu->created) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001743 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1744 }
1745}
1746
Andreas Färberc643bed2013-05-27 03:23:24 +02001747void qemu_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001748{
Andreas Färberce3960e2012-12-17 03:27:07 +01001749 cpu->nr_cores = smp_cores;
1750 cpu->nr_threads = smp_threads;
Andreas Färberf324e762012-05-02 23:26:21 +02001751 cpu->stopped = true;
Peter Maydell56943e82016-01-21 14:15:04 +00001752
1753 if (!cpu->as) {
1754 /* If the target cpu hasn't set up any address spaces itself,
1755 * give it the default one.
1756 */
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001757 AddressSpace *as = address_space_init_shareable(cpu->memory,
1758 "cpu-memory");
Peter Maydell12ebc9a2016-01-21 14:15:04 +00001759 cpu->num_ases = 1;
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001760 cpu_address_space_init(cpu, as, 0);
Peter Maydell56943e82016-01-21 14:15:04 +00001761 }
1762
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001763 if (kvm_enabled()) {
Andreas Färber48a106b2013-05-27 02:20:39 +02001764 qemu_kvm_start_vcpu(cpu);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001765 } else if (hax_enabled()) {
1766 qemu_hax_start_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001767 } else if (tcg_enabled()) {
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001768 qemu_tcg_init_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001769 } else {
Andreas Färber10a90212013-05-27 02:24:35 +02001770 qemu_dummy_start_vcpu(cpu);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001771 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001772}
1773
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001774void cpu_stop_current(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001775{
Andreas Färber4917cf42013-05-27 05:17:50 +02001776 if (current_cpu) {
1777 current_cpu->stop = false;
1778 current_cpu->stopped = true;
1779 cpu_exit(current_cpu);
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001780 qemu_cond_broadcast(&qemu_pause_cond);
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001781 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001782}
1783
Kevin Wolf56983462013-07-05 13:49:54 +02001784int vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +00001785{
Juan Quintelaaa723c22012-09-18 16:30:11 +02001786 if (qemu_in_vcpu_thread()) {
Paolo Bonzini74892d22014-06-05 14:53:58 +02001787 qemu_system_vmstop_request_prepare();
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -03001788 qemu_system_vmstop_request(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001789 /*
1790 * FIXME: should not return to device code in case
1791 * vm_stop() has been requested.
1792 */
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001793 cpu_stop_current();
Kevin Wolf56983462013-07-05 13:49:54 +02001794 return 0;
Blue Swirl296af7c2010-03-29 19:23:50 +00001795 }
Kevin Wolf56983462013-07-05 13:49:54 +02001796
1797 return do_vm_stop(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001798}
1799
Claudio Imbrenda2d76e822017-02-14 18:07:47 +01001800/**
1801 * Prepare for (re)starting the VM.
1802 * Returns -1 if the vCPUs are not to be restarted (e.g. if they are already
1803 * running or in case of an error condition), 0 otherwise.
1804 */
1805int vm_prepare_start(void)
1806{
1807 RunState requested;
1808 int res = 0;
1809
1810 qemu_vmstop_requested(&requested);
1811 if (runstate_is_running() && requested == RUN_STATE__MAX) {
1812 return -1;
1813 }
1814
1815 /* Ensure that a STOP/RESUME pair of events is emitted if a
1816 * vmstop request was pending. The BLOCK_IO_ERROR event, for
1817 * example, according to documentation is always followed by
1818 * the STOP event.
1819 */
1820 if (runstate_is_running()) {
1821 qapi_event_send_stop(&error_abort);
1822 res = -1;
1823 } else {
1824 replay_enable_events();
1825 cpu_enable_ticks();
1826 runstate_set(RUN_STATE_RUNNING);
1827 vm_state_notify(1, RUN_STATE_RUNNING);
1828 }
1829
1830 /* We are sending this now, but the CPUs will be resumed shortly later */
1831 qapi_event_send_resume(&error_abort);
1832 return res;
1833}
1834
/* Start the VM: resume all vCPUs when vm_prepare_start() returns 0. */
void vm_start(void)
{
    if (vm_prepare_start() == 0) {
        resume_all_vcpus();
    }
}
1841
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001842/* does a state transition even if the VM is already stopped,
1843 current state is forgotten forever */
Kevin Wolf56983462013-07-05 13:49:54 +02001844int vm_stop_force_state(RunState state)
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001845{
1846 if (runstate_is_running()) {
Kevin Wolf56983462013-07-05 13:49:54 +02001847 return vm_stop(state);
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001848 } else {
1849 runstate_set(state);
Wen Congyangb2780d32015-11-20 17:34:38 +08001850
1851 bdrv_drain_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +02001852 /* Make sure to return an error if the flush in a previous vm_stop()
1853 * failed. */
John Snow22af08e2016-09-22 21:45:51 -04001854 return bdrv_flush_all();
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001855 }
1856}
1857
Stefan Weil9a78eea2010-10-22 23:03:33 +02001858void list_cpus(FILE *f, fprintf_function cpu_fprintf, const char *optarg)
Blue Swirl262353c2010-05-04 19:55:35 +00001859{
1860 /* XXX: implement xxx_cpu_list for targets that still miss it */
Peter Maydelle916cbf2012-09-05 17:41:08 -03001861#if defined(cpu_list)
1862 cpu_list(f, cpu_fprintf);
Blue Swirl262353c2010-05-04 19:55:35 +00001863#endif
1864}
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001865
1866CpuInfoList *qmp_query_cpus(Error **errp)
1867{
1868 CpuInfoList *head = NULL, *cur_item = NULL;
Andreas Färber182735e2013-05-29 22:29:20 +02001869 CPUState *cpu;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001870
Andreas Färberbdc44642013-06-24 23:50:24 +02001871 CPU_FOREACH(cpu) {
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001872 CpuInfoList *info;
Andreas Färber182735e2013-05-29 22:29:20 +02001873#if defined(TARGET_I386)
1874 X86CPU *x86_cpu = X86_CPU(cpu);
1875 CPUX86State *env = &x86_cpu->env;
1876#elif defined(TARGET_PPC)
1877 PowerPCCPU *ppc_cpu = POWERPC_CPU(cpu);
1878 CPUPPCState *env = &ppc_cpu->env;
1879#elif defined(TARGET_SPARC)
1880 SPARCCPU *sparc_cpu = SPARC_CPU(cpu);
1881 CPUSPARCState *env = &sparc_cpu->env;
1882#elif defined(TARGET_MIPS)
1883 MIPSCPU *mips_cpu = MIPS_CPU(cpu);
1884 CPUMIPSState *env = &mips_cpu->env;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001885#elif defined(TARGET_TRICORE)
1886 TriCoreCPU *tricore_cpu = TRICORE_CPU(cpu);
1887 CPUTriCoreState *env = &tricore_cpu->env;
Andreas Färber182735e2013-05-29 22:29:20 +02001888#endif
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001889
Andreas Färbercb446ec2013-05-01 14:24:52 +02001890 cpu_synchronize_state(cpu);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001891
1892 info = g_malloc0(sizeof(*info));
1893 info->value = g_malloc0(sizeof(*info->value));
Andreas Färber55e5c282012-12-17 06:18:02 +01001894 info->value->CPU = cpu->cpu_index;
Andreas Färber182735e2013-05-29 22:29:20 +02001895 info->value->current = (cpu == first_cpu);
Andreas Färber259186a2013-01-17 18:51:17 +01001896 info->value->halted = cpu->halted;
Eduardo Habkost58f88d42015-05-08 16:04:22 -03001897 info->value->qom_path = object_get_canonical_path(OBJECT(cpu));
Andreas Färber9f09e182012-05-03 06:59:07 +02001898 info->value->thread_id = cpu->thread_id;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001899#if defined(TARGET_I386)
Eric Blake86f4b682015-11-18 01:52:59 -07001900 info->value->arch = CPU_INFO_ARCH_X86;
Eric Blake544a3732016-02-17 23:48:27 -07001901 info->value->u.x86.pc = env->eip + env->segs[R_CS].base;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001902#elif defined(TARGET_PPC)
Eric Blake86f4b682015-11-18 01:52:59 -07001903 info->value->arch = CPU_INFO_ARCH_PPC;
Eric Blake544a3732016-02-17 23:48:27 -07001904 info->value->u.ppc.nip = env->nip;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001905#elif defined(TARGET_SPARC)
Eric Blake86f4b682015-11-18 01:52:59 -07001906 info->value->arch = CPU_INFO_ARCH_SPARC;
Eric Blake544a3732016-02-17 23:48:27 -07001907 info->value->u.q_sparc.pc = env->pc;
1908 info->value->u.q_sparc.npc = env->npc;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001909#elif defined(TARGET_MIPS)
Eric Blake86f4b682015-11-18 01:52:59 -07001910 info->value->arch = CPU_INFO_ARCH_MIPS;
Eric Blake544a3732016-02-17 23:48:27 -07001911 info->value->u.q_mips.PC = env->active_tc.PC;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001912#elif defined(TARGET_TRICORE)
Eric Blake86f4b682015-11-18 01:52:59 -07001913 info->value->arch = CPU_INFO_ARCH_TRICORE;
Eric Blake544a3732016-02-17 23:48:27 -07001914 info->value->u.tricore.PC = env->PC;
Eric Blake86f4b682015-11-18 01:52:59 -07001915#else
1916 info->value->arch = CPU_INFO_ARCH_OTHER;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001917#endif
1918
1919 /* XXX: waiting for the qapi to support GSList */
1920 if (!cur_item) {
1921 head = cur_item = info;
1922 } else {
1923 cur_item->next = info;
1924 cur_item = info;
1925 }
1926 }
1927
1928 return head;
1929}
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001930
1931void qmp_memsave(int64_t addr, int64_t size, const char *filename,
1932 bool has_cpu, int64_t cpu_index, Error **errp)
1933{
1934 FILE *f;
1935 uint32_t l;
Andreas Färber55e5c282012-12-17 06:18:02 +01001936 CPUState *cpu;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001937 uint8_t buf[1024];
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001938 int64_t orig_addr = addr, orig_size = size;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001939
1940 if (!has_cpu) {
1941 cpu_index = 0;
1942 }
1943
Andreas Färber151d1322013-02-15 15:41:49 +01001944 cpu = qemu_get_cpu(cpu_index);
1945 if (cpu == NULL) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001946 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "cpu-index",
1947 "a CPU number");
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001948 return;
1949 }
1950
1951 f = fopen(filename, "wb");
1952 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001953 error_setg_file_open(errp, errno, filename);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001954 return;
1955 }
1956
1957 while (size != 0) {
1958 l = sizeof(buf);
1959 if (l > size)
1960 l = size;
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301961 if (cpu_memory_rw_debug(cpu, addr, buf, l, 0) != 0) {
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001962 error_setg(errp, "Invalid addr 0x%016" PRIx64 "/size %" PRId64
1963 " specified", orig_addr, orig_size);
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301964 goto exit;
1965 }
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001966 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001967 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001968 goto exit;
1969 }
1970 addr += l;
1971 size -= l;
1972 }
1973
1974exit:
1975 fclose(f);
1976}
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001977
1978void qmp_pmemsave(int64_t addr, int64_t size, const char *filename,
1979 Error **errp)
1980{
1981 FILE *f;
1982 uint32_t l;
1983 uint8_t buf[1024];
1984
1985 f = fopen(filename, "wb");
1986 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001987 error_setg_file_open(errp, errno, filename);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001988 return;
1989 }
1990
1991 while (size != 0) {
1992 l = sizeof(buf);
1993 if (l > size)
1994 l = size;
Stefan Weileb6282f2014-04-07 20:28:23 +02001995 cpu_physical_memory_read(addr, buf, l);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001996 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001997 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001998 goto exit;
1999 }
2000 addr += l;
2001 size -= l;
2002 }
2003
2004exit:
2005 fclose(f);
2006}
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02002007
2008void qmp_inject_nmi(Error **errp)
2009{
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +10002010 nmi_monitor_handle(monitor_get_cpu_index(), errp);
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02002011}
Sebastian Tanase27498be2014-07-25 11:56:33 +02002012
2013void dump_drift_info(FILE *f, fprintf_function cpu_fprintf)
2014{
2015 if (!use_icount) {
2016 return;
2017 }
2018
2019 cpu_fprintf(f, "Host - Guest clock %"PRIi64" ms\n",
2020 (cpu_get_clock() - cpu_get_icount())/SCALE_MS);
2021 if (icount_align_option) {
2022 cpu_fprintf(f, "Max guest delay %"PRIi64" ms\n", -max_delay/SCALE_MS);
2023 cpu_fprintf(f, "Max guest advance %"PRIi64" ms\n", max_advance/SCALE_MS);
2024 } else {
2025 cpu_fprintf(f, "Max guest delay NA\n");
2026 cpu_fprintf(f, "Max guest advance NA\n");
2027 }
2028}