blob: 0ecb0b87f0b6a3a2d52fc61f409a2ad483406809 [file] [log] [blame]
Blue Swirl296af7c2010-03-29 19:23:50 +00001/*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24
25/* Needed early for CONFIG_BSD etc. */
Peter Maydell7b31bbc2016-01-26 18:16:56 +000026#include "qemu/osdep.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010027#include "qemu-common.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000028#include "qemu/config-file.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010029#include "cpu.h"
Paolo Bonzini83c90892012-12-17 18:19:49 +010030#include "monitor/monitor.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020031#include "qapi/qmp/qerror.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010032#include "qemu/error-report.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010033#include "sysemu/sysemu.h"
Max Reitzda31d592016-03-16 19:54:32 +010034#include "sysemu/block-backend.h"
Paolo Bonzini022c62c2012-12-17 18:19:49 +010035#include "exec/gdbstub.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010036#include "sysemu/dma.h"
Vincent Palatinb3946622017-01-10 11:59:55 +010037#include "sysemu/hw_accel.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010038#include "sysemu/kvm.h"
Vincent Palatinb0cb0a62017-01-10 11:59:57 +010039#include "sysemu/hax.h"
Luiz Capitulinode0b36b2011-09-21 16:38:35 -030040#include "qmp-commands.h"
Paolo Bonzini63c91552016-03-15 13:18:37 +010041#include "exec/exec-all.h"
Blue Swirl296af7c2010-03-29 19:23:50 +000042
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010043#include "qemu/thread.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010044#include "sysemu/cpus.h"
45#include "sysemu/qtest.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010046#include "qemu/main-loop.h"
47#include "qemu/bitmap.h"
Liu Ping Fancb365642013-09-25 14:20:58 +080048#include "qemu/seqlock.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000049#include "tcg.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020050#include "qapi-event.h"
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +100051#include "hw/nmi.h"
Pavel Dovgalyuk8b427042015-09-17 19:24:05 +030052#include "sysemu/replay.h"
Jan Kiszka0ff0fc12011-06-23 10:15:55 +020053
Jan Kiszka6d9cb732011-02-01 22:15:58 +010054#ifdef CONFIG_LINUX
55
56#include <sys/prctl.h>
57
Marcelo Tosattic0532a72010-10-11 15:31:21 -030058#ifndef PR_MCE_KILL
59#define PR_MCE_KILL 33
60#endif
61
Jan Kiszka6d9cb732011-02-01 22:15:58 +010062#ifndef PR_MCE_KILL_SET
63#define PR_MCE_KILL_SET 1
64#endif
65
66#ifndef PR_MCE_KILL_EARLY
67#define PR_MCE_KILL_EARLY 1
68#endif
69
70#endif /* CONFIG_LINUX */
71
Sebastian Tanase27498be2014-07-25 11:56:33 +020072int64_t max_delay;
73int64_t max_advance;
Blue Swirl296af7c2010-03-29 19:23:50 +000074
Jason J. Herne2adcc852015-09-08 13:12:33 -040075/* vcpu throttling controls */
76static QEMUTimer *throttle_timer;
77static unsigned int throttle_percentage;
78
79#define CPU_THROTTLE_PCT_MIN 1
80#define CPU_THROTTLE_PCT_MAX 99
81#define CPU_THROTTLE_TIMESLICE_NS 10000000
82
Tiejun Chen321bc0b2013-08-02 09:43:09 +080083bool cpu_is_stopped(CPUState *cpu)
84{
85 return cpu->stopped || !runstate_is_running();
86}
87
Andreas Färbera98ae1d2013-05-26 23:21:08 +020088static bool cpu_thread_is_idle(CPUState *cpu)
Peter Maydellac873f12012-07-19 16:52:27 +010089{
Andreas Färberc64ca812012-05-03 02:11:45 +020090 if (cpu->stop || cpu->queued_work_first) {
Peter Maydellac873f12012-07-19 16:52:27 +010091 return false;
92 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +080093 if (cpu_is_stopped(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +010094 return true;
95 }
Andreas Färber8c2e1b02013-08-25 18:53:55 +020096 if (!cpu->halted || cpu_has_work(cpu) ||
Alexander Graf215e79c2013-04-24 22:24:12 +020097 kvm_halt_in_kernel()) {
Peter Maydellac873f12012-07-19 16:52:27 +010098 return false;
99 }
100 return true;
101}
102
103static bool all_cpu_threads_idle(void)
104{
Andreas Färber182735e2013-05-29 22:29:20 +0200105 CPUState *cpu;
Peter Maydellac873f12012-07-19 16:52:27 +0100106
Andreas Färberbdc44642013-06-24 23:50:24 +0200107 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200108 if (!cpu_thread_is_idle(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +0100109 return false;
110 }
111 }
112 return true;
113}
114
Blue Swirl296af7c2010-03-29 19:23:50 +0000115/***********************************************************/
Paolo Bonzini946fb272011-09-12 13:57:37 +0200116/* guest cycle counter */
117
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200118/* Protected by TimersState seqlock */
119
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200120static bool icount_sleep = true;
Sebastian Tanase71468392014-07-23 11:47:50 +0200121static int64_t vm_clock_warp_start = -1;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200122/* Conversion factor from emulated instructions to virtual clock ticks. */
123static int icount_time_shift;
124/* Arbitrarily pick 1MIPS as the minimum allowable speed. */
125#define MAX_ICOUNT_SHIFT 10
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200126
Paolo Bonzini946fb272011-09-12 13:57:37 +0200127static QEMUTimer *icount_rt_timer;
128static QEMUTimer *icount_vm_timer;
129static QEMUTimer *icount_warp_timer;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200130
131typedef struct TimersState {
Liu Ping Fancb365642013-09-25 14:20:58 +0800132 /* Protected by BQL. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200133 int64_t cpu_ticks_prev;
134 int64_t cpu_ticks_offset;
Liu Ping Fancb365642013-09-25 14:20:58 +0800135
136 /* cpu_clock_offset can be read out of BQL, so protect it with
137 * this lock.
138 */
139 QemuSeqLock vm_clock_seqlock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200140 int64_t cpu_clock_offset;
141 int32_t cpu_ticks_enabled;
142 int64_t dummy;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200143
144 /* Compensate for varying guest execution speed. */
145 int64_t qemu_icount_bias;
146 /* Only written by TCG thread */
147 int64_t qemu_icount;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200148} TimersState;
149
Liu Ping Fand9cd4002013-07-21 08:43:00 +0000150static TimersState timers_state;
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000151bool mttcg_enabled;
152
153/*
154 * We default to false if we know other options have been enabled
155 * which are currently incompatible with MTTCG. Otherwise when each
156 * guest (target) has been updated to support:
157 * - atomic instructions
158 * - memory ordering primitives (barriers)
159 * they can set the appropriate CONFIG flags in ${target}-softmmu.mak
160 *
161 * Once a guest architecture has been converted to the new primitives
162 * there are two remaining limitations to check.
163 *
164 * - The guest can't be oversized (e.g. 64 bit guest on 32 bit host)
165 * - The host must have a stronger memory order than the guest
166 *
167 * It may be possible in future to support strong guests on weak hosts
168 * but that will require tagging all load/stores in a guest with their
169 * implicit memory order requirements which would likely slow things
170 * down a lot.
171 */
172
/* Return true when every memory-ordering bit in TCG_GUEST_DEFAULT_MO is
 * also present in TCG_TARGET_DEFAULT_MO.  If either macro is missing the
 * answer is conservatively false.
 */
static bool check_tcg_memory_orders_compatible(void)
{
#if !defined(TCG_GUEST_DEFAULT_MO) || !defined(TCG_TARGET_DEFAULT_MO)
    return false;
#else
    return !(TCG_GUEST_DEFAULT_MO & ~TCG_TARGET_DEFAULT_MO);
#endif
}
181
182static bool default_mttcg_enabled(void)
183{
Alex Bennée83fd9622017-02-27 17:09:01 +0000184 if (use_icount || TCG_OVERSIZED_GUEST) {
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000185 return false;
186 } else {
187#ifdef TARGET_SUPPORTS_MTTCG
188 return check_tcg_memory_orders_compatible();
189#else
190 return false;
191#endif
192 }
193}
194
195void qemu_tcg_configure(QemuOpts *opts, Error **errp)
196{
197 const char *t = qemu_opt_get(opts, "thread");
198 if (t) {
199 if (strcmp(t, "multi") == 0) {
200 if (TCG_OVERSIZED_GUEST) {
201 error_setg(errp, "No MTTCG when guest word size > hosts");
Alex Bennée83fd9622017-02-27 17:09:01 +0000202 } else if (use_icount) {
203 error_setg(errp, "No MTTCG when icount is enabled");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000204 } else {
Nikunj A Dadhania86953502017-04-10 11:36:55 +0530205#ifndef TARGET_SUPPORTS_MTTCG
Alex Bennéec34c7622017-02-28 14:40:17 +0000206 error_report("Guest not yet converted to MTTCG - "
207 "you may get unexpected results");
208#endif
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000209 if (!check_tcg_memory_orders_compatible()) {
210 error_report("Guest expects a stronger memory ordering "
211 "than the host provides");
Pranith Kumar8cfef892017-03-25 16:19:23 -0400212 error_printf("This may cause strange/hard to debug errors\n");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000213 }
214 mttcg_enabled = true;
215 }
216 } else if (strcmp(t, "single") == 0) {
217 mttcg_enabled = false;
218 } else {
219 error_setg(errp, "Invalid 'thread' setting %s", t);
220 }
221 } else {
222 mttcg_enabled = default_mttcg_enabled();
223 }
224}
Paolo Bonzini946fb272011-09-12 13:57:37 +0200225
Alex Bennéee4cd9652017-03-31 16:09:42 +0100226/* The current number of executed instructions is based on what we
227 * originally budgeted minus the current state of the decrementing
228 * icount counters in extra/u16.low.
229 */
230static int64_t cpu_get_icount_executed(CPUState *cpu)
231{
232 return cpu->icount_budget - (cpu->icount_decr.u16.low + cpu->icount_extra);
233}
234
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300235int64_t cpu_get_icount_raw(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200236{
237 int64_t icount;
Andreas Färber4917cf42013-05-27 05:17:50 +0200238 CPUState *cpu = current_cpu;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200239
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200240 icount = timers_state.qemu_icount;
Alex Bennée243c5f72017-03-30 18:49:22 +0100241 if (cpu && cpu->running) {
Paolo Bonzini414b15c2015-06-24 14:16:26 +0200242 if (!cpu->can_do_io) {
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300243 fprintf(stderr, "Bad icount read\n");
244 exit(1);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200245 }
Alex Bennéee4cd9652017-03-31 16:09:42 +0100246 /* Take into account what has run */
247 icount += cpu_get_icount_executed(cpu);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200248 }
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300249 return icount;
250}
251
252/* Return the virtual CPU time, based on the instruction counter. */
253static int64_t cpu_get_icount_locked(void)
254{
255 int64_t icount = cpu_get_icount_raw();
KONRAD Frederic3f031312014-08-01 01:37:15 +0200256 return timers_state.qemu_icount_bias + cpu_icount_to_ns(icount);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200257}
258
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200259int64_t cpu_get_icount(void)
260{
261 int64_t icount;
262 unsigned start;
263
264 do {
265 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
266 icount = cpu_get_icount_locked();
267 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
268
269 return icount;
270}
271
KONRAD Frederic3f031312014-08-01 01:37:15 +0200272int64_t cpu_icount_to_ns(int64_t icount)
273{
274 return icount << icount_time_shift;
275}
276
Cao jind90f3cc2016-07-29 19:05:38 +0800277/* return the time elapsed in VM between vm_start and vm_stop. Unless
278 * icount is active, cpu_get_ticks() uses units of the host CPU cycle
279 * counter.
280 *
281 * Caller must hold the BQL
282 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200283int64_t cpu_get_ticks(void)
284{
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100285 int64_t ticks;
286
Paolo Bonzini946fb272011-09-12 13:57:37 +0200287 if (use_icount) {
288 return cpu_get_icount();
289 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100290
291 ticks = timers_state.cpu_ticks_offset;
292 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400293 ticks += cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200294 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100295
296 if (timers_state.cpu_ticks_prev > ticks) {
297 /* Note: non increasing ticks may happen if the host uses
298 software suspend */
299 timers_state.cpu_ticks_offset += timers_state.cpu_ticks_prev - ticks;
300 ticks = timers_state.cpu_ticks_prev;
301 }
302
303 timers_state.cpu_ticks_prev = ticks;
304 return ticks;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200305}
306
Liu Ping Fancb365642013-09-25 14:20:58 +0800307static int64_t cpu_get_clock_locked(void)
308{
Cao jin1d45cea2016-07-29 19:05:37 +0800309 int64_t time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800310
Cao jin1d45cea2016-07-29 19:05:37 +0800311 time = timers_state.cpu_clock_offset;
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100312 if (timers_state.cpu_ticks_enabled) {
Cao jin1d45cea2016-07-29 19:05:37 +0800313 time += get_clock();
Liu Ping Fancb365642013-09-25 14:20:58 +0800314 }
315
Cao jin1d45cea2016-07-29 19:05:37 +0800316 return time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800317}
318
Cao jind90f3cc2016-07-29 19:05:38 +0800319/* Return the monotonic time elapsed in VM, i.e.,
Peter Maydell8212ff82016-09-15 10:24:22 +0100320 * the time between vm_start and vm_stop
321 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200322int64_t cpu_get_clock(void)
323{
324 int64_t ti;
Liu Ping Fancb365642013-09-25 14:20:58 +0800325 unsigned start;
326
327 do {
328 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
329 ti = cpu_get_clock_locked();
330 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
331
332 return ti;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200333}
334
Liu Ping Fancb365642013-09-25 14:20:58 +0800335/* enable cpu_get_ticks()
Cao jin3224e872016-07-08 18:31:37 +0800336 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800337 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200338void cpu_enable_ticks(void)
339{
Liu Ping Fancb365642013-09-25 14:20:58 +0800340 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400341 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200342 if (!timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400343 timers_state.cpu_ticks_offset -= cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200344 timers_state.cpu_clock_offset -= get_clock();
345 timers_state.cpu_ticks_enabled = 1;
346 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400347 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200348}
349
350/* disable cpu_get_ticks() : the clock is stopped. You must not call
Liu Ping Fancb365642013-09-25 14:20:58 +0800351 * cpu_get_ticks() after that.
Cao jin3224e872016-07-08 18:31:37 +0800352 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800353 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200354void cpu_disable_ticks(void)
355{
Liu Ping Fancb365642013-09-25 14:20:58 +0800356 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400357 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200358 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400359 timers_state.cpu_ticks_offset += cpu_get_host_ticks();
Liu Ping Fancb365642013-09-25 14:20:58 +0800360 timers_state.cpu_clock_offset = cpu_get_clock_locked();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200361 timers_state.cpu_ticks_enabled = 0;
362 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400363 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200364}
365
366/* Correlation between real and virtual time is always going to be
367 fairly approximate, so ignore small variation.
368 When the guest is idle real and virtual time will be aligned in
369 the IO wait loop. */
Rutuja Shah73bcb242016-03-21 21:32:30 +0530370#define ICOUNT_WOBBLE (NANOSECONDS_PER_SECOND / 10)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200371
372static void icount_adjust(void)
373{
374 int64_t cur_time;
375 int64_t cur_icount;
376 int64_t delta;
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200377
378 /* Protected by TimersState mutex. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200379 static int64_t last_delta;
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200380
Paolo Bonzini946fb272011-09-12 13:57:37 +0200381 /* If the VM is not running, then do nothing. */
382 if (!runstate_is_running()) {
383 return;
384 }
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200385
Emilio G. Cota03719e42016-06-08 14:55:21 -0400386 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200387 cur_time = cpu_get_clock_locked();
388 cur_icount = cpu_get_icount_locked();
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200389
Paolo Bonzini946fb272011-09-12 13:57:37 +0200390 delta = cur_icount - cur_time;
391 /* FIXME: This is a very crude algorithm, somewhat prone to oscillation. */
392 if (delta > 0
393 && last_delta + ICOUNT_WOBBLE < delta * 2
394 && icount_time_shift > 0) {
395 /* The guest is getting too far ahead. Slow time down. */
396 icount_time_shift--;
397 }
398 if (delta < 0
399 && last_delta - ICOUNT_WOBBLE > delta * 2
400 && icount_time_shift < MAX_ICOUNT_SHIFT) {
401 /* The guest is getting too far behind. Speed time up. */
402 icount_time_shift++;
403 }
404 last_delta = delta;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200405 timers_state.qemu_icount_bias = cur_icount
406 - (timers_state.qemu_icount << icount_time_shift);
Emilio G. Cota03719e42016-06-08 14:55:21 -0400407 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200408}
409
410static void icount_adjust_rt(void *opaque)
411{
Alex Bligh40daca52013-08-21 16:03:02 +0100412 timer_mod(icount_rt_timer,
Pavel Dovgalyuk1979b902015-01-12 15:00:43 +0300413 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200414 icount_adjust();
415}
416
417static void icount_adjust_vm(void *opaque)
418{
Alex Bligh40daca52013-08-21 16:03:02 +0100419 timer_mod(icount_vm_timer,
420 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530421 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200422 icount_adjust();
423}
424
425static int64_t qemu_icount_round(int64_t count)
426{
427 return (count + (1 << icount_time_shift) - 1) >> icount_time_shift;
428}
429
Pavel Dovgalyukefab87c2015-09-17 19:24:39 +0300430static void icount_warp_rt(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200431{
Alex Bennéeccffff42016-04-04 15:35:48 +0100432 unsigned seq;
433 int64_t warp_start;
434
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200435 /* The icount_warp_timer is rescheduled soon after vm_clock_warp_start
436 * changes from -1 to another value, so the race here is okay.
437 */
Alex Bennéeccffff42016-04-04 15:35:48 +0100438 do {
439 seq = seqlock_read_begin(&timers_state.vm_clock_seqlock);
440 warp_start = vm_clock_warp_start;
441 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, seq));
442
443 if (warp_start == -1) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200444 return;
445 }
446
Emilio G. Cota03719e42016-06-08 14:55:21 -0400447 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200448 if (runstate_is_running()) {
Pavel Dovgalyuk8eda2062015-09-17 19:24:28 +0300449 int64_t clock = REPLAY_CLOCK(REPLAY_CLOCK_VIRTUAL_RT,
450 cpu_get_clock_locked());
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200451 int64_t warp_delta;
452
453 warp_delta = clock - vm_clock_warp_start;
454 if (use_icount == 2) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200455 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100456 * In adaptive mode, do not let QEMU_CLOCK_VIRTUAL run too
Paolo Bonzini946fb272011-09-12 13:57:37 +0200457 * far ahead of real time.
458 */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200459 int64_t cur_icount = cpu_get_icount_locked();
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300460 int64_t delta = clock - cur_icount;
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200461 warp_delta = MIN(warp_delta, delta);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200462 }
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200463 timers_state.qemu_icount_bias += warp_delta;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200464 }
465 vm_clock_warp_start = -1;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400466 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200467
468 if (qemu_clock_expired(QEMU_CLOCK_VIRTUAL)) {
469 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
470 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200471}
472
/* Callback for icount_warp_timer: simply account for the pending warp.
 * No replay checkpoint is needed here because the timer already
 * synchronizes with CHECKPOINT_CLOCK_VIRTUAL_RT.
 */
static void icount_timer_cb(void *opaque)
{
    icount_warp_rt();
}
480
Paolo Bonzini8156be52012-03-28 15:42:04 +0200481void qtest_clock_warp(int64_t dest)
482{
Alex Bligh40daca52013-08-21 16:03:02 +0100483 int64_t clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800484 AioContext *aio_context;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200485 assert(qtest_enabled());
Fam Zhengefef88b2015-01-19 17:51:43 +0800486 aio_context = qemu_get_aio_context();
Paolo Bonzini8156be52012-03-28 15:42:04 +0200487 while (clock < dest) {
Alex Bligh40daca52013-08-21 16:03:02 +0100488 int64_t deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Sergey Fedorovc9299e22014-06-10 13:10:28 +0400489 int64_t warp = qemu_soonest_timeout(dest - clock, deadline);
Fam Zhengefef88b2015-01-19 17:51:43 +0800490
Emilio G. Cota03719e42016-06-08 14:55:21 -0400491 seqlock_write_begin(&timers_state.vm_clock_seqlock);
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200492 timers_state.qemu_icount_bias += warp;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400493 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200494
Alex Bligh40daca52013-08-21 16:03:02 +0100495 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800496 timerlist_run_timers(aio_context->tlg.tl[QEMU_CLOCK_VIRTUAL]);
Alex Bligh40daca52013-08-21 16:03:02 +0100497 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200498 }
Alex Bligh40daca52013-08-21 16:03:02 +0100499 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200500}
501
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300502void qemu_start_warp_timer(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200503{
Paolo Bonzinice78d182013-10-07 17:30:02 +0200504 int64_t clock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200505 int64_t deadline;
506
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300507 if (!use_icount) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200508 return;
509 }
510
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300511 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
512 * do not fire, so computing the deadline does not make sense.
513 */
514 if (!runstate_is_running()) {
515 return;
516 }
517
518 /* warp clock deterministically in record/replay mode */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300519 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_START)) {
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300520 return;
521 }
522
Paolo Bonzinice78d182013-10-07 17:30:02 +0200523 if (!all_cpu_threads_idle()) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200524 return;
525 }
526
Paolo Bonzini8156be52012-03-28 15:42:04 +0200527 if (qtest_enabled()) {
528 /* When testing, qtest commands advance icount. */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300529 return;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200530 }
531
Alex Blighac70aaf2013-08-21 16:02:57 +0100532 /* We want to use the earliest deadline from ALL vm_clocks */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300533 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT);
Alex Bligh40daca52013-08-21 16:03:02 +0100534 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200535 if (deadline < 0) {
Victor CLEMENTd7a0f712015-05-29 17:14:06 +0200536 static bool notified;
537 if (!icount_sleep && !notified) {
538 error_report("WARNING: icount sleep disabled and no active timers");
539 notified = true;
540 }
Paolo Bonzinice78d182013-10-07 17:30:02 +0200541 return;
Alex Blighac70aaf2013-08-21 16:02:57 +0100542 }
543
Paolo Bonzini946fb272011-09-12 13:57:37 +0200544 if (deadline > 0) {
545 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100546 * Ensure QEMU_CLOCK_VIRTUAL proceeds even when the virtual CPU goes to
Paolo Bonzini946fb272011-09-12 13:57:37 +0200547 * sleep. Otherwise, the CPU might be waiting for a future timer
548 * interrupt to wake it up, but the interrupt never comes because
549 * the vCPU isn't running any insns and thus doesn't advance the
Alex Bligh40daca52013-08-21 16:03:02 +0100550 * QEMU_CLOCK_VIRTUAL.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200551 */
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200552 if (!icount_sleep) {
553 /*
554 * We never let VCPUs sleep in no sleep icount mode.
555 * If there is a pending QEMU_CLOCK_VIRTUAL timer we just advance
556 * to the next QEMU_CLOCK_VIRTUAL event and notify it.
557 * It is useful when we want a deterministic execution time,
558 * isolated from host latencies.
559 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400560 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200561 timers_state.qemu_icount_bias += deadline;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400562 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200563 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
564 } else {
565 /*
566 * We do stop VCPUs and only advance QEMU_CLOCK_VIRTUAL after some
567 * "real" time, (related to the time left until the next event) has
568 * passed. The QEMU_CLOCK_VIRTUAL_RT clock will do this.
569 * This avoids that the warps are visible externally; for example,
570 * you will not be sending network packets continuously instead of
571 * every 100ms.
572 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400573 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200574 if (vm_clock_warp_start == -1 || vm_clock_warp_start > clock) {
575 vm_clock_warp_start = clock;
576 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400577 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200578 timer_mod_anticipate(icount_warp_timer, clock + deadline);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200579 }
Alex Blighac70aaf2013-08-21 16:02:57 +0100580 } else if (deadline == 0) {
Alex Bligh40daca52013-08-21 16:03:02 +0100581 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200582 }
583}
584
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300585static void qemu_account_warp_timer(void)
586{
587 if (!use_icount || !icount_sleep) {
588 return;
589 }
590
591 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
592 * do not fire, so computing the deadline does not make sense.
593 */
594 if (!runstate_is_running()) {
595 return;
596 }
597
598 /* warp clock deterministically in record/replay mode */
599 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_ACCOUNT)) {
600 return;
601 }
602
603 timer_del(icount_warp_timer);
604 icount_warp_rt();
605}
606
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200607static bool icount_state_needed(void *opaque)
608{
609 return use_icount;
610}
611
612/*
613 * This is a subsection for icount migration.
614 */
615static const VMStateDescription icount_vmstate_timers = {
616 .name = "timer/icount",
617 .version_id = 1,
618 .minimum_version_id = 1,
Juan Quintela5cd8cad2014-09-23 14:09:54 +0200619 .needed = icount_state_needed,
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200620 .fields = (VMStateField[]) {
621 VMSTATE_INT64(qemu_icount_bias, TimersState),
622 VMSTATE_INT64(qemu_icount, TimersState),
623 VMSTATE_END_OF_LIST()
624 }
625};
626
Paolo Bonzini946fb272011-09-12 13:57:37 +0200627static const VMStateDescription vmstate_timers = {
628 .name = "timer",
629 .version_id = 2,
630 .minimum_version_id = 1,
Juan Quintela35d08452014-04-16 16:01:33 +0200631 .fields = (VMStateField[]) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200632 VMSTATE_INT64(cpu_ticks_offset, TimersState),
633 VMSTATE_INT64(dummy, TimersState),
634 VMSTATE_INT64_V(cpu_clock_offset, TimersState, 2),
635 VMSTATE_END_OF_LIST()
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200636 },
Juan Quintela5cd8cad2014-09-23 14:09:54 +0200637 .subsections = (const VMStateDescription*[]) {
638 &icount_vmstate_timers,
639 NULL
Paolo Bonzini946fb272011-09-12 13:57:37 +0200640 }
641};
642
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100643static void cpu_throttle_thread(CPUState *cpu, run_on_cpu_data opaque)
Jason J. Herne2adcc852015-09-08 13:12:33 -0400644{
Jason J. Herne2adcc852015-09-08 13:12:33 -0400645 double pct;
646 double throttle_ratio;
647 long sleeptime_ns;
648
649 if (!cpu_throttle_get_percentage()) {
650 return;
651 }
652
653 pct = (double)cpu_throttle_get_percentage()/100;
654 throttle_ratio = pct / (1 - pct);
655 sleeptime_ns = (long)(throttle_ratio * CPU_THROTTLE_TIMESLICE_NS);
656
657 qemu_mutex_unlock_iothread();
658 atomic_set(&cpu->throttle_thread_scheduled, 0);
659 g_usleep(sleeptime_ns / 1000); /* Convert ns to us for usleep call */
660 qemu_mutex_lock_iothread();
661}
662
663static void cpu_throttle_timer_tick(void *opaque)
664{
665 CPUState *cpu;
666 double pct;
667
668 /* Stop the timer if needed */
669 if (!cpu_throttle_get_percentage()) {
670 return;
671 }
672 CPU_FOREACH(cpu) {
673 if (!atomic_xchg(&cpu->throttle_thread_scheduled, 1)) {
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100674 async_run_on_cpu(cpu, cpu_throttle_thread,
675 RUN_ON_CPU_NULL);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400676 }
677 }
678
679 pct = (double)cpu_throttle_get_percentage()/100;
680 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
681 CPU_THROTTLE_TIMESLICE_NS / (1-pct));
682}
683
684void cpu_throttle_set(int new_throttle_pct)
685{
686 /* Ensure throttle percentage is within valid range */
687 new_throttle_pct = MIN(new_throttle_pct, CPU_THROTTLE_PCT_MAX);
688 new_throttle_pct = MAX(new_throttle_pct, CPU_THROTTLE_PCT_MIN);
689
690 atomic_set(&throttle_percentage, new_throttle_pct);
691
692 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
693 CPU_THROTTLE_TIMESLICE_NS);
694}
695
696void cpu_throttle_stop(void)
697{
698 atomic_set(&throttle_percentage, 0);
699}
700
/* Return true while a non-zero throttle percentage is set. */
bool cpu_throttle_active(void)
{
    int pct = cpu_throttle_get_percentage();

    return pct != 0;
}
705
706int cpu_throttle_get_percentage(void)
707{
708 return atomic_read(&throttle_percentage);
709}
710
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400711void cpu_ticks_init(void)
712{
Emilio G. Cotaccdb3c12016-06-08 14:55:20 -0400713 seqlock_init(&timers_state.vm_clock_seqlock);
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400714 vmstate_register(NULL, 0, &vmstate_timers, &timers_state);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400715 throttle_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
716 cpu_throttle_timer_tick, NULL);
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400717}
718
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200719void configure_icount(QemuOpts *opts, Error **errp)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200720{
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200721 const char *option;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200722 char *rem_str = NULL;
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200723
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200724 option = qemu_opt_get(opts, "shift");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200725 if (!option) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200726 if (qemu_opt_get(opts, "align") != NULL) {
727 error_setg(errp, "Please specify shift option when using align");
728 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200729 return;
730 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200731
732 icount_sleep = qemu_opt_get_bool(opts, "sleep", true);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200733 if (icount_sleep) {
734 icount_warp_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300735 icount_timer_cb, NULL);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200736 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200737
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200738 icount_align_option = qemu_opt_get_bool(opts, "align", false);
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200739
740 if (icount_align_option && !icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500741 error_setg(errp, "align=on and sleep=off are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200742 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200743 if (strcmp(option, "auto") != 0) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200744 errno = 0;
745 icount_time_shift = strtol(option, &rem_str, 0);
746 if (errno != 0 || *rem_str != '\0' || !strlen(option)) {
747 error_setg(errp, "icount: Invalid shift value");
748 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200749 use_icount = 1;
750 return;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200751 } else if (icount_align_option) {
752 error_setg(errp, "shift=auto and align=on are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200753 } else if (!icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500754 error_setg(errp, "shift=auto and sleep=off are incompatible");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200755 }
756
757 use_icount = 2;
758
759 /* 125MIPS seems a reasonable initial guess at the guest speed.
760 It will be corrected fairly quickly anyway. */
761 icount_time_shift = 3;
762
763 /* Have both realtime and virtual time triggers for speed adjustment.
764 The realtime trigger catches emulated time passing too slowly,
765 the virtual time trigger catches emulated time passing too fast.
766 Realtime triggers occur even when idle, so use them less frequently
767 than VM triggers. */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300768 icount_rt_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL_RT,
769 icount_adjust_rt, NULL);
Alex Bligh40daca52013-08-21 16:03:02 +0100770 timer_mod(icount_rt_timer,
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300771 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Alex Bligh40daca52013-08-21 16:03:02 +0100772 icount_vm_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
773 icount_adjust_vm, NULL);
774 timer_mod(icount_vm_timer,
775 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530776 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200777}
778
779/***********************************************************/
/* TCG vCPU kick timer
 *
 * The kick timer is responsible for moving single threaded vCPU
 * emulation on to the next vCPU. If more than one vCPU is running, a
 * timer event will force a cpu->exit so the next vCPU can get
 * scheduled.
 *
 * The timer is removed if all vCPUs are idle and restarted again once
 * idleness is complete.
 */
790
791static QEMUTimer *tcg_kick_vcpu_timer;
Alex Bennée791158d2017-02-23 18:29:10 +0000792static CPUState *tcg_current_rr_cpu;
Alex Bennée65467062017-02-23 18:29:09 +0000793
794#define TCG_KICK_PERIOD (NANOSECONDS_PER_SECOND / 10)
795
796static inline int64_t qemu_tcg_next_kick(void)
797{
798 return qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + TCG_KICK_PERIOD;
799}
800
Alex Bennée791158d2017-02-23 18:29:10 +0000801/* Kick the currently round-robin scheduled vCPU */
802static void qemu_cpu_kick_rr_cpu(void)
803{
804 CPUState *cpu;
Alex Bennée791158d2017-02-23 18:29:10 +0000805 do {
806 cpu = atomic_mb_read(&tcg_current_rr_cpu);
807 if (cpu) {
808 cpu_exit(cpu);
809 }
810 } while (cpu != atomic_mb_read(&tcg_current_rr_cpu));
811}
812
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100813static void do_nothing(CPUState *cpu, run_on_cpu_data unused)
814{
815}
816
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100817void qemu_timer_notify_cb(void *opaque, QEMUClockType type)
818{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100819 if (!use_icount || type != QEMU_CLOCK_VIRTUAL) {
820 qemu_notify_event();
821 return;
822 }
823
824 if (!qemu_in_vcpu_thread() && first_cpu) {
825 /* qemu_cpu_kick is not enough to kick a halted CPU out of
826 * qemu_tcg_wait_io_event. async_run_on_cpu, instead,
827 * causes cpu_thread_is_idle to return false. This way,
828 * handle_icount_deadline can run.
829 */
830 async_run_on_cpu(first_cpu, do_nothing, RUN_ON_CPU_NULL);
831 }
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100832}
833
Alex Bennée65467062017-02-23 18:29:09 +0000834static void kick_tcg_thread(void *opaque)
835{
836 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
Alex Bennée791158d2017-02-23 18:29:10 +0000837 qemu_cpu_kick_rr_cpu();
Alex Bennée65467062017-02-23 18:29:09 +0000838}
839
840static void start_tcg_kick_timer(void)
841{
Alex Bennée37257942017-02-23 18:29:14 +0000842 if (!mttcg_enabled && !tcg_kick_vcpu_timer && CPU_NEXT(first_cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +0000843 tcg_kick_vcpu_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
844 kick_tcg_thread, NULL);
845 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
846 }
847}
848
849static void stop_tcg_kick_timer(void)
850{
851 if (tcg_kick_vcpu_timer) {
852 timer_del(tcg_kick_vcpu_timer);
853 tcg_kick_vcpu_timer = NULL;
854 }
855}
856
Alex Bennée65467062017-02-23 18:29:09 +0000857/***********************************************************/
Blue Swirl296af7c2010-03-29 19:23:50 +0000858void hw_error(const char *fmt, ...)
859{
860 va_list ap;
Andreas Färber55e5c282012-12-17 06:18:02 +0100861 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000862
863 va_start(ap, fmt);
864 fprintf(stderr, "qemu: hardware error: ");
865 vfprintf(stderr, fmt, ap);
866 fprintf(stderr, "\n");
Andreas Färberbdc44642013-06-24 23:50:24 +0200867 CPU_FOREACH(cpu) {
Andreas Färber55e5c282012-12-17 06:18:02 +0100868 fprintf(stderr, "CPU #%d:\n", cpu->cpu_index);
Andreas Färber878096e2013-05-27 01:33:50 +0200869 cpu_dump_state(cpu, stderr, fprintf, CPU_DUMP_FPU);
Blue Swirl296af7c2010-03-29 19:23:50 +0000870 }
871 va_end(ap);
872 abort();
873}
874
875void cpu_synchronize_all_states(void)
876{
Andreas Färber182735e2013-05-29 22:29:20 +0200877 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000878
Andreas Färberbdc44642013-06-24 23:50:24 +0200879 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200880 cpu_synchronize_state(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000881 }
882}
883
884void cpu_synchronize_all_post_reset(void)
885{
Andreas Färber182735e2013-05-29 22:29:20 +0200886 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000887
Andreas Färberbdc44642013-06-24 23:50:24 +0200888 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200889 cpu_synchronize_post_reset(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000890 }
891}
892
893void cpu_synchronize_all_post_init(void)
894{
Andreas Färber182735e2013-05-29 22:29:20 +0200895 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000896
Andreas Färberbdc44642013-06-24 23:50:24 +0200897 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200898 cpu_synchronize_post_init(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000899 }
900}
901
Kevin Wolf56983462013-07-05 13:49:54 +0200902static int do_vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +0000903{
Kevin Wolf56983462013-07-05 13:49:54 +0200904 int ret = 0;
905
Luiz Capitulino13548692011-07-29 15:36:43 -0300906 if (runstate_is_running()) {
Blue Swirl296af7c2010-03-29 19:23:50 +0000907 cpu_disable_ticks();
Blue Swirl296af7c2010-03-29 19:23:50 +0000908 pause_all_vcpus();
Luiz Capitulinof5bbfba2011-07-29 15:04:45 -0300909 runstate_set(state);
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -0300910 vm_state_notify(0, state);
Wenchao Xiaa4e15de2014-06-18 08:43:36 +0200911 qapi_event_send_stop(&error_abort);
Blue Swirl296af7c2010-03-29 19:23:50 +0000912 }
Kevin Wolf56983462013-07-05 13:49:54 +0200913
Kevin Wolf594a45c2013-07-18 14:52:19 +0200914 bdrv_drain_all();
Pavel Dovgalyuk6d0ceb82016-09-26 11:08:16 +0300915 replay_disable_events();
John Snow22af08e2016-09-22 21:45:51 -0400916 ret = bdrv_flush_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +0200917
Kevin Wolf56983462013-07-05 13:49:54 +0200918 return ret;
Blue Swirl296af7c2010-03-29 19:23:50 +0000919}
920
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200921static bool cpu_can_run(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +0000922{
Andreas Färber4fdeee72012-05-02 23:10:09 +0200923 if (cpu->stop) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200924 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100925 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +0800926 if (cpu_is_stopped(cpu)) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200927 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100928 }
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200929 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +0000930}
931
Andreas Färber91325042013-05-27 02:07:49 +0200932static void cpu_handle_guest_debug(CPUState *cpu)
Jan Kiszka3c638d02010-06-25 16:56:56 +0200933{
Andreas Färber64f6b342013-05-27 02:06:09 +0200934 gdb_set_stop_cpu(cpu);
Jan Kiszka8cf71712011-02-07 12:19:16 +0100935 qemu_system_debug_request();
Andreas Färberf324e762012-05-02 23:26:21 +0200936 cpu->stopped = true;
Jan Kiszka3c638d02010-06-25 16:56:56 +0200937}
938
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100939#ifdef CONFIG_LINUX
940static void sigbus_reraise(void)
941{
942 sigset_t set;
943 struct sigaction action;
944
945 memset(&action, 0, sizeof(action));
946 action.sa_handler = SIG_DFL;
947 if (!sigaction(SIGBUS, &action, NULL)) {
948 raise(SIGBUS);
949 sigemptyset(&set);
950 sigaddset(&set, SIGBUS);
Peter Maydella2d17612016-05-16 18:33:59 +0100951 pthread_sigmask(SIG_UNBLOCK, &set, NULL);
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100952 }
953 perror("Failed to re-raise SIGBUS!\n");
954 abort();
955}
956
Paolo Bonzinid98d4072017-02-08 13:22:12 +0100957static void sigbus_handler(int n, siginfo_t *siginfo, void *ctx)
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100958{
Paolo Bonzinia16fc072017-02-09 09:50:02 +0100959 if (siginfo->si_code != BUS_MCEERR_AO && siginfo->si_code != BUS_MCEERR_AR) {
960 sigbus_reraise();
961 }
962
Paolo Bonzini2ae41db2017-02-08 12:48:54 +0100963 if (current_cpu) {
964 /* Called asynchronously in VCPU thread. */
965 if (kvm_on_sigbus_vcpu(current_cpu, siginfo->si_code, siginfo->si_addr)) {
966 sigbus_reraise();
967 }
968 } else {
969 /* Called synchronously (via signalfd) in main thread. */
970 if (kvm_on_sigbus(siginfo->si_code, siginfo->si_addr)) {
971 sigbus_reraise();
972 }
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100973 }
974}
975
976static void qemu_init_sigbus(void)
977{
978 struct sigaction action;
979
980 memset(&action, 0, sizeof(action));
981 action.sa_flags = SA_SIGINFO;
Paolo Bonzinid98d4072017-02-08 13:22:12 +0100982 action.sa_sigaction = sigbus_handler;
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100983 sigaction(SIGBUS, &action, NULL);
984
985 prctl(PR_MCE_KILL, PR_MCE_KILL_SET, PR_MCE_KILL_EARLY, 0, 0);
986}
Paolo Bonzinia16fc072017-02-09 09:50:02 +0100987#else /* !CONFIG_LINUX */
/* No SIGBUS setup is done on non-Linux hosts. */
static void qemu_init_sigbus(void)
{
    /* Intentionally empty. */
}
Paolo Bonzinia16fc072017-02-09 09:50:02 +0100991#endif /* !CONFIG_LINUX */
Blue Swirl296af7c2010-03-29 19:23:50 +0000992
Stefan Weilb2532d82012-09-27 07:41:42 +0200993static QemuMutex qemu_global_mutex;
Blue Swirl296af7c2010-03-29 19:23:50 +0000994
995static QemuThread io_thread;
996
Blue Swirl296af7c2010-03-29 19:23:50 +0000997/* cpu creation */
998static QemuCond qemu_cpu_cond;
999/* system init */
Blue Swirl296af7c2010-03-29 19:23:50 +00001000static QemuCond qemu_pause_cond;
1001
Paolo Bonzinid3b12f52011-09-13 10:30:52 +02001002void qemu_init_cpu_loop(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001003{
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001004 qemu_init_sigbus();
Anthony Liguoried945922011-02-08 18:18:18 +01001005 qemu_cond_init(&qemu_cpu_cond);
Anthony Liguoried945922011-02-08 18:18:18 +01001006 qemu_cond_init(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001007 qemu_mutex_init(&qemu_global_mutex);
Blue Swirl296af7c2010-03-29 19:23:50 +00001008
Jan Kiszkab7680cb2011-03-12 17:43:51 +01001009 qemu_thread_get_self(&io_thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001010}
1011
Paolo Bonzini14e6fe12016-10-31 10:36:08 +01001012void run_on_cpu(CPUState *cpu, run_on_cpu_func func, run_on_cpu_data data)
Marcelo Tosattie82bcec2010-05-04 09:45:22 -03001013{
Sergey Fedorovd148d902016-08-29 09:51:00 +02001014 do_run_on_cpu(cpu, func, data, &qemu_global_mutex);
Chegu Vinod3c022702013-06-24 03:49:41 -06001015}
1016
Gu Zheng4c055ab2016-05-12 09:18:13 +05301017static void qemu_kvm_destroy_vcpu(CPUState *cpu)
1018{
1019 if (kvm_destroy_vcpu(cpu) < 0) {
1020 error_report("kvm_destroy_vcpu failed");
1021 exit(EXIT_FAILURE);
1022 }
1023}
1024
1025static void qemu_tcg_destroy_vcpu(CPUState *cpu)
1026{
1027}
1028
Andreas Färber509a0d72012-05-03 02:18:09 +02001029static void qemu_wait_io_event_common(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001030{
Alex Bennée37257942017-02-23 18:29:14 +00001031 atomic_mb_set(&cpu->thread_kicked, false);
Andreas Färber4fdeee72012-05-02 23:10:09 +02001032 if (cpu->stop) {
1033 cpu->stop = false;
Andreas Färberf324e762012-05-02 23:26:21 +02001034 cpu->stopped = true;
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001035 qemu_cond_broadcast(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001036 }
Sergey Fedorova5403c62016-08-02 18:27:36 +01001037 process_queued_cpu_work(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001038}
1039
1040static bool qemu_tcg_should_sleep(CPUState *cpu)
1041{
1042 if (mttcg_enabled) {
1043 return cpu_thread_is_idle(cpu);
1044 } else {
1045 return all_cpu_threads_idle();
1046 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001047}
1048
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001049static void qemu_tcg_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001050{
Alex Bennée37257942017-02-23 18:29:14 +00001051 while (qemu_tcg_should_sleep(cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +00001052 stop_tcg_kick_timer();
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001053 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001054 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001055
Alex Bennée65467062017-02-23 18:29:09 +00001056 start_tcg_kick_timer();
1057
Alex Bennée37257942017-02-23 18:29:14 +00001058 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001059}
1060
Andreas Färberfd529e82013-05-26 23:24:55 +02001061static void qemu_kvm_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001062{
Andreas Färbera98ae1d2013-05-26 23:21:08 +02001063 while (cpu_thread_is_idle(cpu)) {
Andreas Färberf5c121b2012-05-03 01:22:49 +02001064 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001065 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001066
Andreas Färber509a0d72012-05-03 02:18:09 +02001067 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001068}
1069
Jan Kiszka7e97cd82011-02-07 12:19:12 +01001070static void *qemu_kvm_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001071{
Andreas Färber48a106b2013-05-27 02:20:39 +02001072 CPUState *cpu = arg;
Jan Kiszka84b49152011-02-01 22:15:50 +01001073 int r;
Blue Swirl296af7c2010-03-29 19:23:50 +00001074
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001075 rcu_register_thread();
1076
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001077 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001078 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001079 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001080 cpu->can_do_io = 1;
Andreas Färber4917cf42013-05-27 05:17:50 +02001081 current_cpu = cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001082
Andreas Färber504134d2012-12-17 06:38:45 +01001083 r = kvm_init_vcpu(cpu);
Jan Kiszka84b49152011-02-01 22:15:50 +01001084 if (r < 0) {
1085 fprintf(stderr, "kvm_init_vcpu failed: %s\n", strerror(-r));
1086 exit(1);
1087 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001088
Paolo Bonzini18268b62017-02-09 09:41:14 +01001089 kvm_init_cpu_signals(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001090
1091 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001092 cpu->created = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001093 qemu_cond_signal(&qemu_cpu_cond);
1094
Gu Zheng4c055ab2016-05-12 09:18:13 +05301095 do {
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001096 if (cpu_can_run(cpu)) {
Andreas Färber1458c362013-05-26 23:46:55 +02001097 r = kvm_cpu_exec(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001098 if (r == EXCP_DEBUG) {
Andreas Färber91325042013-05-27 02:07:49 +02001099 cpu_handle_guest_debug(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001100 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001101 }
Andreas Färberfd529e82013-05-26 23:24:55 +02001102 qemu_kvm_wait_io_event(cpu);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301103 } while (!cpu->unplug || cpu_can_run(cpu));
Blue Swirl296af7c2010-03-29 19:23:50 +00001104
Gu Zheng4c055ab2016-05-12 09:18:13 +05301105 qemu_kvm_destroy_vcpu(cpu);
Bharata B Rao2c579042016-05-12 09:18:14 +05301106 cpu->created = false;
1107 qemu_cond_signal(&qemu_cpu_cond);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301108 qemu_mutex_unlock_iothread();
Blue Swirl296af7c2010-03-29 19:23:50 +00001109 return NULL;
1110}
1111
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001112static void *qemu_dummy_cpu_thread_fn(void *arg)
1113{
1114#ifdef _WIN32
1115 fprintf(stderr, "qtest is not supported under Windows\n");
1116 exit(1);
1117#else
Andreas Färber10a90212013-05-27 02:24:35 +02001118 CPUState *cpu = arg;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001119 sigset_t waitset;
1120 int r;
1121
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001122 rcu_register_thread();
1123
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001124 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001125 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001126 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001127 cpu->can_do_io = 1;
Alex Bennée37257942017-02-23 18:29:14 +00001128 current_cpu = cpu;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001129
1130 sigemptyset(&waitset);
1131 sigaddset(&waitset, SIG_IPI);
1132
1133 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001134 cpu->created = true;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001135 qemu_cond_signal(&qemu_cpu_cond);
1136
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001137 while (1) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001138 qemu_mutex_unlock_iothread();
1139 do {
1140 int sig;
1141 r = sigwait(&waitset, &sig);
1142 } while (r == -1 && (errno == EAGAIN || errno == EINTR));
1143 if (r == -1) {
1144 perror("sigwait");
1145 exit(1);
1146 }
1147 qemu_mutex_lock_iothread();
Andreas Färber509a0d72012-05-03 02:18:09 +02001148 qemu_wait_io_event_common(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001149 }
1150
1151 return NULL;
1152#endif
1153}
1154
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001155static int64_t tcg_get_icount_limit(void)
1156{
1157 int64_t deadline;
1158
1159 if (replay_mode != REPLAY_MODE_PLAY) {
1160 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1161
1162 /* Maintain prior (possibly buggy) behaviour where if no deadline
1163 * was set (as there is no QEMU_CLOCK_VIRTUAL timer) or it is more than
1164 * INT32_MAX nanoseconds ahead, we still use INT32_MAX
1165 * nanoseconds.
1166 */
1167 if ((deadline < 0) || (deadline > INT32_MAX)) {
1168 deadline = INT32_MAX;
1169 }
1170
1171 return qemu_icount_round(deadline);
1172 } else {
1173 return replay_get_instructions();
1174 }
1175}
1176
Alex Bennée12e97002016-10-27 16:10:14 +01001177static void handle_icount_deadline(void)
1178{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001179 assert(qemu_in_vcpu_thread());
Alex Bennée12e97002016-10-27 16:10:14 +01001180 if (use_icount) {
1181 int64_t deadline =
1182 qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1183
1184 if (deadline == 0) {
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001185 /* Wake up other AioContexts. */
Alex Bennée12e97002016-10-27 16:10:14 +01001186 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001187 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Alex Bennée12e97002016-10-27 16:10:14 +01001188 }
1189 }
1190}
1191
Alex Bennée05248382017-03-29 16:46:59 +01001192static void prepare_icount_for_run(CPUState *cpu)
1193{
1194 if (use_icount) {
1195 int64_t count;
1196 int decr;
1197
1198 /* These should always be cleared by process_icount_data after
1199 * each vCPU execution. However u16.high can be raised
1200 * asynchronously by cpu_exit/cpu_interrupt/tcg_handle_interrupt
1201 */
1202 g_assert(cpu->icount_decr.u16.low == 0);
1203 g_assert(cpu->icount_extra == 0);
1204
1205
1206 count = tcg_get_icount_limit();
1207
Alex Bennéee4cd9652017-03-31 16:09:42 +01001208 /* To calculate what we have executed so far we need to know
1209 * what we originally budgeted to run this cycle */
1210 cpu->icount_budget = count;
1211
Alex Bennée05248382017-03-29 16:46:59 +01001212 decr = (count > 0xffff) ? 0xffff : count;
1213 count -= decr;
1214 cpu->icount_decr.u16.low = decr;
1215 cpu->icount_extra = count;
1216 }
1217}
1218
1219static void process_icount_data(CPUState *cpu)
1220{
1221 if (use_icount) {
Alex Bennéee4cd9652017-03-31 16:09:42 +01001222 /* Account for executed instructions */
1223 timers_state.qemu_icount += cpu_get_icount_executed(cpu);
Alex Bennée05248382017-03-29 16:46:59 +01001224
1225 /* Reset the counters */
1226 cpu->icount_decr.u16.low = 0;
1227 cpu->icount_extra = 0;
Alex Bennéee4cd9652017-03-31 16:09:42 +01001228 cpu->icount_budget = 0;
1229
Alex Bennée05248382017-03-29 16:46:59 +01001230 replay_account_executed_instructions();
1231 }
1232}
1233
1234
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001235static int tcg_cpu_exec(CPUState *cpu)
1236{
1237 int ret;
1238#ifdef CONFIG_PROFILER
1239 int64_t ti;
1240#endif
1241
1242#ifdef CONFIG_PROFILER
1243 ti = profile_getclock();
1244#endif
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001245 qemu_mutex_unlock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001246 cpu_exec_start(cpu);
1247 ret = cpu_exec(cpu);
1248 cpu_exec_end(cpu);
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001249 qemu_mutex_lock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001250#ifdef CONFIG_PROFILER
1251 tcg_time += profile_getclock() - ti;
1252#endif
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001253 return ret;
1254}
1255
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001256/* Destroy any remaining vCPUs which have been unplugged and have
1257 * finished running
1258 */
1259static void deal_with_unplugged_cpus(void)
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001260{
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001261 CPUState *cpu;
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001262
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001263 CPU_FOREACH(cpu) {
1264 if (cpu->unplug && !cpu_can_run(cpu)) {
1265 qemu_tcg_destroy_vcpu(cpu);
1266 cpu->created = false;
1267 qemu_cond_signal(&qemu_cpu_cond);
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001268 break;
1269 }
1270 }
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001271}
Jan Kiszkabdb7ca62011-09-26 09:40:39 +02001272
Alex Bennée65467062017-02-23 18:29:09 +00001273/* Single-threaded TCG
1274 *
1275 * In the single-threaded case each vCPU is simulated in turn. If
1276 * there is more than a single vCPU we create a simple timer to kick
1277 * the vCPU and ensure we don't get stuck in a tight loop in one vCPU.
1278 * This is done explicitly rather than relying on side-effects
1279 * elsewhere.
1280 */
1281
Alex Bennée37257942017-02-23 18:29:14 +00001282static void *qemu_tcg_rr_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001283{
Andreas Färberc3586ba2012-05-03 01:41:24 +02001284 CPUState *cpu = arg;
Blue Swirl296af7c2010-03-29 19:23:50 +00001285
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001286 rcu_register_thread();
1287
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001288 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001289 qemu_thread_get_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001290
Andreas Färber38fcbd32013-07-07 19:50:23 +02001291 CPU_FOREACH(cpu) {
1292 cpu->thread_id = qemu_get_thread_id();
1293 cpu->created = true;
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001294 cpu->can_do_io = 1;
Andreas Färber38fcbd32013-07-07 19:50:23 +02001295 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001296 qemu_cond_signal(&qemu_cpu_cond);
1297
Jan Kiszkafa7d1862011-08-22 18:35:25 +02001298 /* wait for initial kick-off after machine start */
Emilio G. Cotac28e3992015-04-27 12:45:28 -04001299 while (first_cpu->stopped) {
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001300 qemu_cond_wait(first_cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001301
1302 /* process any pending work */
Andreas Färberbdc44642013-06-24 23:50:24 +02001303 CPU_FOREACH(cpu) {
Alex Bennée37257942017-02-23 18:29:14 +00001304 current_cpu = cpu;
Andreas Färber182735e2013-05-29 22:29:20 +02001305 qemu_wait_io_event_common(cpu);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001306 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001307 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001308
Alex Bennée65467062017-02-23 18:29:09 +00001309 start_tcg_kick_timer();
1310
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001311 cpu = first_cpu;
1312
Alex Bennéee5143e32017-02-23 18:29:12 +00001313 /* process any pending work */
1314 cpu->exit_request = 1;
1315
Blue Swirl296af7c2010-03-29 19:23:50 +00001316 while (1) {
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001317 /* Account partial waits to QEMU_CLOCK_VIRTUAL. */
1318 qemu_account_warp_timer();
1319
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001320 /* Run the timers here. This is much more efficient than
1321 * waking up the I/O thread and waiting for completion.
1322 */
1323 handle_icount_deadline();
1324
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001325 if (!cpu) {
1326 cpu = first_cpu;
1327 }
1328
Alex Bennéee5143e32017-02-23 18:29:12 +00001329 while (cpu && !cpu->queued_work_first && !cpu->exit_request) {
1330
Alex Bennée791158d2017-02-23 18:29:10 +00001331 atomic_mb_set(&tcg_current_rr_cpu, cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001332 current_cpu = cpu;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001333
1334 qemu_clock_enable(QEMU_CLOCK_VIRTUAL,
1335 (cpu->singlestep_enabled & SSTEP_NOTIMER) == 0);
1336
1337 if (cpu_can_run(cpu)) {
1338 int r;
Alex Bennée05248382017-03-29 16:46:59 +01001339
1340 prepare_icount_for_run(cpu);
1341
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001342 r = tcg_cpu_exec(cpu);
Alex Bennée05248382017-03-29 16:46:59 +01001343
1344 process_icount_data(cpu);
1345
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001346 if (r == EXCP_DEBUG) {
1347 cpu_handle_guest_debug(cpu);
1348 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001349 } else if (r == EXCP_ATOMIC) {
1350 qemu_mutex_unlock_iothread();
1351 cpu_exec_step_atomic(cpu);
1352 qemu_mutex_lock_iothread();
1353 break;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001354 }
Alex Bennée37257942017-02-23 18:29:14 +00001355 } else if (cpu->stop) {
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001356 if (cpu->unplug) {
1357 cpu = CPU_NEXT(cpu);
1358 }
1359 break;
1360 }
1361
Alex Bennéee5143e32017-02-23 18:29:12 +00001362 cpu = CPU_NEXT(cpu);
1363 } /* while (cpu && !cpu->exit_request).. */
1364
Alex Bennée791158d2017-02-23 18:29:10 +00001365 /* Does not need atomic_mb_set because a spurious wakeup is okay. */
1366 atomic_set(&tcg_current_rr_cpu, NULL);
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001367
Alex Bennéee5143e32017-02-23 18:29:12 +00001368 if (cpu && cpu->exit_request) {
1369 atomic_mb_set(&cpu->exit_request, 0);
1370 }
Alex Blighac70aaf2013-08-21 16:02:57 +01001371
Alex Bennée37257942017-02-23 18:29:14 +00001372 qemu_tcg_wait_io_event(cpu ? cpu : QTAILQ_FIRST(&cpus));
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001373 deal_with_unplugged_cpus();
Blue Swirl296af7c2010-03-29 19:23:50 +00001374 }
1375
1376 return NULL;
1377}
1378
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001379static void *qemu_hax_cpu_thread_fn(void *arg)
1380{
1381 CPUState *cpu = arg;
1382 int r;
Vincent Palatinb3d3a422017-03-20 11:15:49 +01001383
1384 qemu_mutex_lock_iothread();
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001385 qemu_thread_get_self(cpu->thread);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001386
1387 cpu->thread_id = qemu_get_thread_id();
1388 cpu->created = true;
1389 cpu->halted = 0;
1390 current_cpu = cpu;
1391
1392 hax_init_vcpu(cpu);
1393 qemu_cond_signal(&qemu_cpu_cond);
1394
1395 while (1) {
1396 if (cpu_can_run(cpu)) {
1397 r = hax_smp_cpu_exec(cpu);
1398 if (r == EXCP_DEBUG) {
1399 cpu_handle_guest_debug(cpu);
1400 }
1401 }
1402
1403 while (cpu_thread_is_idle(cpu)) {
1404 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
1405 }
1406#ifdef _WIN32
1407 SleepEx(0, TRUE);
1408#endif
1409 qemu_wait_io_event_common(cpu);
1410 }
1411 return NULL;
1412}
1413
#ifdef _WIN32
/*
 * Empty APC routine; qemu_cpu_kick_thread() queues it to the target
 * thread with QueueUserAPC().
 */
static void CALLBACK dummy_apc_func(ULONG_PTR unused)
{
    /* Intentionally empty. */
}
#endif
1419
Alex Bennée37257942017-02-23 18:29:14 +00001420/* Multi-threaded TCG
1421 *
1422 * In the multi-threaded case each vCPU has its own thread. The TLS
1423 * variable current_cpu can be used deep in the code to find the
1424 * current CPUState for a given thread.
1425 */
1426
1427static void *qemu_tcg_cpu_thread_fn(void *arg)
1428{
1429 CPUState *cpu = arg;
1430
Alex Bennéebf51c722017-03-30 18:32:29 +01001431 g_assert(!use_icount);
1432
Alex Bennée37257942017-02-23 18:29:14 +00001433 rcu_register_thread();
1434
1435 qemu_mutex_lock_iothread();
1436 qemu_thread_get_self(cpu->thread);
1437
1438 cpu->thread_id = qemu_get_thread_id();
1439 cpu->created = true;
1440 cpu->can_do_io = 1;
1441 current_cpu = cpu;
1442 qemu_cond_signal(&qemu_cpu_cond);
1443
1444 /* process any pending work */
1445 cpu->exit_request = 1;
1446
1447 while (1) {
1448 if (cpu_can_run(cpu)) {
1449 int r;
1450 r = tcg_cpu_exec(cpu);
1451 switch (r) {
1452 case EXCP_DEBUG:
1453 cpu_handle_guest_debug(cpu);
1454 break;
1455 case EXCP_HALTED:
1456 /* during start-up the vCPU is reset and the thread is
1457 * kicked several times. If we don't ensure we go back
1458 * to sleep in the halted state we won't cleanly
1459 * start-up when the vCPU is enabled.
1460 *
1461 * cpu->halted should ensure we sleep in wait_io_event
1462 */
1463 g_assert(cpu->halted);
1464 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001465 case EXCP_ATOMIC:
1466 qemu_mutex_unlock_iothread();
1467 cpu_exec_step_atomic(cpu);
1468 qemu_mutex_lock_iothread();
Alex Bennée37257942017-02-23 18:29:14 +00001469 default:
1470 /* Ignore everything else? */
1471 break;
1472 }
1473 }
1474
Alex Bennée37257942017-02-23 18:29:14 +00001475 atomic_mb_set(&cpu->exit_request, 0);
1476 qemu_tcg_wait_io_event(cpu);
1477 }
1478
1479 return NULL;
1480}
1481
Andreas Färber2ff09a42012-05-03 00:23:30 +02001482static void qemu_cpu_kick_thread(CPUState *cpu)
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001483{
1484#ifndef _WIN32
1485 int err;
1486
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001487 if (cpu->thread_kicked) {
1488 return;
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001489 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001490 cpu->thread_kicked = true;
Andreas Färber814e6122012-05-02 17:00:37 +02001491 err = pthread_kill(cpu->thread->thread, SIG_IPI);
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001492 if (err) {
1493 fprintf(stderr, "qemu:%s: %s", __func__, strerror(err));
1494 exit(1);
1495 }
1496#else /* _WIN32 */
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001497 if (!qemu_cpu_is_self(cpu)) {
1498 if (!QueueUserAPC(dummy_apc_func, cpu->hThread, 0)) {
1499 fprintf(stderr, "%s: QueueUserAPC failed with error %lu\n",
1500 __func__, GetLastError());
1501 exit(1);
1502 }
1503 }
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001504#endif
1505}
1506
Andreas Färberc08d7422012-05-03 04:34:15 +02001507void qemu_cpu_kick(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001508{
Andreas Färberf5c121b2012-05-03 01:22:49 +02001509 qemu_cond_broadcast(cpu->halt_cond);
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001510 if (tcg_enabled()) {
Alex Bennée791158d2017-02-23 18:29:10 +00001511 cpu_exit(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001512 /* NOP unless doing single-thread RR */
Alex Bennée791158d2017-02-23 18:29:10 +00001513 qemu_cpu_kick_rr_cpu();
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001514 } else {
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001515 if (hax_enabled()) {
1516 /*
1517 * FIXME: race condition with the exit_request check in
1518 * hax_vcpu_hax_exec
1519 */
1520 cpu->exit_request = 1;
1521 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001522 qemu_cpu_kick_thread(cpu);
1523 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001524}
1525
Jan Kiszka46d62fa2011-02-01 22:15:59 +01001526void qemu_cpu_kick_self(void)
1527{
Andreas Färber4917cf42013-05-27 05:17:50 +02001528 assert(current_cpu);
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001529 qemu_cpu_kick_thread(current_cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001530}
1531
Andreas Färber60e82572012-05-02 22:23:49 +02001532bool qemu_cpu_is_self(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001533{
Andreas Färber814e6122012-05-02 17:00:37 +02001534 return qemu_thread_is_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001535}
1536
Paolo Bonzini79e2b9a2015-01-21 12:09:14 +01001537bool qemu_in_vcpu_thread(void)
Juan Quintelaaa723c22012-09-18 16:30:11 +02001538{
Andreas Färber4917cf42013-05-27 05:17:50 +02001539 return current_cpu && qemu_cpu_is_self(current_cpu);
Juan Quintelaaa723c22012-09-18 16:30:11 +02001540}
1541
/*
 * Per-thread flag: set by qemu_mutex_lock_iothread() and cleared by
 * qemu_mutex_unlock_iothread().
 */
static __thread bool iothread_locked = false;

/* Return the calling thread's iothread_locked flag. */
bool qemu_mutex_iothread_locked(void)
{
    return iothread_locked;
}
1548
Blue Swirl296af7c2010-03-29 19:23:50 +00001549void qemu_mutex_lock_iothread(void)
1550{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001551 g_assert(!qemu_mutex_iothread_locked());
1552 qemu_mutex_lock(&qemu_global_mutex);
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001553 iothread_locked = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001554}
1555
1556void qemu_mutex_unlock_iothread(void)
1557{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001558 g_assert(qemu_mutex_iothread_locked());
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001559 iothread_locked = false;
Blue Swirl296af7c2010-03-29 19:23:50 +00001560 qemu_mutex_unlock(&qemu_global_mutex);
1561}
1562
Alex Bennéee8faee02016-10-27 16:09:58 +01001563static bool all_vcpus_paused(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001564{
Andreas Färberbdc44642013-06-24 23:50:24 +02001565 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001566
Andreas Färberbdc44642013-06-24 23:50:24 +02001567 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001568 if (!cpu->stopped) {
Alex Bennéee8faee02016-10-27 16:09:58 +01001569 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001570 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001571 }
1572
Alex Bennéee8faee02016-10-27 16:09:58 +01001573 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001574}
1575
1576void pause_all_vcpus(void)
1577{
Andreas Färberbdc44642013-06-24 23:50:24 +02001578 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001579
Alex Bligh40daca52013-08-21 16:03:02 +01001580 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, false);
Andreas Färberbdc44642013-06-24 23:50:24 +02001581 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001582 cpu->stop = true;
1583 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001584 }
1585
Juan Quintelaaa723c22012-09-18 16:30:11 +02001586 if (qemu_in_vcpu_thread()) {
Jan Kiszkad798e972012-02-17 18:31:16 +01001587 cpu_stop_current();
Jan Kiszkad798e972012-02-17 18:31:16 +01001588 }
1589
Blue Swirl296af7c2010-03-29 19:23:50 +00001590 while (!all_vcpus_paused()) {
Paolo Bonzinibe7d6c52011-03-12 17:44:02 +01001591 qemu_cond_wait(&qemu_pause_cond, &qemu_global_mutex);
Andreas Färberbdc44642013-06-24 23:50:24 +02001592 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001593 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001594 }
1595 }
1596}
1597
Igor Mammedov29936832013-04-23 10:29:37 +02001598void cpu_resume(CPUState *cpu)
1599{
1600 cpu->stop = false;
1601 cpu->stopped = false;
1602 qemu_cpu_kick(cpu);
1603}
1604
Blue Swirl296af7c2010-03-29 19:23:50 +00001605void resume_all_vcpus(void)
1606{
Andreas Färberbdc44642013-06-24 23:50:24 +02001607 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001608
Alex Bligh40daca52013-08-21 16:03:02 +01001609 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, true);
Andreas Färberbdc44642013-06-24 23:50:24 +02001610 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001611 cpu_resume(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001612 }
1613}
1614
Gu Zheng4c055ab2016-05-12 09:18:13 +05301615void cpu_remove(CPUState *cpu)
1616{
1617 cpu->stop = true;
1618 cpu->unplug = true;
1619 qemu_cpu_kick(cpu);
1620}
1621
Bharata B Rao2c579042016-05-12 09:18:14 +05301622void cpu_remove_sync(CPUState *cpu)
1623{
1624 cpu_remove(cpu);
1625 while (cpu->created) {
1626 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1627 }
1628}
1629
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001630/* For temporary buffers for forming a name */
1631#define VCPU_THREAD_NAME_SIZE 16
1632
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001633static void qemu_tcg_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001634{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001635 char thread_name[VCPU_THREAD_NAME_SIZE];
Alex Bennée37257942017-02-23 18:29:14 +00001636 static QemuCond *single_tcg_halt_cond;
1637 static QemuThread *single_tcg_cpu_thread;
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001638
Alex Bennée37257942017-02-23 18:29:14 +00001639 if (qemu_tcg_mttcg_enabled() || !single_tcg_cpu_thread) {
Andreas Färber814e6122012-05-02 17:00:37 +02001640 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001641 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1642 qemu_cond_init(cpu->halt_cond);
Alex Bennée37257942017-02-23 18:29:14 +00001643
1644 if (qemu_tcg_mttcg_enabled()) {
1645 /* create a thread per vCPU with TCG (MTTCG) */
1646 parallel_cpus = true;
1647 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/TCG",
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001648 cpu->cpu_index);
Alex Bennée37257942017-02-23 18:29:14 +00001649
1650 qemu_thread_create(cpu->thread, thread_name, qemu_tcg_cpu_thread_fn,
1651 cpu, QEMU_THREAD_JOINABLE);
1652
1653 } else {
1654 /* share a single thread for all cpus with TCG */
1655 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "ALL CPUs/TCG");
1656 qemu_thread_create(cpu->thread, thread_name,
1657 qemu_tcg_rr_cpu_thread_fn,
1658 cpu, QEMU_THREAD_JOINABLE);
1659
1660 single_tcg_halt_cond = cpu->halt_cond;
1661 single_tcg_cpu_thread = cpu->thread;
1662 }
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001663#ifdef _WIN32
Andreas Färber814e6122012-05-02 17:00:37 +02001664 cpu->hThread = qemu_thread_get_handle(cpu->thread);
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001665#endif
Andreas Färber61a46212012-05-02 22:49:36 +02001666 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001667 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001668 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001669 } else {
Alex Bennée37257942017-02-23 18:29:14 +00001670 /* For non-MTTCG cases we share the thread */
1671 cpu->thread = single_tcg_cpu_thread;
1672 cpu->halt_cond = single_tcg_halt_cond;
Blue Swirl296af7c2010-03-29 19:23:50 +00001673 }
1674}
1675
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001676static void qemu_hax_start_vcpu(CPUState *cpu)
1677{
1678 char thread_name[VCPU_THREAD_NAME_SIZE];
1679
1680 cpu->thread = g_malloc0(sizeof(QemuThread));
1681 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1682 qemu_cond_init(cpu->halt_cond);
1683
1684 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/HAX",
1685 cpu->cpu_index);
1686 qemu_thread_create(cpu->thread, thread_name, qemu_hax_cpu_thread_fn,
1687 cpu, QEMU_THREAD_JOINABLE);
1688#ifdef _WIN32
1689 cpu->hThread = qemu_thread_get_handle(cpu->thread);
1690#endif
1691 while (!cpu->created) {
1692 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1693 }
1694}
1695
Andreas Färber48a106b2013-05-27 02:20:39 +02001696static void qemu_kvm_start_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001697{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001698 char thread_name[VCPU_THREAD_NAME_SIZE];
1699
Andreas Färber814e6122012-05-02 17:00:37 +02001700 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001701 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1702 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001703 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/KVM",
1704 cpu->cpu_index);
1705 qemu_thread_create(cpu->thread, thread_name, qemu_kvm_cpu_thread_fn,
1706 cpu, QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001707 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001708 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001709 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001710}
1711
Andreas Färber10a90212013-05-27 02:24:35 +02001712static void qemu_dummy_start_vcpu(CPUState *cpu)
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001713{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001714 char thread_name[VCPU_THREAD_NAME_SIZE];
1715
Andreas Färber814e6122012-05-02 17:00:37 +02001716 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001717 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1718 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001719 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/DUMMY",
1720 cpu->cpu_index);
1721 qemu_thread_create(cpu->thread, thread_name, qemu_dummy_cpu_thread_fn, cpu,
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001722 QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001723 while (!cpu->created) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001724 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1725 }
1726}
1727
Andreas Färberc643bed2013-05-27 03:23:24 +02001728void qemu_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001729{
Andreas Färberce3960e2012-12-17 03:27:07 +01001730 cpu->nr_cores = smp_cores;
1731 cpu->nr_threads = smp_threads;
Andreas Färberf324e762012-05-02 23:26:21 +02001732 cpu->stopped = true;
Peter Maydell56943e82016-01-21 14:15:04 +00001733
1734 if (!cpu->as) {
1735 /* If the target cpu hasn't set up any address spaces itself,
1736 * give it the default one.
1737 */
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001738 AddressSpace *as = address_space_init_shareable(cpu->memory,
1739 "cpu-memory");
Peter Maydell12ebc9a2016-01-21 14:15:04 +00001740 cpu->num_ases = 1;
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001741 cpu_address_space_init(cpu, as, 0);
Peter Maydell56943e82016-01-21 14:15:04 +00001742 }
1743
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001744 if (kvm_enabled()) {
Andreas Färber48a106b2013-05-27 02:20:39 +02001745 qemu_kvm_start_vcpu(cpu);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001746 } else if (hax_enabled()) {
1747 qemu_hax_start_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001748 } else if (tcg_enabled()) {
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001749 qemu_tcg_init_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001750 } else {
Andreas Färber10a90212013-05-27 02:24:35 +02001751 qemu_dummy_start_vcpu(cpu);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001752 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001753}
1754
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001755void cpu_stop_current(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001756{
Andreas Färber4917cf42013-05-27 05:17:50 +02001757 if (current_cpu) {
1758 current_cpu->stop = false;
1759 current_cpu->stopped = true;
1760 cpu_exit(current_cpu);
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001761 qemu_cond_broadcast(&qemu_pause_cond);
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001762 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001763}
1764
Kevin Wolf56983462013-07-05 13:49:54 +02001765int vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +00001766{
Juan Quintelaaa723c22012-09-18 16:30:11 +02001767 if (qemu_in_vcpu_thread()) {
Paolo Bonzini74892d22014-06-05 14:53:58 +02001768 qemu_system_vmstop_request_prepare();
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -03001769 qemu_system_vmstop_request(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001770 /*
1771 * FIXME: should not return to device code in case
1772 * vm_stop() has been requested.
1773 */
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001774 cpu_stop_current();
Kevin Wolf56983462013-07-05 13:49:54 +02001775 return 0;
Blue Swirl296af7c2010-03-29 19:23:50 +00001776 }
Kevin Wolf56983462013-07-05 13:49:54 +02001777
1778 return do_vm_stop(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001779}
1780
Claudio Imbrenda2d76e822017-02-14 18:07:47 +01001781/**
1782 * Prepare for (re)starting the VM.
1783 * Returns -1 if the vCPUs are not to be restarted (e.g. if they are already
1784 * running or in case of an error condition), 0 otherwise.
1785 */
1786int vm_prepare_start(void)
1787{
1788 RunState requested;
1789 int res = 0;
1790
1791 qemu_vmstop_requested(&requested);
1792 if (runstate_is_running() && requested == RUN_STATE__MAX) {
1793 return -1;
1794 }
1795
1796 /* Ensure that a STOP/RESUME pair of events is emitted if a
1797 * vmstop request was pending. The BLOCK_IO_ERROR event, for
1798 * example, according to documentation is always followed by
1799 * the STOP event.
1800 */
1801 if (runstate_is_running()) {
1802 qapi_event_send_stop(&error_abort);
1803 res = -1;
1804 } else {
1805 replay_enable_events();
1806 cpu_enable_ticks();
1807 runstate_set(RUN_STATE_RUNNING);
1808 vm_state_notify(1, RUN_STATE_RUNNING);
1809 }
1810
1811 /* We are sending this now, but the CPUs will be resumed shortly later */
1812 qapi_event_send_resume(&error_abort);
1813 return res;
1814}
1815
/* Start the VM: resume all vCPUs when vm_prepare_start() returns 0. */
void vm_start(void)
{
    if (vm_prepare_start() == 0) {
        resume_all_vcpus();
    }
}
1822
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001823/* does a state transition even if the VM is already stopped,
1824 current state is forgotten forever */
Kevin Wolf56983462013-07-05 13:49:54 +02001825int vm_stop_force_state(RunState state)
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001826{
1827 if (runstate_is_running()) {
Kevin Wolf56983462013-07-05 13:49:54 +02001828 return vm_stop(state);
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001829 } else {
1830 runstate_set(state);
Wen Congyangb2780d32015-11-20 17:34:38 +08001831
1832 bdrv_drain_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +02001833 /* Make sure to return an error if the flush in a previous vm_stop()
1834 * failed. */
John Snow22af08e2016-09-22 21:45:51 -04001835 return bdrv_flush_all();
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001836 }
1837}
1838
Stefan Weil9a78eea2010-10-22 23:03:33 +02001839void list_cpus(FILE *f, fprintf_function cpu_fprintf, const char *optarg)
Blue Swirl262353c2010-05-04 19:55:35 +00001840{
1841 /* XXX: implement xxx_cpu_list for targets that still miss it */
Peter Maydelle916cbf2012-09-05 17:41:08 -03001842#if defined(cpu_list)
1843 cpu_list(f, cpu_fprintf);
Blue Swirl262353c2010-05-04 19:55:35 +00001844#endif
1845}
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001846
1847CpuInfoList *qmp_query_cpus(Error **errp)
1848{
1849 CpuInfoList *head = NULL, *cur_item = NULL;
Andreas Färber182735e2013-05-29 22:29:20 +02001850 CPUState *cpu;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001851
Andreas Färberbdc44642013-06-24 23:50:24 +02001852 CPU_FOREACH(cpu) {
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001853 CpuInfoList *info;
Andreas Färber182735e2013-05-29 22:29:20 +02001854#if defined(TARGET_I386)
1855 X86CPU *x86_cpu = X86_CPU(cpu);
1856 CPUX86State *env = &x86_cpu->env;
1857#elif defined(TARGET_PPC)
1858 PowerPCCPU *ppc_cpu = POWERPC_CPU(cpu);
1859 CPUPPCState *env = &ppc_cpu->env;
1860#elif defined(TARGET_SPARC)
1861 SPARCCPU *sparc_cpu = SPARC_CPU(cpu);
1862 CPUSPARCState *env = &sparc_cpu->env;
1863#elif defined(TARGET_MIPS)
1864 MIPSCPU *mips_cpu = MIPS_CPU(cpu);
1865 CPUMIPSState *env = &mips_cpu->env;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001866#elif defined(TARGET_TRICORE)
1867 TriCoreCPU *tricore_cpu = TRICORE_CPU(cpu);
1868 CPUTriCoreState *env = &tricore_cpu->env;
Andreas Färber182735e2013-05-29 22:29:20 +02001869#endif
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001870
Andreas Färbercb446ec2013-05-01 14:24:52 +02001871 cpu_synchronize_state(cpu);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001872
1873 info = g_malloc0(sizeof(*info));
1874 info->value = g_malloc0(sizeof(*info->value));
Andreas Färber55e5c282012-12-17 06:18:02 +01001875 info->value->CPU = cpu->cpu_index;
Andreas Färber182735e2013-05-29 22:29:20 +02001876 info->value->current = (cpu == first_cpu);
Andreas Färber259186a2013-01-17 18:51:17 +01001877 info->value->halted = cpu->halted;
Eduardo Habkost58f88d42015-05-08 16:04:22 -03001878 info->value->qom_path = object_get_canonical_path(OBJECT(cpu));
Andreas Färber9f09e182012-05-03 06:59:07 +02001879 info->value->thread_id = cpu->thread_id;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001880#if defined(TARGET_I386)
Eric Blake86f4b682015-11-18 01:52:59 -07001881 info->value->arch = CPU_INFO_ARCH_X86;
Eric Blake544a3732016-02-17 23:48:27 -07001882 info->value->u.x86.pc = env->eip + env->segs[R_CS].base;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001883#elif defined(TARGET_PPC)
Eric Blake86f4b682015-11-18 01:52:59 -07001884 info->value->arch = CPU_INFO_ARCH_PPC;
Eric Blake544a3732016-02-17 23:48:27 -07001885 info->value->u.ppc.nip = env->nip;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001886#elif defined(TARGET_SPARC)
Eric Blake86f4b682015-11-18 01:52:59 -07001887 info->value->arch = CPU_INFO_ARCH_SPARC;
Eric Blake544a3732016-02-17 23:48:27 -07001888 info->value->u.q_sparc.pc = env->pc;
1889 info->value->u.q_sparc.npc = env->npc;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001890#elif defined(TARGET_MIPS)
Eric Blake86f4b682015-11-18 01:52:59 -07001891 info->value->arch = CPU_INFO_ARCH_MIPS;
Eric Blake544a3732016-02-17 23:48:27 -07001892 info->value->u.q_mips.PC = env->active_tc.PC;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001893#elif defined(TARGET_TRICORE)
Eric Blake86f4b682015-11-18 01:52:59 -07001894 info->value->arch = CPU_INFO_ARCH_TRICORE;
Eric Blake544a3732016-02-17 23:48:27 -07001895 info->value->u.tricore.PC = env->PC;
Eric Blake86f4b682015-11-18 01:52:59 -07001896#else
1897 info->value->arch = CPU_INFO_ARCH_OTHER;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001898#endif
1899
1900 /* XXX: waiting for the qapi to support GSList */
1901 if (!cur_item) {
1902 head = cur_item = info;
1903 } else {
1904 cur_item->next = info;
1905 cur_item = info;
1906 }
1907 }
1908
1909 return head;
1910}
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001911
1912void qmp_memsave(int64_t addr, int64_t size, const char *filename,
1913 bool has_cpu, int64_t cpu_index, Error **errp)
1914{
1915 FILE *f;
1916 uint32_t l;
Andreas Färber55e5c282012-12-17 06:18:02 +01001917 CPUState *cpu;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001918 uint8_t buf[1024];
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001919 int64_t orig_addr = addr, orig_size = size;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001920
1921 if (!has_cpu) {
1922 cpu_index = 0;
1923 }
1924
Andreas Färber151d1322013-02-15 15:41:49 +01001925 cpu = qemu_get_cpu(cpu_index);
1926 if (cpu == NULL) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001927 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "cpu-index",
1928 "a CPU number");
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001929 return;
1930 }
1931
1932 f = fopen(filename, "wb");
1933 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001934 error_setg_file_open(errp, errno, filename);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001935 return;
1936 }
1937
1938 while (size != 0) {
1939 l = sizeof(buf);
1940 if (l > size)
1941 l = size;
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301942 if (cpu_memory_rw_debug(cpu, addr, buf, l, 0) != 0) {
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001943 error_setg(errp, "Invalid addr 0x%016" PRIx64 "/size %" PRId64
1944 " specified", orig_addr, orig_size);
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301945 goto exit;
1946 }
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001947 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001948 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001949 goto exit;
1950 }
1951 addr += l;
1952 size -= l;
1953 }
1954
1955exit:
1956 fclose(f);
1957}
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001958
1959void qmp_pmemsave(int64_t addr, int64_t size, const char *filename,
1960 Error **errp)
1961{
1962 FILE *f;
1963 uint32_t l;
1964 uint8_t buf[1024];
1965
1966 f = fopen(filename, "wb");
1967 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001968 error_setg_file_open(errp, errno, filename);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001969 return;
1970 }
1971
1972 while (size != 0) {
1973 l = sizeof(buf);
1974 if (l > size)
1975 l = size;
Stefan Weileb6282f2014-04-07 20:28:23 +02001976 cpu_physical_memory_read(addr, buf, l);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001977 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001978 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001979 goto exit;
1980 }
1981 addr += l;
1982 size -= l;
1983 }
1984
1985exit:
1986 fclose(f);
1987}
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001988
1989void qmp_inject_nmi(Error **errp)
1990{
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +10001991 nmi_monitor_handle(monitor_get_cpu_index(), errp);
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001992}
Sebastian Tanase27498be2014-07-25 11:56:33 +02001993
1994void dump_drift_info(FILE *f, fprintf_function cpu_fprintf)
1995{
1996 if (!use_icount) {
1997 return;
1998 }
1999
2000 cpu_fprintf(f, "Host - Guest clock %"PRIi64" ms\n",
2001 (cpu_get_clock() - cpu_get_icount())/SCALE_MS);
2002 if (icount_align_option) {
2003 cpu_fprintf(f, "Max guest delay %"PRIi64" ms\n", -max_delay/SCALE_MS);
2004 cpu_fprintf(f, "Max guest advance %"PRIi64" ms\n", max_advance/SCALE_MS);
2005 } else {
2006 cpu_fprintf(f, "Max guest delay NA\n");
2007 cpu_fprintf(f, "Max guest advance NA\n");
2008 }
2009}