blob: a628cde23260a82cba51c9146336fe8bdf7e854d [file] [log] [blame]
Blue Swirl296af7c2010-03-29 19:23:50 +00001/*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24
25/* Needed early for CONFIG_BSD etc. */
Peter Maydell7b31bbc2016-01-26 18:16:56 +000026#include "qemu/osdep.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010027#include "qemu-common.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000028#include "qemu/config-file.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010029#include "cpu.h"
Paolo Bonzini83c90892012-12-17 18:19:49 +010030#include "monitor/monitor.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020031#include "qapi/qmp/qerror.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010032#include "qemu/error-report.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010033#include "sysemu/sysemu.h"
Max Reitzda31d592016-03-16 19:54:32 +010034#include "sysemu/block-backend.h"
Paolo Bonzini022c62c2012-12-17 18:19:49 +010035#include "exec/gdbstub.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010036#include "sysemu/dma.h"
Vincent Palatinb3946622017-01-10 11:59:55 +010037#include "sysemu/hw_accel.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010038#include "sysemu/kvm.h"
Vincent Palatinb0cb0a62017-01-10 11:59:57 +010039#include "sysemu/hax.h"
Luiz Capitulinode0b36b2011-09-21 16:38:35 -030040#include "qmp-commands.h"
Paolo Bonzini63c91552016-03-15 13:18:37 +010041#include "exec/exec-all.h"
Blue Swirl296af7c2010-03-29 19:23:50 +000042
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010043#include "qemu/thread.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010044#include "sysemu/cpus.h"
45#include "sysemu/qtest.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010046#include "qemu/main-loop.h"
47#include "qemu/bitmap.h"
Liu Ping Fancb365642013-09-25 14:20:58 +080048#include "qemu/seqlock.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000049#include "tcg.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020050#include "qapi-event.h"
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +100051#include "hw/nmi.h"
Pavel Dovgalyuk8b427042015-09-17 19:24:05 +030052#include "sysemu/replay.h"
Jan Kiszka0ff0fc12011-06-23 10:15:55 +020053
#ifdef CONFIG_LINUX

#include <sys/prctl.h>

/*
 * Fallback values for the prctl() machine-check constants, defined only
 * when <sys/prctl.h> does not already provide them.
 */
#ifndef PR_MCE_KILL
#define PR_MCE_KILL 33
#endif

#ifndef PR_MCE_KILL_SET
#define PR_MCE_KILL_SET 1
#endif

#ifndef PR_MCE_KILL_EARLY
#define PR_MCE_KILL_EARLY 1
#endif

#endif /* CONFIG_LINUX */
71
/* NOTE(review): not referenced in the visible part of this file; presumably
 * consumed by the icount "align" support elsewhere -- confirm.
 */
int64_t max_delay;
int64_t max_advance;

/* vcpu throttling controls */
/* Created in cpu_ticks_init(); fires cpu_throttle_timer_tick(). */
static QEMUTimer *throttle_timer;
/* Accessed with atomic_set()/atomic_read(); 0 means throttling is off. */
static unsigned int throttle_percentage;

/* Bounds that cpu_throttle_set() clamps the requested percentage to. */
#define CPU_THROTTLE_PCT_MIN 1
#define CPU_THROTTLE_PCT_MAX 99
/* Base timeslice, in nanoseconds, from which the sleep time and the timer
 * period are derived.
 */
#define CPU_THROTTLE_TIMESLICE_NS 10000000
82
Tiejun Chen321bc0b2013-08-02 09:43:09 +080083bool cpu_is_stopped(CPUState *cpu)
84{
85 return cpu->stopped || !runstate_is_running();
86}
87
Andreas Färbera98ae1d2013-05-26 23:21:08 +020088static bool cpu_thread_is_idle(CPUState *cpu)
Peter Maydellac873f12012-07-19 16:52:27 +010089{
Andreas Färberc64ca812012-05-03 02:11:45 +020090 if (cpu->stop || cpu->queued_work_first) {
Peter Maydellac873f12012-07-19 16:52:27 +010091 return false;
92 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +080093 if (cpu_is_stopped(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +010094 return true;
95 }
Andreas Färber8c2e1b02013-08-25 18:53:55 +020096 if (!cpu->halted || cpu_has_work(cpu) ||
Alexander Graf215e79c2013-04-24 22:24:12 +020097 kvm_halt_in_kernel()) {
Peter Maydellac873f12012-07-19 16:52:27 +010098 return false;
99 }
100 return true;
101}
102
103static bool all_cpu_threads_idle(void)
104{
Andreas Färber182735e2013-05-29 22:29:20 +0200105 CPUState *cpu;
Peter Maydellac873f12012-07-19 16:52:27 +0100106
Andreas Färberbdc44642013-06-24 23:50:24 +0200107 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200108 if (!cpu_thread_is_idle(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +0100109 return false;
110 }
111 }
112 return true;
113}
114
Blue Swirl296af7c2010-03-29 19:23:50 +0000115/***********************************************************/
Paolo Bonzini946fb272011-09-12 13:57:37 +0200116/* guest cycle counter */
117
/* Protected by TimersState seqlock */

/* Set from the "sleep" option in configure_icount(); defaults to true. */
static bool icount_sleep = true;
/* QEMU_CLOCK_VIRTUAL_RT time at which a pending warp started, or -1 when
 * no warp is pending.
 */
static int64_t vm_clock_warp_start = -1;
/* Conversion factor from emulated instructions to virtual clock ticks. */
static int icount_time_shift;
/* Arbitrarily pick 1MIPS as the minimum allowable speed. */
#define MAX_ICOUNT_SHIFT 10

/* Re-armed by icount_adjust_rt() and icount_adjust_vm() respectively. */
static QEMUTimer *icount_rt_timer;
static QEMUTimer *icount_vm_timer;
/* Created in configure_icount() when icount_sleep is set; its callback is
 * icount_timer_cb().
 */
static QEMUTimer *icount_warp_timer;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200130
/*
 * Bookkeeping for the guest tick counter, the VM clock and the instruction
 * counter.  Several fields are exposed to migration through vmstate_timers
 * and icount_vmstate_timers.
 */
typedef struct TimersState {
    /* Protected by BQL. */
    int64_t cpu_ticks_prev;
    int64_t cpu_ticks_offset;

    /* cpu_clock_offset can be read out of BQL, so protect it with
     * this lock.
     */
    QemuSeqLock vm_clock_seqlock;
    int64_t cpu_clock_offset;
    /* Non-zero between cpu_enable_ticks() and cpu_disable_ticks(). */
    int32_t cpu_ticks_enabled;
    /* Not used by the code in view, but listed in vmstate_timers. */
    int64_t dummy;

    /* Compensate for varying guest execution speed. */
    int64_t qemu_icount_bias;
    /* Only written by TCG thread */
    int64_t qemu_icount;
} TimersState;
149
/* Single instance; registered for migration in cpu_ticks_init(). */
static TimersState timers_state;
/* Set by qemu_tcg_configure(): true when multi-threaded TCG is selected. */
bool mttcg_enabled;
152
153/*
154 * We default to false if we know other options have been enabled
155 * which are currently incompatible with MTTCG. Otherwise when each
156 * guest (target) has been updated to support:
157 * - atomic instructions
158 * - memory ordering primitives (barriers)
159 * they can set the appropriate CONFIG flags in ${target}-softmmu.mak
160 *
161 * Once a guest architecture has been converted to the new primitives
162 * there are two remaining limitations to check.
163 *
164 * - The guest can't be oversized (e.g. 64 bit guest on 32 bit host)
165 * - The host must have a stronger memory order than the guest
166 *
167 * It may be possible in future to support strong guests on weak hosts
168 * but that will require tagging all load/stores in a guest with their
169 * implicit memory order requirements which would likely slow things
170 * down a lot.
171 */
172
/*
 * Check that every memory-ordering bit in TCG_GUEST_DEFAULT_MO is also set
 * in TCG_TARGET_DEFAULT_MO.  Returns false when either macro is undefined.
 */
static bool check_tcg_memory_orders_compatible(void)
{
    bool compatible = false;

#if defined(TCG_GUEST_DEFAULT_MO) && defined(TCG_TARGET_DEFAULT_MO)
    /* No guest ordering bit may be missing from the host's set. */
    compatible = !(TCG_GUEST_DEFAULT_MO & ~TCG_TARGET_DEFAULT_MO);
#endif
    return compatible;
}
181
182static bool default_mttcg_enabled(void)
183{
184 QemuOpts *icount_opts = qemu_find_opts_singleton("icount");
185 const char *rr = qemu_opt_get(icount_opts, "rr");
186
187 if (rr || TCG_OVERSIZED_GUEST) {
188 return false;
189 } else {
190#ifdef TARGET_SUPPORTS_MTTCG
191 return check_tcg_memory_orders_compatible();
192#else
193 return false;
194#endif
195 }
196}
197
198void qemu_tcg_configure(QemuOpts *opts, Error **errp)
199{
200 const char *t = qemu_opt_get(opts, "thread");
201 if (t) {
202 if (strcmp(t, "multi") == 0) {
203 if (TCG_OVERSIZED_GUEST) {
204 error_setg(errp, "No MTTCG when guest word size > hosts");
205 } else {
206 if (!check_tcg_memory_orders_compatible()) {
207 error_report("Guest expects a stronger memory ordering "
208 "than the host provides");
209 error_printf("This may cause strange/hard to debug errors");
210 }
211 mttcg_enabled = true;
212 }
213 } else if (strcmp(t, "single") == 0) {
214 mttcg_enabled = false;
215 } else {
216 error_setg(errp, "Invalid 'thread' setting %s", t);
217 }
218 } else {
219 mttcg_enabled = default_mttcg_enabled();
220 }
221}
Paolo Bonzini946fb272011-09-12 13:57:37 +0200222
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300223int64_t cpu_get_icount_raw(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200224{
225 int64_t icount;
Andreas Färber4917cf42013-05-27 05:17:50 +0200226 CPUState *cpu = current_cpu;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200227
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200228 icount = timers_state.qemu_icount;
Andreas Färber4917cf42013-05-27 05:17:50 +0200229 if (cpu) {
Paolo Bonzini414b15c2015-06-24 14:16:26 +0200230 if (!cpu->can_do_io) {
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300231 fprintf(stderr, "Bad icount read\n");
232 exit(1);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200233 }
Andreas Färber28ecfd72013-08-26 05:51:49 +0200234 icount -= (cpu->icount_decr.u16.low + cpu->icount_extra);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200235 }
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300236 return icount;
237}
238
239/* Return the virtual CPU time, based on the instruction counter. */
240static int64_t cpu_get_icount_locked(void)
241{
242 int64_t icount = cpu_get_icount_raw();
KONRAD Frederic3f031312014-08-01 01:37:15 +0200243 return timers_state.qemu_icount_bias + cpu_icount_to_ns(icount);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200244}
245
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200246int64_t cpu_get_icount(void)
247{
248 int64_t icount;
249 unsigned start;
250
251 do {
252 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
253 icount = cpu_get_icount_locked();
254 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
255
256 return icount;
257}
258
KONRAD Frederic3f031312014-08-01 01:37:15 +0200259int64_t cpu_icount_to_ns(int64_t icount)
260{
261 return icount << icount_time_shift;
262}
263
Cao jind90f3cc2016-07-29 19:05:38 +0800264/* return the time elapsed in VM between vm_start and vm_stop. Unless
265 * icount is active, cpu_get_ticks() uses units of the host CPU cycle
266 * counter.
267 *
268 * Caller must hold the BQL
269 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200270int64_t cpu_get_ticks(void)
271{
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100272 int64_t ticks;
273
Paolo Bonzini946fb272011-09-12 13:57:37 +0200274 if (use_icount) {
275 return cpu_get_icount();
276 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100277
278 ticks = timers_state.cpu_ticks_offset;
279 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400280 ticks += cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200281 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100282
283 if (timers_state.cpu_ticks_prev > ticks) {
284 /* Note: non increasing ticks may happen if the host uses
285 software suspend */
286 timers_state.cpu_ticks_offset += timers_state.cpu_ticks_prev - ticks;
287 ticks = timers_state.cpu_ticks_prev;
288 }
289
290 timers_state.cpu_ticks_prev = ticks;
291 return ticks;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200292}
293
Liu Ping Fancb365642013-09-25 14:20:58 +0800294static int64_t cpu_get_clock_locked(void)
295{
Cao jin1d45cea2016-07-29 19:05:37 +0800296 int64_t time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800297
Cao jin1d45cea2016-07-29 19:05:37 +0800298 time = timers_state.cpu_clock_offset;
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100299 if (timers_state.cpu_ticks_enabled) {
Cao jin1d45cea2016-07-29 19:05:37 +0800300 time += get_clock();
Liu Ping Fancb365642013-09-25 14:20:58 +0800301 }
302
Cao jin1d45cea2016-07-29 19:05:37 +0800303 return time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800304}
305
Cao jind90f3cc2016-07-29 19:05:38 +0800306/* Return the monotonic time elapsed in VM, i.e.,
Peter Maydell8212ff82016-09-15 10:24:22 +0100307 * the time between vm_start and vm_stop
308 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200309int64_t cpu_get_clock(void)
310{
311 int64_t ti;
Liu Ping Fancb365642013-09-25 14:20:58 +0800312 unsigned start;
313
314 do {
315 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
316 ti = cpu_get_clock_locked();
317 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
318
319 return ti;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200320}
321
Liu Ping Fancb365642013-09-25 14:20:58 +0800322/* enable cpu_get_ticks()
Cao jin3224e872016-07-08 18:31:37 +0800323 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800324 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200325void cpu_enable_ticks(void)
326{
Liu Ping Fancb365642013-09-25 14:20:58 +0800327 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400328 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200329 if (!timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400330 timers_state.cpu_ticks_offset -= cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200331 timers_state.cpu_clock_offset -= get_clock();
332 timers_state.cpu_ticks_enabled = 1;
333 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400334 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200335}
336
337/* disable cpu_get_ticks() : the clock is stopped. You must not call
Liu Ping Fancb365642013-09-25 14:20:58 +0800338 * cpu_get_ticks() after that.
Cao jin3224e872016-07-08 18:31:37 +0800339 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800340 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200341void cpu_disable_ticks(void)
342{
Liu Ping Fancb365642013-09-25 14:20:58 +0800343 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400344 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200345 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400346 timers_state.cpu_ticks_offset += cpu_get_host_ticks();
Liu Ping Fancb365642013-09-25 14:20:58 +0800347 timers_state.cpu_clock_offset = cpu_get_clock_locked();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200348 timers_state.cpu_ticks_enabled = 0;
349 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400350 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200351}
352
/* Correlation between real and virtual time is always going to be
   fairly approximate, so ignore small variation.
   When the guest is idle real and virtual time will be aligned in
   the IO wait loop.
   The tolerance is one tenth of NANOSECONDS_PER_SECOND; it is used by
   icount_adjust() when deciding whether to change the shift. */
#define ICOUNT_WOBBLE (NANOSECONDS_PER_SECOND / 10)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200358
359static void icount_adjust(void)
360{
361 int64_t cur_time;
362 int64_t cur_icount;
363 int64_t delta;
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200364
365 /* Protected by TimersState mutex. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200366 static int64_t last_delta;
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200367
Paolo Bonzini946fb272011-09-12 13:57:37 +0200368 /* If the VM is not running, then do nothing. */
369 if (!runstate_is_running()) {
370 return;
371 }
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200372
Emilio G. Cota03719e42016-06-08 14:55:21 -0400373 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200374 cur_time = cpu_get_clock_locked();
375 cur_icount = cpu_get_icount_locked();
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200376
Paolo Bonzini946fb272011-09-12 13:57:37 +0200377 delta = cur_icount - cur_time;
378 /* FIXME: This is a very crude algorithm, somewhat prone to oscillation. */
379 if (delta > 0
380 && last_delta + ICOUNT_WOBBLE < delta * 2
381 && icount_time_shift > 0) {
382 /* The guest is getting too far ahead. Slow time down. */
383 icount_time_shift--;
384 }
385 if (delta < 0
386 && last_delta - ICOUNT_WOBBLE > delta * 2
387 && icount_time_shift < MAX_ICOUNT_SHIFT) {
388 /* The guest is getting too far behind. Speed time up. */
389 icount_time_shift++;
390 }
391 last_delta = delta;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200392 timers_state.qemu_icount_bias = cur_icount
393 - (timers_state.qemu_icount << icount_time_shift);
Emilio G. Cota03719e42016-06-08 14:55:21 -0400394 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200395}
396
397static void icount_adjust_rt(void *opaque)
398{
Alex Bligh40daca52013-08-21 16:03:02 +0100399 timer_mod(icount_rt_timer,
Pavel Dovgalyuk1979b902015-01-12 15:00:43 +0300400 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200401 icount_adjust();
402}
403
404static void icount_adjust_vm(void *opaque)
405{
Alex Bligh40daca52013-08-21 16:03:02 +0100406 timer_mod(icount_vm_timer,
407 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530408 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200409 icount_adjust();
410}
411
412static int64_t qemu_icount_round(int64_t count)
413{
414 return (count + (1 << icount_time_shift) - 1) >> icount_time_shift;
415}
416
Pavel Dovgalyukefab87c2015-09-17 19:24:39 +0300417static void icount_warp_rt(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200418{
Alex Bennéeccffff42016-04-04 15:35:48 +0100419 unsigned seq;
420 int64_t warp_start;
421
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200422 /* The icount_warp_timer is rescheduled soon after vm_clock_warp_start
423 * changes from -1 to another value, so the race here is okay.
424 */
Alex Bennéeccffff42016-04-04 15:35:48 +0100425 do {
426 seq = seqlock_read_begin(&timers_state.vm_clock_seqlock);
427 warp_start = vm_clock_warp_start;
428 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, seq));
429
430 if (warp_start == -1) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200431 return;
432 }
433
Emilio G. Cota03719e42016-06-08 14:55:21 -0400434 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200435 if (runstate_is_running()) {
Pavel Dovgalyuk8eda2062015-09-17 19:24:28 +0300436 int64_t clock = REPLAY_CLOCK(REPLAY_CLOCK_VIRTUAL_RT,
437 cpu_get_clock_locked());
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200438 int64_t warp_delta;
439
440 warp_delta = clock - vm_clock_warp_start;
441 if (use_icount == 2) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200442 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100443 * In adaptive mode, do not let QEMU_CLOCK_VIRTUAL run too
Paolo Bonzini946fb272011-09-12 13:57:37 +0200444 * far ahead of real time.
445 */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200446 int64_t cur_icount = cpu_get_icount_locked();
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300447 int64_t delta = clock - cur_icount;
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200448 warp_delta = MIN(warp_delta, delta);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200449 }
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200450 timers_state.qemu_icount_bias += warp_delta;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200451 }
452 vm_clock_warp_start = -1;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400453 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200454
455 if (qemu_clock_expired(QEMU_CLOCK_VIRTUAL)) {
456 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
457 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200458}
459
/* Callback of icount_warp_timer: account the pending warp.
 * @opaque is unused.
 */
static void icount_timer_cb(void *opaque)
{
    /* The timer already synchronizes with CHECKPOINT_CLOCK_VIRTUAL_RT,
     * so no extra checkpoint is needed here.
     */
    icount_warp_rt();
}
467
Paolo Bonzini8156be52012-03-28 15:42:04 +0200468void qtest_clock_warp(int64_t dest)
469{
Alex Bligh40daca52013-08-21 16:03:02 +0100470 int64_t clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800471 AioContext *aio_context;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200472 assert(qtest_enabled());
Fam Zhengefef88b2015-01-19 17:51:43 +0800473 aio_context = qemu_get_aio_context();
Paolo Bonzini8156be52012-03-28 15:42:04 +0200474 while (clock < dest) {
Alex Bligh40daca52013-08-21 16:03:02 +0100475 int64_t deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Sergey Fedorovc9299e22014-06-10 13:10:28 +0400476 int64_t warp = qemu_soonest_timeout(dest - clock, deadline);
Fam Zhengefef88b2015-01-19 17:51:43 +0800477
Emilio G. Cota03719e42016-06-08 14:55:21 -0400478 seqlock_write_begin(&timers_state.vm_clock_seqlock);
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200479 timers_state.qemu_icount_bias += warp;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400480 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200481
Alex Bligh40daca52013-08-21 16:03:02 +0100482 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800483 timerlist_run_timers(aio_context->tlg.tl[QEMU_CLOCK_VIRTUAL]);
Alex Bligh40daca52013-08-21 16:03:02 +0100484 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200485 }
Alex Bligh40daca52013-08-21 16:03:02 +0100486 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200487}
488
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300489void qemu_start_warp_timer(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200490{
Paolo Bonzinice78d182013-10-07 17:30:02 +0200491 int64_t clock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200492 int64_t deadline;
493
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300494 if (!use_icount) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200495 return;
496 }
497
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300498 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
499 * do not fire, so computing the deadline does not make sense.
500 */
501 if (!runstate_is_running()) {
502 return;
503 }
504
505 /* warp clock deterministically in record/replay mode */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300506 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_START)) {
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300507 return;
508 }
509
Paolo Bonzinice78d182013-10-07 17:30:02 +0200510 if (!all_cpu_threads_idle()) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200511 return;
512 }
513
Paolo Bonzini8156be52012-03-28 15:42:04 +0200514 if (qtest_enabled()) {
515 /* When testing, qtest commands advance icount. */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300516 return;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200517 }
518
Alex Blighac70aaf2013-08-21 16:02:57 +0100519 /* We want to use the earliest deadline from ALL vm_clocks */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300520 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT);
Alex Bligh40daca52013-08-21 16:03:02 +0100521 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200522 if (deadline < 0) {
Victor CLEMENTd7a0f712015-05-29 17:14:06 +0200523 static bool notified;
524 if (!icount_sleep && !notified) {
525 error_report("WARNING: icount sleep disabled and no active timers");
526 notified = true;
527 }
Paolo Bonzinice78d182013-10-07 17:30:02 +0200528 return;
Alex Blighac70aaf2013-08-21 16:02:57 +0100529 }
530
Paolo Bonzini946fb272011-09-12 13:57:37 +0200531 if (deadline > 0) {
532 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100533 * Ensure QEMU_CLOCK_VIRTUAL proceeds even when the virtual CPU goes to
Paolo Bonzini946fb272011-09-12 13:57:37 +0200534 * sleep. Otherwise, the CPU might be waiting for a future timer
535 * interrupt to wake it up, but the interrupt never comes because
536 * the vCPU isn't running any insns and thus doesn't advance the
Alex Bligh40daca52013-08-21 16:03:02 +0100537 * QEMU_CLOCK_VIRTUAL.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200538 */
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200539 if (!icount_sleep) {
540 /*
541 * We never let VCPUs sleep in no sleep icount mode.
542 * If there is a pending QEMU_CLOCK_VIRTUAL timer we just advance
543 * to the next QEMU_CLOCK_VIRTUAL event and notify it.
544 * It is useful when we want a deterministic execution time,
545 * isolated from host latencies.
546 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400547 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200548 timers_state.qemu_icount_bias += deadline;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400549 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200550 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
551 } else {
552 /*
553 * We do stop VCPUs and only advance QEMU_CLOCK_VIRTUAL after some
554 * "real" time, (related to the time left until the next event) has
555 * passed. The QEMU_CLOCK_VIRTUAL_RT clock will do this.
556 * This avoids that the warps are visible externally; for example,
557 * you will not be sending network packets continuously instead of
558 * every 100ms.
559 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400560 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200561 if (vm_clock_warp_start == -1 || vm_clock_warp_start > clock) {
562 vm_clock_warp_start = clock;
563 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400564 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200565 timer_mod_anticipate(icount_warp_timer, clock + deadline);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200566 }
Alex Blighac70aaf2013-08-21 16:02:57 +0100567 } else if (deadline == 0) {
Alex Bligh40daca52013-08-21 16:03:02 +0100568 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200569 }
570}
571
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300572static void qemu_account_warp_timer(void)
573{
574 if (!use_icount || !icount_sleep) {
575 return;
576 }
577
578 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
579 * do not fire, so computing the deadline does not make sense.
580 */
581 if (!runstate_is_running()) {
582 return;
583 }
584
585 /* warp clock deterministically in record/replay mode */
586 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_ACCOUNT)) {
587 return;
588 }
589
590 timer_del(icount_warp_timer);
591 icount_warp_rt();
592}
593
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200594static bool icount_state_needed(void *opaque)
595{
596 return use_icount;
597}
598
/*
 * This is a subsection for icount migration.
 * It carries the two icount fields of TimersState and is only included
 * when icount_state_needed() returns true.
 */
static const VMStateDescription icount_vmstate_timers = {
    .name = "timer/icount",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = icount_state_needed,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(qemu_icount_bias, TimersState),
        VMSTATE_INT64(qemu_icount, TimersState),
        VMSTATE_END_OF_LIST()
    }
};
613
/*
 * Migration description of TimersState, registered in cpu_ticks_init().
 * cpu_clock_offset is declared with version 2; the icount fields travel
 * in the icount_vmstate_timers subsection.
 */
static const VMStateDescription vmstate_timers = {
    .name = "timer",
    .version_id = 2,
    .minimum_version_id = 1,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(cpu_ticks_offset, TimersState),
        VMSTATE_INT64(dummy, TimersState),
        VMSTATE_INT64_V(cpu_clock_offset, TimersState, 2),
        VMSTATE_END_OF_LIST()
    },
    .subsections = (const VMStateDescription*[]) {
        &icount_vmstate_timers,
        NULL
    }
};
629
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100630static void cpu_throttle_thread(CPUState *cpu, run_on_cpu_data opaque)
Jason J. Herne2adcc852015-09-08 13:12:33 -0400631{
Jason J. Herne2adcc852015-09-08 13:12:33 -0400632 double pct;
633 double throttle_ratio;
634 long sleeptime_ns;
635
636 if (!cpu_throttle_get_percentage()) {
637 return;
638 }
639
640 pct = (double)cpu_throttle_get_percentage()/100;
641 throttle_ratio = pct / (1 - pct);
642 sleeptime_ns = (long)(throttle_ratio * CPU_THROTTLE_TIMESLICE_NS);
643
644 qemu_mutex_unlock_iothread();
645 atomic_set(&cpu->throttle_thread_scheduled, 0);
646 g_usleep(sleeptime_ns / 1000); /* Convert ns to us for usleep call */
647 qemu_mutex_lock_iothread();
648}
649
650static void cpu_throttle_timer_tick(void *opaque)
651{
652 CPUState *cpu;
653 double pct;
654
655 /* Stop the timer if needed */
656 if (!cpu_throttle_get_percentage()) {
657 return;
658 }
659 CPU_FOREACH(cpu) {
660 if (!atomic_xchg(&cpu->throttle_thread_scheduled, 1)) {
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100661 async_run_on_cpu(cpu, cpu_throttle_thread,
662 RUN_ON_CPU_NULL);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400663 }
664 }
665
666 pct = (double)cpu_throttle_get_percentage()/100;
667 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
668 CPU_THROTTLE_TIMESLICE_NS / (1-pct));
669}
670
671void cpu_throttle_set(int new_throttle_pct)
672{
673 /* Ensure throttle percentage is within valid range */
674 new_throttle_pct = MIN(new_throttle_pct, CPU_THROTTLE_PCT_MAX);
675 new_throttle_pct = MAX(new_throttle_pct, CPU_THROTTLE_PCT_MIN);
676
677 atomic_set(&throttle_percentage, new_throttle_pct);
678
679 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
680 CPU_THROTTLE_TIMESLICE_NS);
681}
682
683void cpu_throttle_stop(void)
684{
685 atomic_set(&throttle_percentage, 0);
686}
687
/* Return true while a non-zero throttle percentage is set. */
bool cpu_throttle_active(void)
{
    int pct = cpu_throttle_get_percentage();

    return pct != 0;
}
692
693int cpu_throttle_get_percentage(void)
694{
695 return atomic_read(&throttle_percentage);
696}
697
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400698void cpu_ticks_init(void)
699{
Emilio G. Cotaccdb3c12016-06-08 14:55:20 -0400700 seqlock_init(&timers_state.vm_clock_seqlock);
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400701 vmstate_register(NULL, 0, &vmstate_timers, &timers_state);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400702 throttle_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
703 cpu_throttle_timer_tick, NULL);
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400704}
705
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200706void configure_icount(QemuOpts *opts, Error **errp)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200707{
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200708 const char *option;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200709 char *rem_str = NULL;
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200710
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200711 option = qemu_opt_get(opts, "shift");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200712 if (!option) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200713 if (qemu_opt_get(opts, "align") != NULL) {
714 error_setg(errp, "Please specify shift option when using align");
715 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200716 return;
717 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200718
719 icount_sleep = qemu_opt_get_bool(opts, "sleep", true);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200720 if (icount_sleep) {
721 icount_warp_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300722 icount_timer_cb, NULL);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200723 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200724
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200725 icount_align_option = qemu_opt_get_bool(opts, "align", false);
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200726
727 if (icount_align_option && !icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500728 error_setg(errp, "align=on and sleep=off are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200729 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200730 if (strcmp(option, "auto") != 0) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200731 errno = 0;
732 icount_time_shift = strtol(option, &rem_str, 0);
733 if (errno != 0 || *rem_str != '\0' || !strlen(option)) {
734 error_setg(errp, "icount: Invalid shift value");
735 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200736 use_icount = 1;
737 return;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200738 } else if (icount_align_option) {
739 error_setg(errp, "shift=auto and align=on are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200740 } else if (!icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500741 error_setg(errp, "shift=auto and sleep=off are incompatible");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200742 }
743
744 use_icount = 2;
745
746 /* 125MIPS seems a reasonable initial guess at the guest speed.
747 It will be corrected fairly quickly anyway. */
748 icount_time_shift = 3;
749
750 /* Have both realtime and virtual time triggers for speed adjustment.
751 The realtime trigger catches emulated time passing too slowly,
752 the virtual time trigger catches emulated time passing too fast.
753 Realtime triggers occur even when idle, so use them less frequently
754 than VM triggers. */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300755 icount_rt_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL_RT,
756 icount_adjust_rt, NULL);
Alex Bligh40daca52013-08-21 16:03:02 +0100757 timer_mod(icount_rt_timer,
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300758 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Alex Bligh40daca52013-08-21 16:03:02 +0100759 icount_vm_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
760 icount_adjust_vm, NULL);
761 timer_mod(icount_vm_timer,
762 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530763 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200764}
765
766/***********************************************************/
/* TCG vCPU kick timer
 *
 * The kick timer is responsible for moving single threaded vCPU
 * emulation on to the next vCPU. If more than one vCPU is running a
 * timer event will force a cpu->exit so the next vCPU can get
 * scheduled.
 *
 * The timer is removed if all vCPUs are idle and restarted again once
 * idleness is complete.
 */
777
778static QEMUTimer *tcg_kick_vcpu_timer;
Alex Bennée791158d2017-02-23 18:29:10 +0000779static CPUState *tcg_current_rr_cpu;
Alex Bennée65467062017-02-23 18:29:09 +0000780
781#define TCG_KICK_PERIOD (NANOSECONDS_PER_SECOND / 10)
782
783static inline int64_t qemu_tcg_next_kick(void)
784{
785 return qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + TCG_KICK_PERIOD;
786}
787
Alex Bennée791158d2017-02-23 18:29:10 +0000788/* Kick the currently round-robin scheduled vCPU */
789static void qemu_cpu_kick_rr_cpu(void)
790{
791 CPUState *cpu;
Alex Bennée791158d2017-02-23 18:29:10 +0000792 do {
793 cpu = atomic_mb_read(&tcg_current_rr_cpu);
794 if (cpu) {
795 cpu_exit(cpu);
796 }
797 } while (cpu != atomic_mb_read(&tcg_current_rr_cpu));
798}
799
Alex Bennée65467062017-02-23 18:29:09 +0000800static void kick_tcg_thread(void *opaque)
801{
802 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
Alex Bennée791158d2017-02-23 18:29:10 +0000803 qemu_cpu_kick_rr_cpu();
Alex Bennée65467062017-02-23 18:29:09 +0000804}
805
806static void start_tcg_kick_timer(void)
807{
Alex Bennée37257942017-02-23 18:29:14 +0000808 if (!mttcg_enabled && !tcg_kick_vcpu_timer && CPU_NEXT(first_cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +0000809 tcg_kick_vcpu_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
810 kick_tcg_thread, NULL);
811 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
812 }
813}
814
815static void stop_tcg_kick_timer(void)
816{
817 if (tcg_kick_vcpu_timer) {
818 timer_del(tcg_kick_vcpu_timer);
819 tcg_kick_vcpu_timer = NULL;
820 }
821}
822
Alex Bennée65467062017-02-23 18:29:09 +0000823/***********************************************************/
Blue Swirl296af7c2010-03-29 19:23:50 +0000824void hw_error(const char *fmt, ...)
825{
826 va_list ap;
Andreas Färber55e5c282012-12-17 06:18:02 +0100827 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000828
829 va_start(ap, fmt);
830 fprintf(stderr, "qemu: hardware error: ");
831 vfprintf(stderr, fmt, ap);
832 fprintf(stderr, "\n");
Andreas Färberbdc44642013-06-24 23:50:24 +0200833 CPU_FOREACH(cpu) {
Andreas Färber55e5c282012-12-17 06:18:02 +0100834 fprintf(stderr, "CPU #%d:\n", cpu->cpu_index);
Andreas Färber878096e2013-05-27 01:33:50 +0200835 cpu_dump_state(cpu, stderr, fprintf, CPU_DUMP_FPU);
Blue Swirl296af7c2010-03-29 19:23:50 +0000836 }
837 va_end(ap);
838 abort();
839}
840
841void cpu_synchronize_all_states(void)
842{
Andreas Färber182735e2013-05-29 22:29:20 +0200843 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000844
Andreas Färberbdc44642013-06-24 23:50:24 +0200845 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200846 cpu_synchronize_state(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000847 }
848}
849
850void cpu_synchronize_all_post_reset(void)
851{
Andreas Färber182735e2013-05-29 22:29:20 +0200852 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000853
Andreas Färberbdc44642013-06-24 23:50:24 +0200854 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200855 cpu_synchronize_post_reset(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000856 }
857}
858
859void cpu_synchronize_all_post_init(void)
860{
Andreas Färber182735e2013-05-29 22:29:20 +0200861 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000862
Andreas Färberbdc44642013-06-24 23:50:24 +0200863 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200864 cpu_synchronize_post_init(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000865 }
866}
867
Kevin Wolf56983462013-07-05 13:49:54 +0200868static int do_vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +0000869{
Kevin Wolf56983462013-07-05 13:49:54 +0200870 int ret = 0;
871
Luiz Capitulino13548692011-07-29 15:36:43 -0300872 if (runstate_is_running()) {
Blue Swirl296af7c2010-03-29 19:23:50 +0000873 cpu_disable_ticks();
Blue Swirl296af7c2010-03-29 19:23:50 +0000874 pause_all_vcpus();
Luiz Capitulinof5bbfba2011-07-29 15:04:45 -0300875 runstate_set(state);
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -0300876 vm_state_notify(0, state);
Wenchao Xiaa4e15de2014-06-18 08:43:36 +0200877 qapi_event_send_stop(&error_abort);
Blue Swirl296af7c2010-03-29 19:23:50 +0000878 }
Kevin Wolf56983462013-07-05 13:49:54 +0200879
Kevin Wolf594a45c2013-07-18 14:52:19 +0200880 bdrv_drain_all();
Pavel Dovgalyuk6d0ceb82016-09-26 11:08:16 +0300881 replay_disable_events();
John Snow22af08e2016-09-22 21:45:51 -0400882 ret = bdrv_flush_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +0200883
Kevin Wolf56983462013-07-05 13:49:54 +0200884 return ret;
Blue Swirl296af7c2010-03-29 19:23:50 +0000885}
886
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200887static bool cpu_can_run(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +0000888{
Andreas Färber4fdeee72012-05-02 23:10:09 +0200889 if (cpu->stop) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200890 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100891 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +0800892 if (cpu_is_stopped(cpu)) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200893 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100894 }
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200895 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +0000896}
897
Andreas Färber91325042013-05-27 02:07:49 +0200898static void cpu_handle_guest_debug(CPUState *cpu)
Jan Kiszka3c638d02010-06-25 16:56:56 +0200899{
Andreas Färber64f6b342013-05-27 02:06:09 +0200900 gdb_set_stop_cpu(cpu);
Jan Kiszka8cf71712011-02-07 12:19:16 +0100901 qemu_system_debug_request();
Andreas Färberf324e762012-05-02 23:26:21 +0200902 cpu->stopped = true;
Jan Kiszka3c638d02010-06-25 16:56:56 +0200903}
904
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100905#ifdef CONFIG_LINUX
906static void sigbus_reraise(void)
907{
908 sigset_t set;
909 struct sigaction action;
910
911 memset(&action, 0, sizeof(action));
912 action.sa_handler = SIG_DFL;
913 if (!sigaction(SIGBUS, &action, NULL)) {
914 raise(SIGBUS);
915 sigemptyset(&set);
916 sigaddset(&set, SIGBUS);
Peter Maydella2d17612016-05-16 18:33:59 +0100917 pthread_sigmask(SIG_UNBLOCK, &set, NULL);
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100918 }
919 perror("Failed to re-raise SIGBUS!\n");
920 abort();
921}
922
Paolo Bonzinid98d4072017-02-08 13:22:12 +0100923static void sigbus_handler(int n, siginfo_t *siginfo, void *ctx)
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100924{
Paolo Bonzinid98d4072017-02-08 13:22:12 +0100925 if (kvm_on_sigbus(siginfo->si_code, siginfo->si_addr)) {
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100926 sigbus_reraise();
927 }
928}
929
930static void qemu_init_sigbus(void)
931{
932 struct sigaction action;
933
934 memset(&action, 0, sizeof(action));
935 action.sa_flags = SA_SIGINFO;
Paolo Bonzinid98d4072017-02-08 13:22:12 +0100936 action.sa_sigaction = sigbus_handler;
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100937 sigaction(SIGBUS, &action, NULL);
938
939 prctl(PR_MCE_KILL, PR_MCE_KILL_SET, PR_MCE_KILL_EARLY, 0, 0);
940}
941
Andreas Färber290adf32013-01-17 09:30:27 +0100942static void qemu_kvm_eat_signals(CPUState *cpu)
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100943{
944 struct timespec ts = { 0, 0 };
945 siginfo_t siginfo;
946 sigset_t waitset;
947 sigset_t chkset;
948 int r;
949
950 sigemptyset(&waitset);
951 sigaddset(&waitset, SIG_IPI);
952 sigaddset(&waitset, SIGBUS);
953
954 do {
955 r = sigtimedwait(&waitset, &siginfo, &ts);
956 if (r == -1 && !(errno == EAGAIN || errno == EINTR)) {
957 perror("sigtimedwait");
958 exit(1);
959 }
960
961 switch (r) {
962 case SIGBUS:
Andreas Färber290adf32013-01-17 09:30:27 +0100963 if (kvm_on_sigbus_vcpu(cpu, siginfo.si_code, siginfo.si_addr)) {
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100964 sigbus_reraise();
965 }
966 break;
967 default:
968 break;
969 }
970
971 r = sigpending(&chkset);
972 if (r == -1) {
973 perror("sigpending");
974 exit(1);
975 }
976 } while (sigismember(&chkset, SIG_IPI) || sigismember(&chkset, SIGBUS));
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100977}
978
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100979#else /* !CONFIG_LINUX */
980
/* Without CONFIG_LINUX there is no SIGBUS set-up to do. */
static void qemu_init_sigbus(void)
{
    /* intentionally empty */
}
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100984
Andreas Färber290adf32013-01-17 09:30:27 +0100985static void qemu_kvm_eat_signals(CPUState *cpu)
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100986{
987}
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100988#endif /* !CONFIG_LINUX */
989
Blue Swirl296af7c2010-03-29 19:23:50 +0000990#ifndef _WIN32
/* Signal handler that does nothing; @sig is ignored. */
static void dummy_signal(int sig)
{
    /* intentionally empty */
}
994
Andreas Färber13618e02013-05-26 23:41:00 +0200995static void qemu_kvm_init_cpu_signals(CPUState *cpu)
Paolo Bonzini714bd042011-03-12 17:44:06 +0100996{
997 int r;
998 sigset_t set;
999 struct sigaction sigact;
1000
1001 memset(&sigact, 0, sizeof(sigact));
1002 sigact.sa_handler = dummy_signal;
1003 sigaction(SIG_IPI, &sigact, NULL);
1004
Paolo Bonzini714bd042011-03-12 17:44:06 +01001005 pthread_sigmask(SIG_BLOCK, NULL, &set);
1006 sigdelset(&set, SIG_IPI);
1007 sigdelset(&set, SIGBUS);
Andreas Färber491d6e82013-05-26 23:38:10 +02001008 r = kvm_set_signal_mask(cpu, &set);
Paolo Bonzini714bd042011-03-12 17:44:06 +01001009 if (r) {
1010 fprintf(stderr, "kvm_set_signal_mask: %s\n", strerror(-r));
1011 exit(1);
1012 }
Paolo Bonzini714bd042011-03-12 17:44:06 +01001013}
1014
Jan Kiszka55f8d6a2011-02-01 22:15:52 +01001015#else /* _WIN32 */
Andreas Färber13618e02013-05-26 23:41:00 +02001016static void qemu_kvm_init_cpu_signals(CPUState *cpu)
Paolo Bonzini714bd042011-03-12 17:44:06 +01001017{
1018 abort();
1019}
Jan Kiszka55f8d6a2011-02-01 22:15:52 +01001020#endif /* _WIN32 */
Blue Swirl296af7c2010-03-29 19:23:50 +00001021
Stefan Weilb2532d82012-09-27 07:41:42 +02001022static QemuMutex qemu_global_mutex;
Blue Swirl296af7c2010-03-29 19:23:50 +00001023
1024static QemuThread io_thread;
1025
Blue Swirl296af7c2010-03-29 19:23:50 +00001026/* cpu creation */
1027static QemuCond qemu_cpu_cond;
1028/* system init */
Blue Swirl296af7c2010-03-29 19:23:50 +00001029static QemuCond qemu_pause_cond;
1030
Paolo Bonzinid3b12f52011-09-13 10:30:52 +02001031void qemu_init_cpu_loop(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001032{
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001033 qemu_init_sigbus();
Anthony Liguoried945922011-02-08 18:18:18 +01001034 qemu_cond_init(&qemu_cpu_cond);
Anthony Liguoried945922011-02-08 18:18:18 +01001035 qemu_cond_init(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001036 qemu_mutex_init(&qemu_global_mutex);
Blue Swirl296af7c2010-03-29 19:23:50 +00001037
Jan Kiszkab7680cb2011-03-12 17:43:51 +01001038 qemu_thread_get_self(&io_thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001039}
1040
Paolo Bonzini14e6fe12016-10-31 10:36:08 +01001041void run_on_cpu(CPUState *cpu, run_on_cpu_func func, run_on_cpu_data data)
Marcelo Tosattie82bcec2010-05-04 09:45:22 -03001042{
Sergey Fedorovd148d902016-08-29 09:51:00 +02001043 do_run_on_cpu(cpu, func, data, &qemu_global_mutex);
Chegu Vinod3c022702013-06-24 03:49:41 -06001044}
1045
Gu Zheng4c055ab2016-05-12 09:18:13 +05301046static void qemu_kvm_destroy_vcpu(CPUState *cpu)
1047{
1048 if (kvm_destroy_vcpu(cpu) < 0) {
1049 error_report("kvm_destroy_vcpu failed");
1050 exit(EXIT_FAILURE);
1051 }
1052}
1053
1054static void qemu_tcg_destroy_vcpu(CPUState *cpu)
1055{
1056}
1057
Andreas Färber509a0d72012-05-03 02:18:09 +02001058static void qemu_wait_io_event_common(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001059{
Alex Bennée37257942017-02-23 18:29:14 +00001060 atomic_mb_set(&cpu->thread_kicked, false);
Andreas Färber4fdeee72012-05-02 23:10:09 +02001061 if (cpu->stop) {
1062 cpu->stop = false;
Andreas Färberf324e762012-05-02 23:26:21 +02001063 cpu->stopped = true;
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001064 qemu_cond_broadcast(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001065 }
Sergey Fedorova5403c62016-08-02 18:27:36 +01001066 process_queued_cpu_work(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001067}
1068
1069static bool qemu_tcg_should_sleep(CPUState *cpu)
1070{
1071 if (mttcg_enabled) {
1072 return cpu_thread_is_idle(cpu);
1073 } else {
1074 return all_cpu_threads_idle();
1075 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001076}
1077
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001078static void qemu_tcg_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001079{
Alex Bennée37257942017-02-23 18:29:14 +00001080 while (qemu_tcg_should_sleep(cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +00001081 stop_tcg_kick_timer();
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001082 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001083 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001084
Alex Bennée65467062017-02-23 18:29:09 +00001085 start_tcg_kick_timer();
1086
Alex Bennée37257942017-02-23 18:29:14 +00001087 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001088}
1089
Andreas Färberfd529e82013-05-26 23:24:55 +02001090static void qemu_kvm_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001091{
Andreas Färbera98ae1d2013-05-26 23:21:08 +02001092 while (cpu_thread_is_idle(cpu)) {
Andreas Färberf5c121b2012-05-03 01:22:49 +02001093 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001094 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001095
Andreas Färber290adf32013-01-17 09:30:27 +01001096 qemu_kvm_eat_signals(cpu);
Andreas Färber509a0d72012-05-03 02:18:09 +02001097 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001098}
1099
Jan Kiszka7e97cd82011-02-07 12:19:12 +01001100static void *qemu_kvm_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001101{
Andreas Färber48a106b2013-05-27 02:20:39 +02001102 CPUState *cpu = arg;
Jan Kiszka84b49152011-02-01 22:15:50 +01001103 int r;
Blue Swirl296af7c2010-03-29 19:23:50 +00001104
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001105 rcu_register_thread();
1106
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001107 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001108 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001109 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001110 cpu->can_do_io = 1;
Andreas Färber4917cf42013-05-27 05:17:50 +02001111 current_cpu = cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001112
Andreas Färber504134d2012-12-17 06:38:45 +01001113 r = kvm_init_vcpu(cpu);
Jan Kiszka84b49152011-02-01 22:15:50 +01001114 if (r < 0) {
1115 fprintf(stderr, "kvm_init_vcpu failed: %s\n", strerror(-r));
1116 exit(1);
1117 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001118
Andreas Färber13618e02013-05-26 23:41:00 +02001119 qemu_kvm_init_cpu_signals(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001120
1121 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001122 cpu->created = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001123 qemu_cond_signal(&qemu_cpu_cond);
1124
Gu Zheng4c055ab2016-05-12 09:18:13 +05301125 do {
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001126 if (cpu_can_run(cpu)) {
Andreas Färber1458c362013-05-26 23:46:55 +02001127 r = kvm_cpu_exec(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001128 if (r == EXCP_DEBUG) {
Andreas Färber91325042013-05-27 02:07:49 +02001129 cpu_handle_guest_debug(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001130 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001131 }
Andreas Färberfd529e82013-05-26 23:24:55 +02001132 qemu_kvm_wait_io_event(cpu);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301133 } while (!cpu->unplug || cpu_can_run(cpu));
Blue Swirl296af7c2010-03-29 19:23:50 +00001134
Gu Zheng4c055ab2016-05-12 09:18:13 +05301135 qemu_kvm_destroy_vcpu(cpu);
Bharata B Rao2c579042016-05-12 09:18:14 +05301136 cpu->created = false;
1137 qemu_cond_signal(&qemu_cpu_cond);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301138 qemu_mutex_unlock_iothread();
Blue Swirl296af7c2010-03-29 19:23:50 +00001139 return NULL;
1140}
1141
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001142static void *qemu_dummy_cpu_thread_fn(void *arg)
1143{
1144#ifdef _WIN32
1145 fprintf(stderr, "qtest is not supported under Windows\n");
1146 exit(1);
1147#else
Andreas Färber10a90212013-05-27 02:24:35 +02001148 CPUState *cpu = arg;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001149 sigset_t waitset;
1150 int r;
1151
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001152 rcu_register_thread();
1153
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001154 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001155 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001156 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001157 cpu->can_do_io = 1;
Alex Bennée37257942017-02-23 18:29:14 +00001158 current_cpu = cpu;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001159
1160 sigemptyset(&waitset);
1161 sigaddset(&waitset, SIG_IPI);
1162
1163 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001164 cpu->created = true;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001165 qemu_cond_signal(&qemu_cpu_cond);
1166
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001167 while (1) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001168 qemu_mutex_unlock_iothread();
1169 do {
1170 int sig;
1171 r = sigwait(&waitset, &sig);
1172 } while (r == -1 && (errno == EAGAIN || errno == EINTR));
1173 if (r == -1) {
1174 perror("sigwait");
1175 exit(1);
1176 }
1177 qemu_mutex_lock_iothread();
Andreas Färber509a0d72012-05-03 02:18:09 +02001178 qemu_wait_io_event_common(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001179 }
1180
1181 return NULL;
1182#endif
1183}
1184
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001185static int64_t tcg_get_icount_limit(void)
1186{
1187 int64_t deadline;
1188
1189 if (replay_mode != REPLAY_MODE_PLAY) {
1190 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1191
1192 /* Maintain prior (possibly buggy) behaviour where if no deadline
1193 * was set (as there is no QEMU_CLOCK_VIRTUAL timer) or it is more than
1194 * INT32_MAX nanoseconds ahead, we still use INT32_MAX
1195 * nanoseconds.
1196 */
1197 if ((deadline < 0) || (deadline > INT32_MAX)) {
1198 deadline = INT32_MAX;
1199 }
1200
1201 return qemu_icount_round(deadline);
1202 } else {
1203 return replay_get_instructions();
1204 }
1205}
1206
Alex Bennée12e97002016-10-27 16:10:14 +01001207static void handle_icount_deadline(void)
1208{
1209 if (use_icount) {
1210 int64_t deadline =
1211 qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1212
1213 if (deadline == 0) {
1214 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
1215 }
1216 }
1217}
1218
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001219static int tcg_cpu_exec(CPUState *cpu)
1220{
1221 int ret;
1222#ifdef CONFIG_PROFILER
1223 int64_t ti;
1224#endif
1225
1226#ifdef CONFIG_PROFILER
1227 ti = profile_getclock();
1228#endif
1229 if (use_icount) {
1230 int64_t count;
1231 int decr;
1232 timers_state.qemu_icount -= (cpu->icount_decr.u16.low
1233 + cpu->icount_extra);
1234 cpu->icount_decr.u16.low = 0;
1235 cpu->icount_extra = 0;
1236 count = tcg_get_icount_limit();
1237 timers_state.qemu_icount += count;
1238 decr = (count > 0xffff) ? 0xffff : count;
1239 count -= decr;
1240 cpu->icount_decr.u16.low = decr;
1241 cpu->icount_extra = count;
1242 }
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001243 qemu_mutex_unlock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001244 cpu_exec_start(cpu);
1245 ret = cpu_exec(cpu);
1246 cpu_exec_end(cpu);
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001247 qemu_mutex_lock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001248#ifdef CONFIG_PROFILER
1249 tcg_time += profile_getclock() - ti;
1250#endif
1251 if (use_icount) {
1252 /* Fold pending instructions back into the
1253 instruction counter, and clear the interrupt flag. */
1254 timers_state.qemu_icount -= (cpu->icount_decr.u16.low
1255 + cpu->icount_extra);
1256 cpu->icount_decr.u32 = 0;
1257 cpu->icount_extra = 0;
1258 replay_account_executed_instructions();
1259 }
1260 return ret;
1261}
1262
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001263/* Destroy any remaining vCPUs which have been unplugged and have
1264 * finished running
1265 */
1266static void deal_with_unplugged_cpus(void)
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001267{
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001268 CPUState *cpu;
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001269
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001270 CPU_FOREACH(cpu) {
1271 if (cpu->unplug && !cpu_can_run(cpu)) {
1272 qemu_tcg_destroy_vcpu(cpu);
1273 cpu->created = false;
1274 qemu_cond_signal(&qemu_cpu_cond);
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001275 break;
1276 }
1277 }
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001278}
Jan Kiszkabdb7ca62011-09-26 09:40:39 +02001279
Alex Bennée65467062017-02-23 18:29:09 +00001280/* Single-threaded TCG
1281 *
1282 * In the single-threaded case each vCPU is simulated in turn. If
1283 * there is more than a single vCPU we create a simple timer to kick
1284 * the vCPU and ensure we don't get stuck in a tight loop in one vCPU.
1285 * This is done explicitly rather than relying on side-effects
1286 * elsewhere.
1287 */
1288
Alex Bennée37257942017-02-23 18:29:14 +00001289static void *qemu_tcg_rr_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001290{
Andreas Färberc3586ba2012-05-03 01:41:24 +02001291 CPUState *cpu = arg;
Blue Swirl296af7c2010-03-29 19:23:50 +00001292
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001293 rcu_register_thread();
1294
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001295 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001296 qemu_thread_get_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001297
Andreas Färber38fcbd32013-07-07 19:50:23 +02001298 CPU_FOREACH(cpu) {
1299 cpu->thread_id = qemu_get_thread_id();
1300 cpu->created = true;
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001301 cpu->can_do_io = 1;
Andreas Färber38fcbd32013-07-07 19:50:23 +02001302 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001303 qemu_cond_signal(&qemu_cpu_cond);
1304
Jan Kiszkafa7d1862011-08-22 18:35:25 +02001305 /* wait for initial kick-off after machine start */
Emilio G. Cotac28e3992015-04-27 12:45:28 -04001306 while (first_cpu->stopped) {
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001307 qemu_cond_wait(first_cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001308
1309 /* process any pending work */
Andreas Färberbdc44642013-06-24 23:50:24 +02001310 CPU_FOREACH(cpu) {
Alex Bennée37257942017-02-23 18:29:14 +00001311 current_cpu = cpu;
Andreas Färber182735e2013-05-29 22:29:20 +02001312 qemu_wait_io_event_common(cpu);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001313 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001314 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001315
Alex Bennée65467062017-02-23 18:29:09 +00001316 start_tcg_kick_timer();
1317
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001318 cpu = first_cpu;
1319
Alex Bennéee5143e32017-02-23 18:29:12 +00001320 /* process any pending work */
1321 cpu->exit_request = 1;
1322
Blue Swirl296af7c2010-03-29 19:23:50 +00001323 while (1) {
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001324 /* Account partial waits to QEMU_CLOCK_VIRTUAL. */
1325 qemu_account_warp_timer();
1326
1327 if (!cpu) {
1328 cpu = first_cpu;
1329 }
1330
Alex Bennéee5143e32017-02-23 18:29:12 +00001331 while (cpu && !cpu->queued_work_first && !cpu->exit_request) {
1332
Alex Bennée791158d2017-02-23 18:29:10 +00001333 atomic_mb_set(&tcg_current_rr_cpu, cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001334 current_cpu = cpu;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001335
1336 qemu_clock_enable(QEMU_CLOCK_VIRTUAL,
1337 (cpu->singlestep_enabled & SSTEP_NOTIMER) == 0);
1338
1339 if (cpu_can_run(cpu)) {
1340 int r;
1341 r = tcg_cpu_exec(cpu);
1342 if (r == EXCP_DEBUG) {
1343 cpu_handle_guest_debug(cpu);
1344 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001345 } else if (r == EXCP_ATOMIC) {
1346 qemu_mutex_unlock_iothread();
1347 cpu_exec_step_atomic(cpu);
1348 qemu_mutex_lock_iothread();
1349 break;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001350 }
Alex Bennée37257942017-02-23 18:29:14 +00001351 } else if (cpu->stop) {
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001352 if (cpu->unplug) {
1353 cpu = CPU_NEXT(cpu);
1354 }
1355 break;
1356 }
1357
Alex Bennéee5143e32017-02-23 18:29:12 +00001358 cpu = CPU_NEXT(cpu);
1359 } /* while (cpu && !cpu->exit_request).. */
1360
Alex Bennée791158d2017-02-23 18:29:10 +00001361 /* Does not need atomic_mb_set because a spurious wakeup is okay. */
1362 atomic_set(&tcg_current_rr_cpu, NULL);
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001363
Alex Bennéee5143e32017-02-23 18:29:12 +00001364 if (cpu && cpu->exit_request) {
1365 atomic_mb_set(&cpu->exit_request, 0);
1366 }
Alex Blighac70aaf2013-08-21 16:02:57 +01001367
Alex Bennée12e97002016-10-27 16:10:14 +01001368 handle_icount_deadline();
Alex Blighac70aaf2013-08-21 16:02:57 +01001369
Alex Bennée37257942017-02-23 18:29:14 +00001370 qemu_tcg_wait_io_event(cpu ? cpu : QTAILQ_FIRST(&cpus));
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001371 deal_with_unplugged_cpus();
Blue Swirl296af7c2010-03-29 19:23:50 +00001372 }
1373
1374 return NULL;
1375}
1376
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001377static void *qemu_hax_cpu_thread_fn(void *arg)
1378{
1379 CPUState *cpu = arg;
1380 int r;
1381 qemu_thread_get_self(cpu->thread);
1382 qemu_mutex_lock(&qemu_global_mutex);
1383
1384 cpu->thread_id = qemu_get_thread_id();
1385 cpu->created = true;
1386 cpu->halted = 0;
1387 current_cpu = cpu;
1388
1389 hax_init_vcpu(cpu);
1390 qemu_cond_signal(&qemu_cpu_cond);
1391
1392 while (1) {
1393 if (cpu_can_run(cpu)) {
1394 r = hax_smp_cpu_exec(cpu);
1395 if (r == EXCP_DEBUG) {
1396 cpu_handle_guest_debug(cpu);
1397 }
1398 }
1399
1400 while (cpu_thread_is_idle(cpu)) {
1401 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
1402 }
1403#ifdef _WIN32
1404 SleepEx(0, TRUE);
1405#endif
1406 qemu_wait_io_event_common(cpu);
1407 }
1408 return NULL;
1409}
1410
1411#ifdef _WIN32
1412static void CALLBACK dummy_apc_func(ULONG_PTR unused)
1413{
1414}
1415#endif
1416
Alex Bennée37257942017-02-23 18:29:14 +00001417/* Multi-threaded TCG
1418 *
1419 * In the multi-threaded case each vCPU has its own thread. The TLS
1420 * variable current_cpu can be used deep in the code to find the
1421 * current CPUState for a given thread.
1422 */
1423
1424static void *qemu_tcg_cpu_thread_fn(void *arg)
1425{
1426 CPUState *cpu = arg;
1427
1428 rcu_register_thread();
1429
1430 qemu_mutex_lock_iothread();
1431 qemu_thread_get_self(cpu->thread);
1432
1433 cpu->thread_id = qemu_get_thread_id();
1434 cpu->created = true;
1435 cpu->can_do_io = 1;
1436 current_cpu = cpu;
1437 qemu_cond_signal(&qemu_cpu_cond);
1438
1439 /* process any pending work */
1440 cpu->exit_request = 1;
1441
1442 while (1) {
1443 if (cpu_can_run(cpu)) {
1444 int r;
1445 r = tcg_cpu_exec(cpu);
1446 switch (r) {
1447 case EXCP_DEBUG:
1448 cpu_handle_guest_debug(cpu);
1449 break;
1450 case EXCP_HALTED:
1451 /* during start-up the vCPU is reset and the thread is
1452 * kicked several times. If we don't ensure we go back
1453 * to sleep in the halted state we won't cleanly
1454 * start-up when the vCPU is enabled.
1455 *
1456 * cpu->halted should ensure we sleep in wait_io_event
1457 */
1458 g_assert(cpu->halted);
1459 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001460 case EXCP_ATOMIC:
1461 qemu_mutex_unlock_iothread();
1462 cpu_exec_step_atomic(cpu);
1463 qemu_mutex_lock_iothread();
Alex Bennée37257942017-02-23 18:29:14 +00001464 default:
1465 /* Ignore everything else? */
1466 break;
1467 }
1468 }
1469
1470 handle_icount_deadline();
1471
1472 atomic_mb_set(&cpu->exit_request, 0);
1473 qemu_tcg_wait_io_event(cpu);
1474 }
1475
1476 return NULL;
1477}
1478
Andreas Färber2ff09a42012-05-03 00:23:30 +02001479static void qemu_cpu_kick_thread(CPUState *cpu)
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001480{
1481#ifndef _WIN32
1482 int err;
1483
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001484 if (cpu->thread_kicked) {
1485 return;
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001486 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001487 cpu->thread_kicked = true;
Andreas Färber814e6122012-05-02 17:00:37 +02001488 err = pthread_kill(cpu->thread->thread, SIG_IPI);
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001489 if (err) {
1490 fprintf(stderr, "qemu:%s: %s", __func__, strerror(err));
1491 exit(1);
1492 }
1493#else /* _WIN32 */
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001494 if (!qemu_cpu_is_self(cpu)) {
1495 if (!QueueUserAPC(dummy_apc_func, cpu->hThread, 0)) {
1496 fprintf(stderr, "%s: QueueUserAPC failed with error %lu\n",
1497 __func__, GetLastError());
1498 exit(1);
1499 }
1500 }
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001501#endif
1502}
1503
Andreas Färberc08d7422012-05-03 04:34:15 +02001504void qemu_cpu_kick(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001505{
Andreas Färberf5c121b2012-05-03 01:22:49 +02001506 qemu_cond_broadcast(cpu->halt_cond);
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001507 if (tcg_enabled()) {
Alex Bennée791158d2017-02-23 18:29:10 +00001508 cpu_exit(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001509 /* NOP unless doing single-thread RR */
Alex Bennée791158d2017-02-23 18:29:10 +00001510 qemu_cpu_kick_rr_cpu();
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001511 } else {
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001512 if (hax_enabled()) {
1513 /*
1514 * FIXME: race condition with the exit_request check in
1515 * hax_vcpu_hax_exec
1516 */
1517 cpu->exit_request = 1;
1518 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001519 qemu_cpu_kick_thread(cpu);
1520 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001521}
1522
Jan Kiszka46d62fa2011-02-01 22:15:59 +01001523void qemu_cpu_kick_self(void)
1524{
Andreas Färber4917cf42013-05-27 05:17:50 +02001525 assert(current_cpu);
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001526 qemu_cpu_kick_thread(current_cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001527}
1528
Andreas Färber60e82572012-05-02 22:23:49 +02001529bool qemu_cpu_is_self(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001530{
Andreas Färber814e6122012-05-02 17:00:37 +02001531 return qemu_thread_is_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001532}
1533
Paolo Bonzini79e2b9a2015-01-21 12:09:14 +01001534bool qemu_in_vcpu_thread(void)
Juan Quintelaaa723c22012-09-18 16:30:11 +02001535{
Andreas Färber4917cf42013-05-27 05:17:50 +02001536 return current_cpu && qemu_cpu_is_self(current_cpu);
Juan Quintelaaa723c22012-09-18 16:30:11 +02001537}
1538
/*
 * Per-thread flag tracking whether this thread took the iothread lock
 * through qemu_mutex_lock_iothread().  Objects with thread storage
 * duration start out zeroed, i.e. false.
 */
static __thread bool iothread_locked;

/* Return the calling thread's view of the iothread lock state. */
bool qemu_mutex_iothread_locked(void)
{
    bool held = iothread_locked;

    return held;
}
1545
Blue Swirl296af7c2010-03-29 19:23:50 +00001546void qemu_mutex_lock_iothread(void)
1547{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001548 g_assert(!qemu_mutex_iothread_locked());
1549 qemu_mutex_lock(&qemu_global_mutex);
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001550 iothread_locked = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001551}
1552
1553void qemu_mutex_unlock_iothread(void)
1554{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001555 g_assert(qemu_mutex_iothread_locked());
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001556 iothread_locked = false;
Blue Swirl296af7c2010-03-29 19:23:50 +00001557 qemu_mutex_unlock(&qemu_global_mutex);
1558}
1559
Alex Bennéee8faee02016-10-27 16:09:58 +01001560static bool all_vcpus_paused(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001561{
Andreas Färberbdc44642013-06-24 23:50:24 +02001562 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001563
Andreas Färberbdc44642013-06-24 23:50:24 +02001564 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001565 if (!cpu->stopped) {
Alex Bennéee8faee02016-10-27 16:09:58 +01001566 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001567 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001568 }
1569
Alex Bennéee8faee02016-10-27 16:09:58 +01001570 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001571}
1572
1573void pause_all_vcpus(void)
1574{
Andreas Färberbdc44642013-06-24 23:50:24 +02001575 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001576
Alex Bligh40daca52013-08-21 16:03:02 +01001577 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, false);
Andreas Färberbdc44642013-06-24 23:50:24 +02001578 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001579 cpu->stop = true;
1580 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001581 }
1582
Juan Quintelaaa723c22012-09-18 16:30:11 +02001583 if (qemu_in_vcpu_thread()) {
Jan Kiszkad798e972012-02-17 18:31:16 +01001584 cpu_stop_current();
Jan Kiszkad798e972012-02-17 18:31:16 +01001585 }
1586
Blue Swirl296af7c2010-03-29 19:23:50 +00001587 while (!all_vcpus_paused()) {
Paolo Bonzinibe7d6c52011-03-12 17:44:02 +01001588 qemu_cond_wait(&qemu_pause_cond, &qemu_global_mutex);
Andreas Färberbdc44642013-06-24 23:50:24 +02001589 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001590 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001591 }
1592 }
1593}
1594
Igor Mammedov29936832013-04-23 10:29:37 +02001595void cpu_resume(CPUState *cpu)
1596{
1597 cpu->stop = false;
1598 cpu->stopped = false;
1599 qemu_cpu_kick(cpu);
1600}
1601
Blue Swirl296af7c2010-03-29 19:23:50 +00001602void resume_all_vcpus(void)
1603{
Andreas Färberbdc44642013-06-24 23:50:24 +02001604 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001605
Alex Bligh40daca52013-08-21 16:03:02 +01001606 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, true);
Andreas Färberbdc44642013-06-24 23:50:24 +02001607 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001608 cpu_resume(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001609 }
1610}
1611
Gu Zheng4c055ab2016-05-12 09:18:13 +05301612void cpu_remove(CPUState *cpu)
1613{
1614 cpu->stop = true;
1615 cpu->unplug = true;
1616 qemu_cpu_kick(cpu);
1617}
1618
Bharata B Rao2c579042016-05-12 09:18:14 +05301619void cpu_remove_sync(CPUState *cpu)
1620{
1621 cpu_remove(cpu);
1622 while (cpu->created) {
1623 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1624 }
1625}
1626
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001627/* For temporary buffers for forming a name */
1628#define VCPU_THREAD_NAME_SIZE 16
1629
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001630static void qemu_tcg_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001631{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001632 char thread_name[VCPU_THREAD_NAME_SIZE];
Alex Bennée37257942017-02-23 18:29:14 +00001633 static QemuCond *single_tcg_halt_cond;
1634 static QemuThread *single_tcg_cpu_thread;
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001635
Alex Bennée37257942017-02-23 18:29:14 +00001636 if (qemu_tcg_mttcg_enabled() || !single_tcg_cpu_thread) {
Andreas Färber814e6122012-05-02 17:00:37 +02001637 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001638 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1639 qemu_cond_init(cpu->halt_cond);
Alex Bennée37257942017-02-23 18:29:14 +00001640
1641 if (qemu_tcg_mttcg_enabled()) {
1642 /* create a thread per vCPU with TCG (MTTCG) */
1643 parallel_cpus = true;
1644 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/TCG",
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001645 cpu->cpu_index);
Alex Bennée37257942017-02-23 18:29:14 +00001646
1647 qemu_thread_create(cpu->thread, thread_name, qemu_tcg_cpu_thread_fn,
1648 cpu, QEMU_THREAD_JOINABLE);
1649
1650 } else {
1651 /* share a single thread for all cpus with TCG */
1652 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "ALL CPUs/TCG");
1653 qemu_thread_create(cpu->thread, thread_name,
1654 qemu_tcg_rr_cpu_thread_fn,
1655 cpu, QEMU_THREAD_JOINABLE);
1656
1657 single_tcg_halt_cond = cpu->halt_cond;
1658 single_tcg_cpu_thread = cpu->thread;
1659 }
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001660#ifdef _WIN32
Andreas Färber814e6122012-05-02 17:00:37 +02001661 cpu->hThread = qemu_thread_get_handle(cpu->thread);
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001662#endif
Andreas Färber61a46212012-05-02 22:49:36 +02001663 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001664 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001665 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001666 } else {
Alex Bennée37257942017-02-23 18:29:14 +00001667 /* For non-MTTCG cases we share the thread */
1668 cpu->thread = single_tcg_cpu_thread;
1669 cpu->halt_cond = single_tcg_halt_cond;
Blue Swirl296af7c2010-03-29 19:23:50 +00001670 }
1671}
1672
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001673static void qemu_hax_start_vcpu(CPUState *cpu)
1674{
1675 char thread_name[VCPU_THREAD_NAME_SIZE];
1676
1677 cpu->thread = g_malloc0(sizeof(QemuThread));
1678 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1679 qemu_cond_init(cpu->halt_cond);
1680
1681 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/HAX",
1682 cpu->cpu_index);
1683 qemu_thread_create(cpu->thread, thread_name, qemu_hax_cpu_thread_fn,
1684 cpu, QEMU_THREAD_JOINABLE);
1685#ifdef _WIN32
1686 cpu->hThread = qemu_thread_get_handle(cpu->thread);
1687#endif
1688 while (!cpu->created) {
1689 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1690 }
1691}
1692
Andreas Färber48a106b2013-05-27 02:20:39 +02001693static void qemu_kvm_start_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001694{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001695 char thread_name[VCPU_THREAD_NAME_SIZE];
1696
Andreas Färber814e6122012-05-02 17:00:37 +02001697 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001698 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1699 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001700 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/KVM",
1701 cpu->cpu_index);
1702 qemu_thread_create(cpu->thread, thread_name, qemu_kvm_cpu_thread_fn,
1703 cpu, QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001704 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001705 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001706 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001707}
1708
Andreas Färber10a90212013-05-27 02:24:35 +02001709static void qemu_dummy_start_vcpu(CPUState *cpu)
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001710{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001711 char thread_name[VCPU_THREAD_NAME_SIZE];
1712
Andreas Färber814e6122012-05-02 17:00:37 +02001713 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001714 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1715 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001716 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/DUMMY",
1717 cpu->cpu_index);
1718 qemu_thread_create(cpu->thread, thread_name, qemu_dummy_cpu_thread_fn, cpu,
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001719 QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001720 while (!cpu->created) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001721 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1722 }
1723}
1724
Andreas Färberc643bed2013-05-27 03:23:24 +02001725void qemu_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001726{
Andreas Färberce3960e2012-12-17 03:27:07 +01001727 cpu->nr_cores = smp_cores;
1728 cpu->nr_threads = smp_threads;
Andreas Färberf324e762012-05-02 23:26:21 +02001729 cpu->stopped = true;
Peter Maydell56943e82016-01-21 14:15:04 +00001730
1731 if (!cpu->as) {
1732 /* If the target cpu hasn't set up any address spaces itself,
1733 * give it the default one.
1734 */
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001735 AddressSpace *as = address_space_init_shareable(cpu->memory,
1736 "cpu-memory");
Peter Maydell12ebc9a2016-01-21 14:15:04 +00001737 cpu->num_ases = 1;
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001738 cpu_address_space_init(cpu, as, 0);
Peter Maydell56943e82016-01-21 14:15:04 +00001739 }
1740
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001741 if (kvm_enabled()) {
Andreas Färber48a106b2013-05-27 02:20:39 +02001742 qemu_kvm_start_vcpu(cpu);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001743 } else if (hax_enabled()) {
1744 qemu_hax_start_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001745 } else if (tcg_enabled()) {
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001746 qemu_tcg_init_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001747 } else {
Andreas Färber10a90212013-05-27 02:24:35 +02001748 qemu_dummy_start_vcpu(cpu);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001749 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001750}
1751
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001752void cpu_stop_current(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001753{
Andreas Färber4917cf42013-05-27 05:17:50 +02001754 if (current_cpu) {
1755 current_cpu->stop = false;
1756 current_cpu->stopped = true;
1757 cpu_exit(current_cpu);
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001758 qemu_cond_broadcast(&qemu_pause_cond);
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001759 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001760}
1761
Kevin Wolf56983462013-07-05 13:49:54 +02001762int vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +00001763{
Juan Quintelaaa723c22012-09-18 16:30:11 +02001764 if (qemu_in_vcpu_thread()) {
Paolo Bonzini74892d22014-06-05 14:53:58 +02001765 qemu_system_vmstop_request_prepare();
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -03001766 qemu_system_vmstop_request(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001767 /*
1768 * FIXME: should not return to device code in case
1769 * vm_stop() has been requested.
1770 */
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001771 cpu_stop_current();
Kevin Wolf56983462013-07-05 13:49:54 +02001772 return 0;
Blue Swirl296af7c2010-03-29 19:23:50 +00001773 }
Kevin Wolf56983462013-07-05 13:49:54 +02001774
1775 return do_vm_stop(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001776}
1777
Claudio Imbrenda2d76e822017-02-14 18:07:47 +01001778/**
1779 * Prepare for (re)starting the VM.
1780 * Returns -1 if the vCPUs are not to be restarted (e.g. if they are already
1781 * running or in case of an error condition), 0 otherwise.
1782 */
1783int vm_prepare_start(void)
1784{
1785 RunState requested;
1786 int res = 0;
1787
1788 qemu_vmstop_requested(&requested);
1789 if (runstate_is_running() && requested == RUN_STATE__MAX) {
1790 return -1;
1791 }
1792
1793 /* Ensure that a STOP/RESUME pair of events is emitted if a
1794 * vmstop request was pending. The BLOCK_IO_ERROR event, for
1795 * example, according to documentation is always followed by
1796 * the STOP event.
1797 */
1798 if (runstate_is_running()) {
1799 qapi_event_send_stop(&error_abort);
1800 res = -1;
1801 } else {
1802 replay_enable_events();
1803 cpu_enable_ticks();
1804 runstate_set(RUN_STATE_RUNNING);
1805 vm_state_notify(1, RUN_STATE_RUNNING);
1806 }
1807
1808 /* We are sending this now, but the CPUs will be resumed shortly later */
1809 qapi_event_send_resume(&error_abort);
1810 return res;
1811}
1812
/* Start the VM; vCPUs are resumed only when vm_prepare_start() returns 0. */
void vm_start(void)
{
    if (vm_prepare_start() == 0) {
        resume_all_vcpus();
    }
}
1819
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001820/* does a state transition even if the VM is already stopped,
1821 current state is forgotten forever */
Kevin Wolf56983462013-07-05 13:49:54 +02001822int vm_stop_force_state(RunState state)
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001823{
1824 if (runstate_is_running()) {
Kevin Wolf56983462013-07-05 13:49:54 +02001825 return vm_stop(state);
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001826 } else {
1827 runstate_set(state);
Wen Congyangb2780d32015-11-20 17:34:38 +08001828
1829 bdrv_drain_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +02001830 /* Make sure to return an error if the flush in a previous vm_stop()
1831 * failed. */
John Snow22af08e2016-09-22 21:45:51 -04001832 return bdrv_flush_all();
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001833 }
1834}
1835
Stefan Weil9a78eea2010-10-22 23:03:33 +02001836void list_cpus(FILE *f, fprintf_function cpu_fprintf, const char *optarg)
Blue Swirl262353c2010-05-04 19:55:35 +00001837{
1838 /* XXX: implement xxx_cpu_list for targets that still miss it */
Peter Maydelle916cbf2012-09-05 17:41:08 -03001839#if defined(cpu_list)
1840 cpu_list(f, cpu_fprintf);
Blue Swirl262353c2010-05-04 19:55:35 +00001841#endif
1842}
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001843
1844CpuInfoList *qmp_query_cpus(Error **errp)
1845{
1846 CpuInfoList *head = NULL, *cur_item = NULL;
Andreas Färber182735e2013-05-29 22:29:20 +02001847 CPUState *cpu;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001848
Andreas Färberbdc44642013-06-24 23:50:24 +02001849 CPU_FOREACH(cpu) {
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001850 CpuInfoList *info;
Andreas Färber182735e2013-05-29 22:29:20 +02001851#if defined(TARGET_I386)
1852 X86CPU *x86_cpu = X86_CPU(cpu);
1853 CPUX86State *env = &x86_cpu->env;
1854#elif defined(TARGET_PPC)
1855 PowerPCCPU *ppc_cpu = POWERPC_CPU(cpu);
1856 CPUPPCState *env = &ppc_cpu->env;
1857#elif defined(TARGET_SPARC)
1858 SPARCCPU *sparc_cpu = SPARC_CPU(cpu);
1859 CPUSPARCState *env = &sparc_cpu->env;
1860#elif defined(TARGET_MIPS)
1861 MIPSCPU *mips_cpu = MIPS_CPU(cpu);
1862 CPUMIPSState *env = &mips_cpu->env;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001863#elif defined(TARGET_TRICORE)
1864 TriCoreCPU *tricore_cpu = TRICORE_CPU(cpu);
1865 CPUTriCoreState *env = &tricore_cpu->env;
Andreas Färber182735e2013-05-29 22:29:20 +02001866#endif
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001867
Andreas Färbercb446ec2013-05-01 14:24:52 +02001868 cpu_synchronize_state(cpu);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001869
1870 info = g_malloc0(sizeof(*info));
1871 info->value = g_malloc0(sizeof(*info->value));
Andreas Färber55e5c282012-12-17 06:18:02 +01001872 info->value->CPU = cpu->cpu_index;
Andreas Färber182735e2013-05-29 22:29:20 +02001873 info->value->current = (cpu == first_cpu);
Andreas Färber259186a2013-01-17 18:51:17 +01001874 info->value->halted = cpu->halted;
Eduardo Habkost58f88d42015-05-08 16:04:22 -03001875 info->value->qom_path = object_get_canonical_path(OBJECT(cpu));
Andreas Färber9f09e182012-05-03 06:59:07 +02001876 info->value->thread_id = cpu->thread_id;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001877#if defined(TARGET_I386)
Eric Blake86f4b682015-11-18 01:52:59 -07001878 info->value->arch = CPU_INFO_ARCH_X86;
Eric Blake544a3732016-02-17 23:48:27 -07001879 info->value->u.x86.pc = env->eip + env->segs[R_CS].base;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001880#elif defined(TARGET_PPC)
Eric Blake86f4b682015-11-18 01:52:59 -07001881 info->value->arch = CPU_INFO_ARCH_PPC;
Eric Blake544a3732016-02-17 23:48:27 -07001882 info->value->u.ppc.nip = env->nip;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001883#elif defined(TARGET_SPARC)
Eric Blake86f4b682015-11-18 01:52:59 -07001884 info->value->arch = CPU_INFO_ARCH_SPARC;
Eric Blake544a3732016-02-17 23:48:27 -07001885 info->value->u.q_sparc.pc = env->pc;
1886 info->value->u.q_sparc.npc = env->npc;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001887#elif defined(TARGET_MIPS)
Eric Blake86f4b682015-11-18 01:52:59 -07001888 info->value->arch = CPU_INFO_ARCH_MIPS;
Eric Blake544a3732016-02-17 23:48:27 -07001889 info->value->u.q_mips.PC = env->active_tc.PC;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001890#elif defined(TARGET_TRICORE)
Eric Blake86f4b682015-11-18 01:52:59 -07001891 info->value->arch = CPU_INFO_ARCH_TRICORE;
Eric Blake544a3732016-02-17 23:48:27 -07001892 info->value->u.tricore.PC = env->PC;
Eric Blake86f4b682015-11-18 01:52:59 -07001893#else
1894 info->value->arch = CPU_INFO_ARCH_OTHER;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001895#endif
1896
1897 /* XXX: waiting for the qapi to support GSList */
1898 if (!cur_item) {
1899 head = cur_item = info;
1900 } else {
1901 cur_item->next = info;
1902 cur_item = info;
1903 }
1904 }
1905
1906 return head;
1907}
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001908
1909void qmp_memsave(int64_t addr, int64_t size, const char *filename,
1910 bool has_cpu, int64_t cpu_index, Error **errp)
1911{
1912 FILE *f;
1913 uint32_t l;
Andreas Färber55e5c282012-12-17 06:18:02 +01001914 CPUState *cpu;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001915 uint8_t buf[1024];
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001916 int64_t orig_addr = addr, orig_size = size;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001917
1918 if (!has_cpu) {
1919 cpu_index = 0;
1920 }
1921
Andreas Färber151d1322013-02-15 15:41:49 +01001922 cpu = qemu_get_cpu(cpu_index);
1923 if (cpu == NULL) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001924 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "cpu-index",
1925 "a CPU number");
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001926 return;
1927 }
1928
1929 f = fopen(filename, "wb");
1930 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001931 error_setg_file_open(errp, errno, filename);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001932 return;
1933 }
1934
1935 while (size != 0) {
1936 l = sizeof(buf);
1937 if (l > size)
1938 l = size;
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301939 if (cpu_memory_rw_debug(cpu, addr, buf, l, 0) != 0) {
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001940 error_setg(errp, "Invalid addr 0x%016" PRIx64 "/size %" PRId64
1941 " specified", orig_addr, orig_size);
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301942 goto exit;
1943 }
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001944 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001945 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001946 goto exit;
1947 }
1948 addr += l;
1949 size -= l;
1950 }
1951
1952exit:
1953 fclose(f);
1954}
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001955
1956void qmp_pmemsave(int64_t addr, int64_t size, const char *filename,
1957 Error **errp)
1958{
1959 FILE *f;
1960 uint32_t l;
1961 uint8_t buf[1024];
1962
1963 f = fopen(filename, "wb");
1964 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001965 error_setg_file_open(errp, errno, filename);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001966 return;
1967 }
1968
1969 while (size != 0) {
1970 l = sizeof(buf);
1971 if (l > size)
1972 l = size;
Stefan Weileb6282f2014-04-07 20:28:23 +02001973 cpu_physical_memory_read(addr, buf, l);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001974 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001975 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001976 goto exit;
1977 }
1978 addr += l;
1979 size -= l;
1980 }
1981
1982exit:
1983 fclose(f);
1984}
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001985
1986void qmp_inject_nmi(Error **errp)
1987{
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +10001988 nmi_monitor_handle(monitor_get_cpu_index(), errp);
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001989}
Sebastian Tanase27498be2014-07-25 11:56:33 +02001990
1991void dump_drift_info(FILE *f, fprintf_function cpu_fprintf)
1992{
1993 if (!use_icount) {
1994 return;
1995 }
1996
1997 cpu_fprintf(f, "Host - Guest clock %"PRIi64" ms\n",
1998 (cpu_get_clock() - cpu_get_icount())/SCALE_MS);
1999 if (icount_align_option) {
2000 cpu_fprintf(f, "Max guest delay %"PRIi64" ms\n", -max_delay/SCALE_MS);
2001 cpu_fprintf(f, "Max guest advance %"PRIi64" ms\n", max_advance/SCALE_MS);
2002 } else {
2003 cpu_fprintf(f, "Max guest delay NA\n");
2004 cpu_fprintf(f, "Max guest advance NA\n");
2005 }
2006}