blob: fc0ddc87934ca2f76e5daeb0e9a9569db9f593ff [file] [log] [blame]
Blue Swirl296af7c2010-03-29 19:23:50 +00001/*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24
25/* Needed early for CONFIG_BSD etc. */
Peter Maydell7b31bbc2016-01-26 18:16:56 +000026#include "qemu/osdep.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010027#include "qemu-common.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000028#include "qemu/config-file.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010029#include "cpu.h"
Paolo Bonzini83c90892012-12-17 18:19:49 +010030#include "monitor/monitor.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020031#include "qapi/qmp/qerror.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010032#include "qemu/error-report.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010033#include "sysemu/sysemu.h"
Max Reitzda31d592016-03-16 19:54:32 +010034#include "sysemu/block-backend.h"
Paolo Bonzini022c62c2012-12-17 18:19:49 +010035#include "exec/gdbstub.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010036#include "sysemu/dma.h"
Vincent Palatinb3946622017-01-10 11:59:55 +010037#include "sysemu/hw_accel.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010038#include "sysemu/kvm.h"
Vincent Palatinb0cb0a62017-01-10 11:59:57 +010039#include "sysemu/hax.h"
Luiz Capitulinode0b36b2011-09-21 16:38:35 -030040#include "qmp-commands.h"
Paolo Bonzini63c91552016-03-15 13:18:37 +010041#include "exec/exec-all.h"
Blue Swirl296af7c2010-03-29 19:23:50 +000042
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010043#include "qemu/thread.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010044#include "sysemu/cpus.h"
45#include "sysemu/qtest.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010046#include "qemu/main-loop.h"
47#include "qemu/bitmap.h"
Liu Ping Fancb365642013-09-25 14:20:58 +080048#include "qemu/seqlock.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000049#include "tcg.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020050#include "qapi-event.h"
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +100051#include "hw/nmi.h"
Pavel Dovgalyuk8b427042015-09-17 19:24:05 +030052#include "sysemu/replay.h"
Jan Kiszka0ff0fc12011-06-23 10:15:55 +020053
Jan Kiszka6d9cb732011-02-01 22:15:58 +010054#ifdef CONFIG_LINUX
55
56#include <sys/prctl.h>
57
Marcelo Tosattic0532a72010-10-11 15:31:21 -030058#ifndef PR_MCE_KILL
59#define PR_MCE_KILL 33
60#endif
61
Jan Kiszka6d9cb732011-02-01 22:15:58 +010062#ifndef PR_MCE_KILL_SET
63#define PR_MCE_KILL_SET 1
64#endif
65
66#ifndef PR_MCE_KILL_EARLY
67#define PR_MCE_KILL_EARLY 1
68#endif
69
70#endif /* CONFIG_LINUX */
71
/* NOTE(review): max_delay and max_advance are not referenced in the part
 * of the file visible here; presumably they are icount alignment
 * statistics maintained elsewhere - confirm against their users.
 */
int64_t max_delay;
int64_t max_advance;

/* vcpu throttling controls */
/* Periodic timer driving cpu_throttle_timer_tick(); created in
 * cpu_ticks_init().
 */
static QEMUTimer *throttle_timer;
/* Current throttle percentage; 0 means throttling is off.  Accessed with
 * atomic_set()/atomic_read().
 */
static unsigned int throttle_percentage;

/* cpu_throttle_set() clamps the requested percentage to [MIN, MAX]. */
#define CPU_THROTTLE_PCT_MIN 1
#define CPU_THROTTLE_PCT_MAX 99
/* Base timeslice, in nanoseconds, used to derive sleep and timer periods. */
#define CPU_THROTTLE_TIMESLICE_NS 10000000
82
Tiejun Chen321bc0b2013-08-02 09:43:09 +080083bool cpu_is_stopped(CPUState *cpu)
84{
85 return cpu->stopped || !runstate_is_running();
86}
87
Andreas Färbera98ae1d2013-05-26 23:21:08 +020088static bool cpu_thread_is_idle(CPUState *cpu)
Peter Maydellac873f12012-07-19 16:52:27 +010089{
Andreas Färberc64ca812012-05-03 02:11:45 +020090 if (cpu->stop || cpu->queued_work_first) {
Peter Maydellac873f12012-07-19 16:52:27 +010091 return false;
92 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +080093 if (cpu_is_stopped(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +010094 return true;
95 }
Andreas Färber8c2e1b02013-08-25 18:53:55 +020096 if (!cpu->halted || cpu_has_work(cpu) ||
Alexander Graf215e79c2013-04-24 22:24:12 +020097 kvm_halt_in_kernel()) {
Peter Maydellac873f12012-07-19 16:52:27 +010098 return false;
99 }
100 return true;
101}
102
103static bool all_cpu_threads_idle(void)
104{
Andreas Färber182735e2013-05-29 22:29:20 +0200105 CPUState *cpu;
Peter Maydellac873f12012-07-19 16:52:27 +0100106
Andreas Färberbdc44642013-06-24 23:50:24 +0200107 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200108 if (!cpu_thread_is_idle(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +0100109 return false;
110 }
111 }
112 return true;
113}
114
Blue Swirl296af7c2010-03-29 19:23:50 +0000115/***********************************************************/
Paolo Bonzini946fb272011-09-12 13:57:37 +0200116/* guest cycle counter */
117
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200118/* Protected by TimersState seqlock */
119
/* When false, qemu_start_warp_timer() never lets vCPUs sleep and instead
 * advances the icount bias straight to the next timer deadline.
 */
static bool icount_sleep = true;
/* QEMU_CLOCK_VIRTUAL_RT time at which the pending warp started, or -1 when
 * no warp is pending.
 */
static int64_t vm_clock_warp_start = -1;
/* Conversion factor from emulated instructions to virtual clock ticks. */
static int icount_time_shift;
/* Arbitrarily pick 1MIPS as the minimum allowable speed. */
#define MAX_ICOUNT_SHIFT 10

/* Timers that re-arm themselves and call icount_adjust(): one driven by
 * QEMU_CLOCK_VIRTUAL_RT, one by QEMU_CLOCK_VIRTUAL.
 */
static QEMUTimer *icount_rt_timer;
static QEMUTimer *icount_vm_timer;
/* Timer armed by qemu_start_warp_timer() to account a warp later on. */
static QEMUTimer *icount_warp_timer;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200130
/* Bookkeeping for the guest-visible tick counter, the VM clock and the
 * instruction counter.
 */
typedef struct TimersState {
    /* Protected by BQL. */
    /* Last value returned by cpu_get_ticks(); used to keep it monotonic. */
    int64_t cpu_ticks_prev;
    /* Offset added to the host tick counter by cpu_get_ticks(). */
    int64_t cpu_ticks_offset;

    /* cpu_clock_offset can be read out of BQL, so protect it with
     * this lock.
     */
    QemuSeqLock vm_clock_seqlock;
    /* Offset added to get_clock() by cpu_get_clock_locked(). */
    int64_t cpu_clock_offset;
    /* Non-zero while ticks are enabled (see cpu_enable_ticks()). */
    int32_t cpu_ticks_enabled;
    /* Only referenced by the "timer" vmstate description in this file. */
    int64_t dummy;

    /* Compensate for varying guest execution speed. */
    int64_t qemu_icount_bias;
    /* Only written by TCG thread */
    int64_t qemu_icount;
} TimersState;
149
/* The single instance of the timer bookkeeping state for this file. */
static TimersState timers_state;
/* True when multi-threaded TCG is selected; set by qemu_tcg_configure(). */
bool mttcg_enabled;
152
153/*
154 * We default to false if we know other options have been enabled
155 * which are currently incompatible with MTTCG. Otherwise when each
156 * guest (target) has been updated to support:
157 * - atomic instructions
158 * - memory ordering primitives (barriers)
159 * they can set the appropriate CONFIG flags in ${target}-softmmu.mak
160 *
161 * Once a guest architecture has been converted to the new primitives
162 * there are two remaining limitations to check.
163 *
164 * - The guest can't be oversized (e.g. 64 bit guest on 32 bit host)
165 * - The host must have a stronger memory order than the guest
166 *
167 * It may be possible in future to support strong guests on weak hosts
168 * but that will require tagging all load/stores in a guest with their
169 * implicit memory order requirements which would likely slow things
170 * down a lot.
171 */
172
/* Check that the host's default memory ordering covers everything the
 * guest's default memory ordering requires.
 *
 * Returns false when either TCG_GUEST_DEFAULT_MO or TCG_TARGET_DEFAULT_MO
 * is not defined, since compatibility cannot be established then.
 */
static bool check_tcg_memory_orders_compatible(void)
{
    bool compatible = false;

#if defined(TCG_GUEST_DEFAULT_MO) && defined(TCG_TARGET_DEFAULT_MO)
    /* Compatible iff the guest needs no ordering bit the host lacks. */
    compatible = (TCG_GUEST_DEFAULT_MO & ~TCG_TARGET_DEFAULT_MO) == 0;
#endif
    return compatible;
}
181
/* Pick the MTTCG default used when no "thread" option is given.
 *
 * MTTCG is enabled by default only when the target declares support
 * (TARGET_SUPPORTS_MTTCG), icount is off, the guest is not oversized for
 * the host, and the memory orderings are compatible.
 */
static bool default_mttcg_enabled(void)
{
#ifdef TARGET_SUPPORTS_MTTCG
    if (!use_icount && !TCG_OVERSIZED_GUEST) {
        return check_tcg_memory_orders_compatible();
    }
#endif
    return false;
}
194
195void qemu_tcg_configure(QemuOpts *opts, Error **errp)
196{
197 const char *t = qemu_opt_get(opts, "thread");
198 if (t) {
199 if (strcmp(t, "multi") == 0) {
200 if (TCG_OVERSIZED_GUEST) {
201 error_setg(errp, "No MTTCG when guest word size > hosts");
Alex Bennée83fd9622017-02-27 17:09:01 +0000202 } else if (use_icount) {
203 error_setg(errp, "No MTTCG when icount is enabled");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000204 } else {
Nikunj A Dadhania86953502017-04-10 11:36:55 +0530205#ifndef TARGET_SUPPORTS_MTTCG
Alex Bennéec34c7622017-02-28 14:40:17 +0000206 error_report("Guest not yet converted to MTTCG - "
207 "you may get unexpected results");
208#endif
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000209 if (!check_tcg_memory_orders_compatible()) {
210 error_report("Guest expects a stronger memory ordering "
211 "than the host provides");
Pranith Kumar8cfef892017-03-25 16:19:23 -0400212 error_printf("This may cause strange/hard to debug errors\n");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000213 }
214 mttcg_enabled = true;
215 }
216 } else if (strcmp(t, "single") == 0) {
217 mttcg_enabled = false;
218 } else {
219 error_setg(errp, "Invalid 'thread' setting %s", t);
220 }
221 } else {
222 mttcg_enabled = default_mttcg_enabled();
223 }
224}
Paolo Bonzini946fb272011-09-12 13:57:37 +0200225
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300226int64_t cpu_get_icount_raw(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200227{
228 int64_t icount;
Andreas Färber4917cf42013-05-27 05:17:50 +0200229 CPUState *cpu = current_cpu;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200230
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200231 icount = timers_state.qemu_icount;
Andreas Färber4917cf42013-05-27 05:17:50 +0200232 if (cpu) {
Paolo Bonzini414b15c2015-06-24 14:16:26 +0200233 if (!cpu->can_do_io) {
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300234 fprintf(stderr, "Bad icount read\n");
235 exit(1);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200236 }
Andreas Färber28ecfd72013-08-26 05:51:49 +0200237 icount -= (cpu->icount_decr.u16.low + cpu->icount_extra);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200238 }
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300239 return icount;
240}
241
242/* Return the virtual CPU time, based on the instruction counter. */
243static int64_t cpu_get_icount_locked(void)
244{
245 int64_t icount = cpu_get_icount_raw();
KONRAD Frederic3f031312014-08-01 01:37:15 +0200246 return timers_state.qemu_icount_bias + cpu_icount_to_ns(icount);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200247}
248
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200249int64_t cpu_get_icount(void)
250{
251 int64_t icount;
252 unsigned start;
253
254 do {
255 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
256 icount = cpu_get_icount_locked();
257 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
258
259 return icount;
260}
261
KONRAD Frederic3f031312014-08-01 01:37:15 +0200262int64_t cpu_icount_to_ns(int64_t icount)
263{
264 return icount << icount_time_shift;
265}
266
Cao jind90f3cc2016-07-29 19:05:38 +0800267/* return the time elapsed in VM between vm_start and vm_stop. Unless
268 * icount is active, cpu_get_ticks() uses units of the host CPU cycle
269 * counter.
270 *
271 * Caller must hold the BQL
272 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200273int64_t cpu_get_ticks(void)
274{
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100275 int64_t ticks;
276
Paolo Bonzini946fb272011-09-12 13:57:37 +0200277 if (use_icount) {
278 return cpu_get_icount();
279 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100280
281 ticks = timers_state.cpu_ticks_offset;
282 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400283 ticks += cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200284 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100285
286 if (timers_state.cpu_ticks_prev > ticks) {
287 /* Note: non increasing ticks may happen if the host uses
288 software suspend */
289 timers_state.cpu_ticks_offset += timers_state.cpu_ticks_prev - ticks;
290 ticks = timers_state.cpu_ticks_prev;
291 }
292
293 timers_state.cpu_ticks_prev = ticks;
294 return ticks;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200295}
296
Liu Ping Fancb365642013-09-25 14:20:58 +0800297static int64_t cpu_get_clock_locked(void)
298{
Cao jin1d45cea2016-07-29 19:05:37 +0800299 int64_t time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800300
Cao jin1d45cea2016-07-29 19:05:37 +0800301 time = timers_state.cpu_clock_offset;
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100302 if (timers_state.cpu_ticks_enabled) {
Cao jin1d45cea2016-07-29 19:05:37 +0800303 time += get_clock();
Liu Ping Fancb365642013-09-25 14:20:58 +0800304 }
305
Cao jin1d45cea2016-07-29 19:05:37 +0800306 return time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800307}
308
Cao jind90f3cc2016-07-29 19:05:38 +0800309/* Return the monotonic time elapsed in VM, i.e.,
Peter Maydell8212ff82016-09-15 10:24:22 +0100310 * the time between vm_start and vm_stop
311 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200312int64_t cpu_get_clock(void)
313{
314 int64_t ti;
Liu Ping Fancb365642013-09-25 14:20:58 +0800315 unsigned start;
316
317 do {
318 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
319 ti = cpu_get_clock_locked();
320 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
321
322 return ti;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200323}
324
Liu Ping Fancb365642013-09-25 14:20:58 +0800325/* enable cpu_get_ticks()
Cao jin3224e872016-07-08 18:31:37 +0800326 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800327 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200328void cpu_enable_ticks(void)
329{
Liu Ping Fancb365642013-09-25 14:20:58 +0800330 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400331 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200332 if (!timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400333 timers_state.cpu_ticks_offset -= cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200334 timers_state.cpu_clock_offset -= get_clock();
335 timers_state.cpu_ticks_enabled = 1;
336 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400337 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200338}
339
340/* disable cpu_get_ticks() : the clock is stopped. You must not call
Liu Ping Fancb365642013-09-25 14:20:58 +0800341 * cpu_get_ticks() after that.
Cao jin3224e872016-07-08 18:31:37 +0800342 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800343 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200344void cpu_disable_ticks(void)
345{
Liu Ping Fancb365642013-09-25 14:20:58 +0800346 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400347 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200348 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400349 timers_state.cpu_ticks_offset += cpu_get_host_ticks();
Liu Ping Fancb365642013-09-25 14:20:58 +0800350 timers_state.cpu_clock_offset = cpu_get_clock_locked();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200351 timers_state.cpu_ticks_enabled = 0;
352 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400353 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200354}
355
356/* Correlation between real and virtual time is always going to be
357 fairly approximate, so ignore small variation.
358 When the guest is idle real and virtual time will be aligned in
359 the IO wait loop. */
Rutuja Shah73bcb242016-03-21 21:32:30 +0530360#define ICOUNT_WOBBLE (NANOSECONDS_PER_SECOND / 10)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200361
362static void icount_adjust(void)
363{
364 int64_t cur_time;
365 int64_t cur_icount;
366 int64_t delta;
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200367
368 /* Protected by TimersState mutex. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200369 static int64_t last_delta;
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200370
Paolo Bonzini946fb272011-09-12 13:57:37 +0200371 /* If the VM is not running, then do nothing. */
372 if (!runstate_is_running()) {
373 return;
374 }
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200375
Emilio G. Cota03719e42016-06-08 14:55:21 -0400376 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200377 cur_time = cpu_get_clock_locked();
378 cur_icount = cpu_get_icount_locked();
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200379
Paolo Bonzini946fb272011-09-12 13:57:37 +0200380 delta = cur_icount - cur_time;
381 /* FIXME: This is a very crude algorithm, somewhat prone to oscillation. */
382 if (delta > 0
383 && last_delta + ICOUNT_WOBBLE < delta * 2
384 && icount_time_shift > 0) {
385 /* The guest is getting too far ahead. Slow time down. */
386 icount_time_shift--;
387 }
388 if (delta < 0
389 && last_delta - ICOUNT_WOBBLE > delta * 2
390 && icount_time_shift < MAX_ICOUNT_SHIFT) {
391 /* The guest is getting too far behind. Speed time up. */
392 icount_time_shift++;
393 }
394 last_delta = delta;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200395 timers_state.qemu_icount_bias = cur_icount
396 - (timers_state.qemu_icount << icount_time_shift);
Emilio G. Cota03719e42016-06-08 14:55:21 -0400397 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200398}
399
400static void icount_adjust_rt(void *opaque)
401{
Alex Bligh40daca52013-08-21 16:03:02 +0100402 timer_mod(icount_rt_timer,
Pavel Dovgalyuk1979b902015-01-12 15:00:43 +0300403 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200404 icount_adjust();
405}
406
407static void icount_adjust_vm(void *opaque)
408{
Alex Bligh40daca52013-08-21 16:03:02 +0100409 timer_mod(icount_vm_timer,
410 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530411 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200412 icount_adjust();
413}
414
415static int64_t qemu_icount_round(int64_t count)
416{
417 return (count + (1 << icount_time_shift) - 1) >> icount_time_shift;
418}
419
Pavel Dovgalyukefab87c2015-09-17 19:24:39 +0300420static void icount_warp_rt(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200421{
Alex Bennéeccffff42016-04-04 15:35:48 +0100422 unsigned seq;
423 int64_t warp_start;
424
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200425 /* The icount_warp_timer is rescheduled soon after vm_clock_warp_start
426 * changes from -1 to another value, so the race here is okay.
427 */
Alex Bennéeccffff42016-04-04 15:35:48 +0100428 do {
429 seq = seqlock_read_begin(&timers_state.vm_clock_seqlock);
430 warp_start = vm_clock_warp_start;
431 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, seq));
432
433 if (warp_start == -1) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200434 return;
435 }
436
Emilio G. Cota03719e42016-06-08 14:55:21 -0400437 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200438 if (runstate_is_running()) {
Pavel Dovgalyuk8eda2062015-09-17 19:24:28 +0300439 int64_t clock = REPLAY_CLOCK(REPLAY_CLOCK_VIRTUAL_RT,
440 cpu_get_clock_locked());
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200441 int64_t warp_delta;
442
443 warp_delta = clock - vm_clock_warp_start;
444 if (use_icount == 2) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200445 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100446 * In adaptive mode, do not let QEMU_CLOCK_VIRTUAL run too
Paolo Bonzini946fb272011-09-12 13:57:37 +0200447 * far ahead of real time.
448 */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200449 int64_t cur_icount = cpu_get_icount_locked();
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300450 int64_t delta = clock - cur_icount;
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200451 warp_delta = MIN(warp_delta, delta);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200452 }
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200453 timers_state.qemu_icount_bias += warp_delta;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200454 }
455 vm_clock_warp_start = -1;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400456 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200457
458 if (qemu_clock_expired(QEMU_CLOCK_VIRTUAL)) {
459 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
460 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200461}
462
/* Callback of icount_warp_timer: account the pending warp.
 *
 * No replay checkpoint is taken here because the timer already
 * synchronizes with CHECKPOINT_CLOCK_VIRTUAL_RT.
 */
static void icount_timer_cb(void *opaque)
{
    (void)opaque;
    icount_warp_rt();
}
470
Paolo Bonzini8156be52012-03-28 15:42:04 +0200471void qtest_clock_warp(int64_t dest)
472{
Alex Bligh40daca52013-08-21 16:03:02 +0100473 int64_t clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800474 AioContext *aio_context;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200475 assert(qtest_enabled());
Fam Zhengefef88b2015-01-19 17:51:43 +0800476 aio_context = qemu_get_aio_context();
Paolo Bonzini8156be52012-03-28 15:42:04 +0200477 while (clock < dest) {
Alex Bligh40daca52013-08-21 16:03:02 +0100478 int64_t deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Sergey Fedorovc9299e22014-06-10 13:10:28 +0400479 int64_t warp = qemu_soonest_timeout(dest - clock, deadline);
Fam Zhengefef88b2015-01-19 17:51:43 +0800480
Emilio G. Cota03719e42016-06-08 14:55:21 -0400481 seqlock_write_begin(&timers_state.vm_clock_seqlock);
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200482 timers_state.qemu_icount_bias += warp;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400483 seqlock_write_end(&timers_state.vm_clock_seqlock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200484
Alex Bligh40daca52013-08-21 16:03:02 +0100485 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800486 timerlist_run_timers(aio_context->tlg.tl[QEMU_CLOCK_VIRTUAL]);
Alex Bligh40daca52013-08-21 16:03:02 +0100487 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200488 }
Alex Bligh40daca52013-08-21 16:03:02 +0100489 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200490}
491
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300492void qemu_start_warp_timer(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200493{
Paolo Bonzinice78d182013-10-07 17:30:02 +0200494 int64_t clock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200495 int64_t deadline;
496
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300497 if (!use_icount) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200498 return;
499 }
500
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300501 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
502 * do not fire, so computing the deadline does not make sense.
503 */
504 if (!runstate_is_running()) {
505 return;
506 }
507
508 /* warp clock deterministically in record/replay mode */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300509 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_START)) {
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300510 return;
511 }
512
Paolo Bonzinice78d182013-10-07 17:30:02 +0200513 if (!all_cpu_threads_idle()) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200514 return;
515 }
516
Paolo Bonzini8156be52012-03-28 15:42:04 +0200517 if (qtest_enabled()) {
518 /* When testing, qtest commands advance icount. */
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300519 return;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200520 }
521
Alex Blighac70aaf2013-08-21 16:02:57 +0100522 /* We want to use the earliest deadline from ALL vm_clocks */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300523 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT);
Alex Bligh40daca52013-08-21 16:03:02 +0100524 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200525 if (deadline < 0) {
Victor CLEMENTd7a0f712015-05-29 17:14:06 +0200526 static bool notified;
527 if (!icount_sleep && !notified) {
528 error_report("WARNING: icount sleep disabled and no active timers");
529 notified = true;
530 }
Paolo Bonzinice78d182013-10-07 17:30:02 +0200531 return;
Alex Blighac70aaf2013-08-21 16:02:57 +0100532 }
533
Paolo Bonzini946fb272011-09-12 13:57:37 +0200534 if (deadline > 0) {
535 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100536 * Ensure QEMU_CLOCK_VIRTUAL proceeds even when the virtual CPU goes to
Paolo Bonzini946fb272011-09-12 13:57:37 +0200537 * sleep. Otherwise, the CPU might be waiting for a future timer
538 * interrupt to wake it up, but the interrupt never comes because
539 * the vCPU isn't running any insns and thus doesn't advance the
Alex Bligh40daca52013-08-21 16:03:02 +0100540 * QEMU_CLOCK_VIRTUAL.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200541 */
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200542 if (!icount_sleep) {
543 /*
544 * We never let VCPUs sleep in no sleep icount mode.
545 * If there is a pending QEMU_CLOCK_VIRTUAL timer we just advance
546 * to the next QEMU_CLOCK_VIRTUAL event and notify it.
547 * It is useful when we want a deterministic execution time,
548 * isolated from host latencies.
549 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400550 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200551 timers_state.qemu_icount_bias += deadline;
Emilio G. Cota03719e42016-06-08 14:55:21 -0400552 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200553 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
554 } else {
555 /*
556 * We do stop VCPUs and only advance QEMU_CLOCK_VIRTUAL after some
557 * "real" time, (related to the time left until the next event) has
558 * passed. The QEMU_CLOCK_VIRTUAL_RT clock will do this.
559 * This avoids that the warps are visible externally; for example,
560 * you will not be sending network packets continuously instead of
561 * every 100ms.
562 */
Emilio G. Cota03719e42016-06-08 14:55:21 -0400563 seqlock_write_begin(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200564 if (vm_clock_warp_start == -1 || vm_clock_warp_start > clock) {
565 vm_clock_warp_start = clock;
566 }
Emilio G. Cota03719e42016-06-08 14:55:21 -0400567 seqlock_write_end(&timers_state.vm_clock_seqlock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200568 timer_mod_anticipate(icount_warp_timer, clock + deadline);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200569 }
Alex Blighac70aaf2013-08-21 16:02:57 +0100570 } else if (deadline == 0) {
Alex Bligh40daca52013-08-21 16:03:02 +0100571 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200572 }
573}
574
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300575static void qemu_account_warp_timer(void)
576{
577 if (!use_icount || !icount_sleep) {
578 return;
579 }
580
581 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
582 * do not fire, so computing the deadline does not make sense.
583 */
584 if (!runstate_is_running()) {
585 return;
586 }
587
588 /* warp clock deterministically in record/replay mode */
589 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_ACCOUNT)) {
590 return;
591 }
592
593 timer_del(icount_warp_timer);
594 icount_warp_rt();
595}
596
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200597static bool icount_state_needed(void *opaque)
598{
599 return use_icount;
600}
601
/*
 * This is a subsection for icount migration.
 *
 * It carries the icount bias and the instruction counter of TimersState
 * and is only included when icount_state_needed() returns true.
 */
static const VMStateDescription icount_vmstate_timers = {
    .name = "timer/icount",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = icount_state_needed,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(qemu_icount_bias, TimersState),
        VMSTATE_INT64(qemu_icount, TimersState),
        VMSTATE_END_OF_LIST()
    }
};
616
/* Migration description of TimersState, registered in cpu_ticks_init().
 * cpu_clock_offset is a version 2 field; the icount state travels in the
 * "timer/icount" subsection.
 */
static const VMStateDescription vmstate_timers = {
    .name = "timer",
    .version_id = 2,
    .minimum_version_id = 1,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(cpu_ticks_offset, TimersState),
        VMSTATE_INT64(dummy, TimersState),
        VMSTATE_INT64_V(cpu_clock_offset, TimersState, 2),
        VMSTATE_END_OF_LIST()
    },
    .subsections = (const VMStateDescription*[]) {
        &icount_vmstate_timers,
        NULL
    }
};
632
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100633static void cpu_throttle_thread(CPUState *cpu, run_on_cpu_data opaque)
Jason J. Herne2adcc852015-09-08 13:12:33 -0400634{
Jason J. Herne2adcc852015-09-08 13:12:33 -0400635 double pct;
636 double throttle_ratio;
637 long sleeptime_ns;
638
639 if (!cpu_throttle_get_percentage()) {
640 return;
641 }
642
643 pct = (double)cpu_throttle_get_percentage()/100;
644 throttle_ratio = pct / (1 - pct);
645 sleeptime_ns = (long)(throttle_ratio * CPU_THROTTLE_TIMESLICE_NS);
646
647 qemu_mutex_unlock_iothread();
648 atomic_set(&cpu->throttle_thread_scheduled, 0);
649 g_usleep(sleeptime_ns / 1000); /* Convert ns to us for usleep call */
650 qemu_mutex_lock_iothread();
651}
652
653static void cpu_throttle_timer_tick(void *opaque)
654{
655 CPUState *cpu;
656 double pct;
657
658 /* Stop the timer if needed */
659 if (!cpu_throttle_get_percentage()) {
660 return;
661 }
662 CPU_FOREACH(cpu) {
663 if (!atomic_xchg(&cpu->throttle_thread_scheduled, 1)) {
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100664 async_run_on_cpu(cpu, cpu_throttle_thread,
665 RUN_ON_CPU_NULL);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400666 }
667 }
668
669 pct = (double)cpu_throttle_get_percentage()/100;
670 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
671 CPU_THROTTLE_TIMESLICE_NS / (1-pct));
672}
673
674void cpu_throttle_set(int new_throttle_pct)
675{
676 /* Ensure throttle percentage is within valid range */
677 new_throttle_pct = MIN(new_throttle_pct, CPU_THROTTLE_PCT_MAX);
678 new_throttle_pct = MAX(new_throttle_pct, CPU_THROTTLE_PCT_MIN);
679
680 atomic_set(&throttle_percentage, new_throttle_pct);
681
682 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
683 CPU_THROTTLE_TIMESLICE_NS);
684}
685
/* Turn throttling off by setting the percentage to 0.  The timer is not
 * touched here; cpu_throttle_timer_tick() stops re-arming it once it
 * sees a zero percentage.
 */
void cpu_throttle_stop(void)
{
    atomic_set(&throttle_percentage, 0);
}
690
/* Return true while a non-zero throttle percentage is set. */
bool cpu_throttle_active(void)
{
    if (cpu_throttle_get_percentage() == 0) {
        return false;
    }
    return true;
}
695
696int cpu_throttle_get_percentage(void)
697{
698 return atomic_read(&throttle_percentage);
699}
700
/* One-time setup of the timer state: initialise the VM clock seqlock,
 * register timers_state for migration, and create the (not yet armed)
 * vCPU throttle timer on QEMU_CLOCK_VIRTUAL_RT.
 */
void cpu_ticks_init(void)
{
    seqlock_init(&timers_state.vm_clock_seqlock);
    vmstate_register(NULL, 0, &vmstate_timers, &timers_state);
    throttle_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
                                           cpu_throttle_timer_tick, NULL);
}
708
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200709void configure_icount(QemuOpts *opts, Error **errp)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200710{
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200711 const char *option;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200712 char *rem_str = NULL;
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200713
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200714 option = qemu_opt_get(opts, "shift");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200715 if (!option) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200716 if (qemu_opt_get(opts, "align") != NULL) {
717 error_setg(errp, "Please specify shift option when using align");
718 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200719 return;
720 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200721
722 icount_sleep = qemu_opt_get_bool(opts, "sleep", true);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200723 if (icount_sleep) {
724 icount_warp_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300725 icount_timer_cb, NULL);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200726 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200727
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200728 icount_align_option = qemu_opt_get_bool(opts, "align", false);
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200729
730 if (icount_align_option && !icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500731 error_setg(errp, "align=on and sleep=off are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200732 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200733 if (strcmp(option, "auto") != 0) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200734 errno = 0;
735 icount_time_shift = strtol(option, &rem_str, 0);
736 if (errno != 0 || *rem_str != '\0' || !strlen(option)) {
737 error_setg(errp, "icount: Invalid shift value");
738 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200739 use_icount = 1;
740 return;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200741 } else if (icount_align_option) {
742 error_setg(errp, "shift=auto and align=on are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200743 } else if (!icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500744 error_setg(errp, "shift=auto and sleep=off are incompatible");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200745 }
746
747 use_icount = 2;
748
749 /* 125MIPS seems a reasonable initial guess at the guest speed.
750 It will be corrected fairly quickly anyway. */
751 icount_time_shift = 3;
752
753 /* Have both realtime and virtual time triggers for speed adjustment.
754 The realtime trigger catches emulated time passing too slowly,
755 the virtual time trigger catches emulated time passing too fast.
756 Realtime triggers occur even when idle, so use them less frequently
757 than VM triggers. */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300758 icount_rt_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL_RT,
759 icount_adjust_rt, NULL);
Alex Bligh40daca52013-08-21 16:03:02 +0100760 timer_mod(icount_rt_timer,
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300761 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Alex Bligh40daca52013-08-21 16:03:02 +0100762 icount_vm_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
763 icount_adjust_vm, NULL);
764 timer_mod(icount_vm_timer,
765 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530766 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200767}
768
/***********************************************************/
/* TCG vCPU kick timer
 *
 * The kick timer is responsible for moving single threaded vCPU
 * emulation on to the next vCPU. If more than one vCPU is running, a
 * timer event will force a cpu->exit so the next vCPU can get
 * scheduled.
 *
 * The timer is removed if all vCPUs are idle and restarted again once
 * idleness is complete.
 */
780
781static QEMUTimer *tcg_kick_vcpu_timer;
Alex Bennée791158d2017-02-23 18:29:10 +0000782static CPUState *tcg_current_rr_cpu;
Alex Bennée65467062017-02-23 18:29:09 +0000783
784#define TCG_KICK_PERIOD (NANOSECONDS_PER_SECOND / 10)
785
786static inline int64_t qemu_tcg_next_kick(void)
787{
788 return qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + TCG_KICK_PERIOD;
789}
790
Alex Bennée791158d2017-02-23 18:29:10 +0000791/* Kick the currently round-robin scheduled vCPU */
792static void qemu_cpu_kick_rr_cpu(void)
793{
794 CPUState *cpu;
Alex Bennée791158d2017-02-23 18:29:10 +0000795 do {
796 cpu = atomic_mb_read(&tcg_current_rr_cpu);
797 if (cpu) {
798 cpu_exit(cpu);
799 }
800 } while (cpu != atomic_mb_read(&tcg_current_rr_cpu));
801}
802
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100803static void do_nothing(CPUState *cpu, run_on_cpu_data unused)
804{
805}
806
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100807void qemu_timer_notify_cb(void *opaque, QEMUClockType type)
808{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100809 if (!use_icount || type != QEMU_CLOCK_VIRTUAL) {
810 qemu_notify_event();
811 return;
812 }
813
814 if (!qemu_in_vcpu_thread() && first_cpu) {
815 /* qemu_cpu_kick is not enough to kick a halted CPU out of
816 * qemu_tcg_wait_io_event. async_run_on_cpu, instead,
817 * causes cpu_thread_is_idle to return false. This way,
818 * handle_icount_deadline can run.
819 */
820 async_run_on_cpu(first_cpu, do_nothing, RUN_ON_CPU_NULL);
821 }
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100822}
823
Alex Bennée65467062017-02-23 18:29:09 +0000824static void kick_tcg_thread(void *opaque)
825{
826 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
Alex Bennée791158d2017-02-23 18:29:10 +0000827 qemu_cpu_kick_rr_cpu();
Alex Bennée65467062017-02-23 18:29:09 +0000828}
829
830static void start_tcg_kick_timer(void)
831{
Alex Bennée37257942017-02-23 18:29:14 +0000832 if (!mttcg_enabled && !tcg_kick_vcpu_timer && CPU_NEXT(first_cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +0000833 tcg_kick_vcpu_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
834 kick_tcg_thread, NULL);
835 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
836 }
837}
838
839static void stop_tcg_kick_timer(void)
840{
841 if (tcg_kick_vcpu_timer) {
842 timer_del(tcg_kick_vcpu_timer);
843 tcg_kick_vcpu_timer = NULL;
844 }
845}
846
Alex Bennée65467062017-02-23 18:29:09 +0000847/***********************************************************/
Blue Swirl296af7c2010-03-29 19:23:50 +0000848void hw_error(const char *fmt, ...)
849{
850 va_list ap;
Andreas Färber55e5c282012-12-17 06:18:02 +0100851 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000852
853 va_start(ap, fmt);
854 fprintf(stderr, "qemu: hardware error: ");
855 vfprintf(stderr, fmt, ap);
856 fprintf(stderr, "\n");
Andreas Färberbdc44642013-06-24 23:50:24 +0200857 CPU_FOREACH(cpu) {
Andreas Färber55e5c282012-12-17 06:18:02 +0100858 fprintf(stderr, "CPU #%d:\n", cpu->cpu_index);
Andreas Färber878096e2013-05-27 01:33:50 +0200859 cpu_dump_state(cpu, stderr, fprintf, CPU_DUMP_FPU);
Blue Swirl296af7c2010-03-29 19:23:50 +0000860 }
861 va_end(ap);
862 abort();
863}
864
865void cpu_synchronize_all_states(void)
866{
Andreas Färber182735e2013-05-29 22:29:20 +0200867 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000868
Andreas Färberbdc44642013-06-24 23:50:24 +0200869 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200870 cpu_synchronize_state(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000871 }
872}
873
874void cpu_synchronize_all_post_reset(void)
875{
Andreas Färber182735e2013-05-29 22:29:20 +0200876 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000877
Andreas Färberbdc44642013-06-24 23:50:24 +0200878 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200879 cpu_synchronize_post_reset(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000880 }
881}
882
883void cpu_synchronize_all_post_init(void)
884{
Andreas Färber182735e2013-05-29 22:29:20 +0200885 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000886
Andreas Färberbdc44642013-06-24 23:50:24 +0200887 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200888 cpu_synchronize_post_init(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000889 }
890}
891
Kevin Wolf56983462013-07-05 13:49:54 +0200892static int do_vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +0000893{
Kevin Wolf56983462013-07-05 13:49:54 +0200894 int ret = 0;
895
Luiz Capitulino13548692011-07-29 15:36:43 -0300896 if (runstate_is_running()) {
Blue Swirl296af7c2010-03-29 19:23:50 +0000897 cpu_disable_ticks();
Blue Swirl296af7c2010-03-29 19:23:50 +0000898 pause_all_vcpus();
Luiz Capitulinof5bbfba2011-07-29 15:04:45 -0300899 runstate_set(state);
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -0300900 vm_state_notify(0, state);
Wenchao Xiaa4e15de2014-06-18 08:43:36 +0200901 qapi_event_send_stop(&error_abort);
Blue Swirl296af7c2010-03-29 19:23:50 +0000902 }
Kevin Wolf56983462013-07-05 13:49:54 +0200903
Kevin Wolf594a45c2013-07-18 14:52:19 +0200904 bdrv_drain_all();
Pavel Dovgalyuk6d0ceb82016-09-26 11:08:16 +0300905 replay_disable_events();
John Snow22af08e2016-09-22 21:45:51 -0400906 ret = bdrv_flush_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +0200907
Kevin Wolf56983462013-07-05 13:49:54 +0200908 return ret;
Blue Swirl296af7c2010-03-29 19:23:50 +0000909}
910
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200911static bool cpu_can_run(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +0000912{
Andreas Färber4fdeee72012-05-02 23:10:09 +0200913 if (cpu->stop) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200914 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100915 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +0800916 if (cpu_is_stopped(cpu)) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200917 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100918 }
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200919 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +0000920}
921
Andreas Färber91325042013-05-27 02:07:49 +0200922static void cpu_handle_guest_debug(CPUState *cpu)
Jan Kiszka3c638d02010-06-25 16:56:56 +0200923{
Andreas Färber64f6b342013-05-27 02:06:09 +0200924 gdb_set_stop_cpu(cpu);
Jan Kiszka8cf71712011-02-07 12:19:16 +0100925 qemu_system_debug_request();
Andreas Färberf324e762012-05-02 23:26:21 +0200926 cpu->stopped = true;
Jan Kiszka3c638d02010-06-25 16:56:56 +0200927}
928
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100929#ifdef CONFIG_LINUX
930static void sigbus_reraise(void)
931{
932 sigset_t set;
933 struct sigaction action;
934
935 memset(&action, 0, sizeof(action));
936 action.sa_handler = SIG_DFL;
937 if (!sigaction(SIGBUS, &action, NULL)) {
938 raise(SIGBUS);
939 sigemptyset(&set);
940 sigaddset(&set, SIGBUS);
Peter Maydella2d17612016-05-16 18:33:59 +0100941 pthread_sigmask(SIG_UNBLOCK, &set, NULL);
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100942 }
943 perror("Failed to re-raise SIGBUS!\n");
944 abort();
945}
946
Paolo Bonzinid98d4072017-02-08 13:22:12 +0100947static void sigbus_handler(int n, siginfo_t *siginfo, void *ctx)
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100948{
Paolo Bonzinia16fc072017-02-09 09:50:02 +0100949 if (siginfo->si_code != BUS_MCEERR_AO && siginfo->si_code != BUS_MCEERR_AR) {
950 sigbus_reraise();
951 }
952
Paolo Bonzini2ae41db2017-02-08 12:48:54 +0100953 if (current_cpu) {
954 /* Called asynchronously in VCPU thread. */
955 if (kvm_on_sigbus_vcpu(current_cpu, siginfo->si_code, siginfo->si_addr)) {
956 sigbus_reraise();
957 }
958 } else {
959 /* Called synchronously (via signalfd) in main thread. */
960 if (kvm_on_sigbus(siginfo->si_code, siginfo->si_addr)) {
961 sigbus_reraise();
962 }
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100963 }
964}
965
966static void qemu_init_sigbus(void)
967{
968 struct sigaction action;
969
970 memset(&action, 0, sizeof(action));
971 action.sa_flags = SA_SIGINFO;
Paolo Bonzinid98d4072017-02-08 13:22:12 +0100972 action.sa_sigaction = sigbus_handler;
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100973 sigaction(SIGBUS, &action, NULL);
974
975 prctl(PR_MCE_KILL, PR_MCE_KILL_SET, PR_MCE_KILL_EARLY, 0, 0);
976}
Paolo Bonzinia16fc072017-02-09 09:50:02 +0100977#else /* !CONFIG_LINUX */
/* Builds without CONFIG_LINUX install no SIGBUS handler. */
static void qemu_init_sigbus(void)
{
    /* nothing to do */
}
Paolo Bonzinia16fc072017-02-09 09:50:02 +0100981#endif /* !CONFIG_LINUX */
Blue Swirl296af7c2010-03-29 19:23:50 +0000982
Stefan Weilb2532d82012-09-27 07:41:42 +0200983static QemuMutex qemu_global_mutex;
Blue Swirl296af7c2010-03-29 19:23:50 +0000984
985static QemuThread io_thread;
986
Blue Swirl296af7c2010-03-29 19:23:50 +0000987/* cpu creation */
988static QemuCond qemu_cpu_cond;
989/* system init */
Blue Swirl296af7c2010-03-29 19:23:50 +0000990static QemuCond qemu_pause_cond;
991
Paolo Bonzinid3b12f52011-09-13 10:30:52 +0200992void qemu_init_cpu_loop(void)
Blue Swirl296af7c2010-03-29 19:23:50 +0000993{
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100994 qemu_init_sigbus();
Anthony Liguoried945922011-02-08 18:18:18 +0100995 qemu_cond_init(&qemu_cpu_cond);
Anthony Liguoried945922011-02-08 18:18:18 +0100996 qemu_cond_init(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +0000997 qemu_mutex_init(&qemu_global_mutex);
Blue Swirl296af7c2010-03-29 19:23:50 +0000998
Jan Kiszkab7680cb2011-03-12 17:43:51 +0100999 qemu_thread_get_self(&io_thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001000}
1001
Paolo Bonzini14e6fe12016-10-31 10:36:08 +01001002void run_on_cpu(CPUState *cpu, run_on_cpu_func func, run_on_cpu_data data)
Marcelo Tosattie82bcec2010-05-04 09:45:22 -03001003{
Sergey Fedorovd148d902016-08-29 09:51:00 +02001004 do_run_on_cpu(cpu, func, data, &qemu_global_mutex);
Chegu Vinod3c022702013-06-24 03:49:41 -06001005}
1006
Gu Zheng4c055ab2016-05-12 09:18:13 +05301007static void qemu_kvm_destroy_vcpu(CPUState *cpu)
1008{
1009 if (kvm_destroy_vcpu(cpu) < 0) {
1010 error_report("kvm_destroy_vcpu failed");
1011 exit(EXIT_FAILURE);
1012 }
1013}
1014
1015static void qemu_tcg_destroy_vcpu(CPUState *cpu)
1016{
1017}
1018
Andreas Färber509a0d72012-05-03 02:18:09 +02001019static void qemu_wait_io_event_common(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001020{
Alex Bennée37257942017-02-23 18:29:14 +00001021 atomic_mb_set(&cpu->thread_kicked, false);
Andreas Färber4fdeee72012-05-02 23:10:09 +02001022 if (cpu->stop) {
1023 cpu->stop = false;
Andreas Färberf324e762012-05-02 23:26:21 +02001024 cpu->stopped = true;
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001025 qemu_cond_broadcast(&qemu_pause_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +00001026 }
Sergey Fedorova5403c62016-08-02 18:27:36 +01001027 process_queued_cpu_work(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001028}
1029
1030static bool qemu_tcg_should_sleep(CPUState *cpu)
1031{
1032 if (mttcg_enabled) {
1033 return cpu_thread_is_idle(cpu);
1034 } else {
1035 return all_cpu_threads_idle();
1036 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001037}
1038
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001039static void qemu_tcg_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001040{
Alex Bennée37257942017-02-23 18:29:14 +00001041 while (qemu_tcg_should_sleep(cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +00001042 stop_tcg_kick_timer();
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001043 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001044 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001045
Alex Bennée65467062017-02-23 18:29:09 +00001046 start_tcg_kick_timer();
1047
Alex Bennée37257942017-02-23 18:29:14 +00001048 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001049}
1050
Andreas Färberfd529e82013-05-26 23:24:55 +02001051static void qemu_kvm_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001052{
Andreas Färbera98ae1d2013-05-26 23:21:08 +02001053 while (cpu_thread_is_idle(cpu)) {
Andreas Färberf5c121b2012-05-03 01:22:49 +02001054 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001055 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001056
Andreas Färber509a0d72012-05-03 02:18:09 +02001057 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001058}
1059
Jan Kiszka7e97cd82011-02-07 12:19:12 +01001060static void *qemu_kvm_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001061{
Andreas Färber48a106b2013-05-27 02:20:39 +02001062 CPUState *cpu = arg;
Jan Kiszka84b49152011-02-01 22:15:50 +01001063 int r;
Blue Swirl296af7c2010-03-29 19:23:50 +00001064
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001065 rcu_register_thread();
1066
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001067 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001068 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001069 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001070 cpu->can_do_io = 1;
Andreas Färber4917cf42013-05-27 05:17:50 +02001071 current_cpu = cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001072
Andreas Färber504134d2012-12-17 06:38:45 +01001073 r = kvm_init_vcpu(cpu);
Jan Kiszka84b49152011-02-01 22:15:50 +01001074 if (r < 0) {
1075 fprintf(stderr, "kvm_init_vcpu failed: %s\n", strerror(-r));
1076 exit(1);
1077 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001078
Paolo Bonzini18268b62017-02-09 09:41:14 +01001079 kvm_init_cpu_signals(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001080
1081 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001082 cpu->created = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001083 qemu_cond_signal(&qemu_cpu_cond);
1084
Gu Zheng4c055ab2016-05-12 09:18:13 +05301085 do {
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001086 if (cpu_can_run(cpu)) {
Andreas Färber1458c362013-05-26 23:46:55 +02001087 r = kvm_cpu_exec(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001088 if (r == EXCP_DEBUG) {
Andreas Färber91325042013-05-27 02:07:49 +02001089 cpu_handle_guest_debug(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +01001090 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001091 }
Andreas Färberfd529e82013-05-26 23:24:55 +02001092 qemu_kvm_wait_io_event(cpu);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301093 } while (!cpu->unplug || cpu_can_run(cpu));
Blue Swirl296af7c2010-03-29 19:23:50 +00001094
Gu Zheng4c055ab2016-05-12 09:18:13 +05301095 qemu_kvm_destroy_vcpu(cpu);
Bharata B Rao2c579042016-05-12 09:18:14 +05301096 cpu->created = false;
1097 qemu_cond_signal(&qemu_cpu_cond);
Gu Zheng4c055ab2016-05-12 09:18:13 +05301098 qemu_mutex_unlock_iothread();
Blue Swirl296af7c2010-03-29 19:23:50 +00001099 return NULL;
1100}
1101
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001102static void *qemu_dummy_cpu_thread_fn(void *arg)
1103{
1104#ifdef _WIN32
1105 fprintf(stderr, "qtest is not supported under Windows\n");
1106 exit(1);
1107#else
Andreas Färber10a90212013-05-27 02:24:35 +02001108 CPUState *cpu = arg;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001109 sigset_t waitset;
1110 int r;
1111
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001112 rcu_register_thread();
1113
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001114 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001115 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001116 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001117 cpu->can_do_io = 1;
Alex Bennée37257942017-02-23 18:29:14 +00001118 current_cpu = cpu;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001119
1120 sigemptyset(&waitset);
1121 sigaddset(&waitset, SIG_IPI);
1122
1123 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001124 cpu->created = true;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001125 qemu_cond_signal(&qemu_cpu_cond);
1126
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001127 while (1) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001128 qemu_mutex_unlock_iothread();
1129 do {
1130 int sig;
1131 r = sigwait(&waitset, &sig);
1132 } while (r == -1 && (errno == EAGAIN || errno == EINTR));
1133 if (r == -1) {
1134 perror("sigwait");
1135 exit(1);
1136 }
1137 qemu_mutex_lock_iothread();
Andreas Färber509a0d72012-05-03 02:18:09 +02001138 qemu_wait_io_event_common(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001139 }
1140
1141 return NULL;
1142#endif
1143}
1144
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001145static int64_t tcg_get_icount_limit(void)
1146{
1147 int64_t deadline;
1148
1149 if (replay_mode != REPLAY_MODE_PLAY) {
1150 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1151
1152 /* Maintain prior (possibly buggy) behaviour where if no deadline
1153 * was set (as there is no QEMU_CLOCK_VIRTUAL timer) or it is more than
1154 * INT32_MAX nanoseconds ahead, we still use INT32_MAX
1155 * nanoseconds.
1156 */
1157 if ((deadline < 0) || (deadline > INT32_MAX)) {
1158 deadline = INT32_MAX;
1159 }
1160
1161 return qemu_icount_round(deadline);
1162 } else {
1163 return replay_get_instructions();
1164 }
1165}
1166
Alex Bennée12e97002016-10-27 16:10:14 +01001167static void handle_icount_deadline(void)
1168{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001169 assert(qemu_in_vcpu_thread());
Alex Bennée12e97002016-10-27 16:10:14 +01001170 if (use_icount) {
1171 int64_t deadline =
1172 qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1173
1174 if (deadline == 0) {
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001175 /* Wake up other AioContexts. */
Alex Bennée12e97002016-10-27 16:10:14 +01001176 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001177 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Alex Bennée12e97002016-10-27 16:10:14 +01001178 }
1179 }
1180}
1181
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001182static int tcg_cpu_exec(CPUState *cpu)
1183{
1184 int ret;
1185#ifdef CONFIG_PROFILER
1186 int64_t ti;
1187#endif
1188
1189#ifdef CONFIG_PROFILER
1190 ti = profile_getclock();
1191#endif
1192 if (use_icount) {
1193 int64_t count;
1194 int decr;
1195 timers_state.qemu_icount -= (cpu->icount_decr.u16.low
1196 + cpu->icount_extra);
1197 cpu->icount_decr.u16.low = 0;
1198 cpu->icount_extra = 0;
1199 count = tcg_get_icount_limit();
1200 timers_state.qemu_icount += count;
1201 decr = (count > 0xffff) ? 0xffff : count;
1202 count -= decr;
1203 cpu->icount_decr.u16.low = decr;
1204 cpu->icount_extra = count;
1205 }
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001206 qemu_mutex_unlock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001207 cpu_exec_start(cpu);
1208 ret = cpu_exec(cpu);
1209 cpu_exec_end(cpu);
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001210 qemu_mutex_lock_iothread();
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001211#ifdef CONFIG_PROFILER
1212 tcg_time += profile_getclock() - ti;
1213#endif
1214 if (use_icount) {
1215 /* Fold pending instructions back into the
1216 instruction counter, and clear the interrupt flag. */
1217 timers_state.qemu_icount -= (cpu->icount_decr.u16.low
1218 + cpu->icount_extra);
1219 cpu->icount_decr.u32 = 0;
1220 cpu->icount_extra = 0;
1221 replay_account_executed_instructions();
1222 }
1223 return ret;
1224}
1225
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001226/* Destroy any remaining vCPUs which have been unplugged and have
1227 * finished running
1228 */
1229static void deal_with_unplugged_cpus(void)
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001230{
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001231 CPUState *cpu;
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001232
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001233 CPU_FOREACH(cpu) {
1234 if (cpu->unplug && !cpu_can_run(cpu)) {
1235 qemu_tcg_destroy_vcpu(cpu);
1236 cpu->created = false;
1237 qemu_cond_signal(&qemu_cpu_cond);
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001238 break;
1239 }
1240 }
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001241}
Jan Kiszkabdb7ca62011-09-26 09:40:39 +02001242
Alex Bennée65467062017-02-23 18:29:09 +00001243/* Single-threaded TCG
1244 *
1245 * In the single-threaded case each vCPU is simulated in turn. If
1246 * there is more than a single vCPU we create a simple timer to kick
1247 * the vCPU and ensure we don't get stuck in a tight loop in one vCPU.
1248 * This is done explicitly rather than relying on side-effects
1249 * elsewhere.
1250 */
1251
Alex Bennée37257942017-02-23 18:29:14 +00001252static void *qemu_tcg_rr_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001253{
Andreas Färberc3586ba2012-05-03 01:41:24 +02001254 CPUState *cpu = arg;
Blue Swirl296af7c2010-03-29 19:23:50 +00001255
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001256 rcu_register_thread();
1257
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001258 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001259 qemu_thread_get_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001260
Andreas Färber38fcbd32013-07-07 19:50:23 +02001261 CPU_FOREACH(cpu) {
1262 cpu->thread_id = qemu_get_thread_id();
1263 cpu->created = true;
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001264 cpu->can_do_io = 1;
Andreas Färber38fcbd32013-07-07 19:50:23 +02001265 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001266 qemu_cond_signal(&qemu_cpu_cond);
1267
Jan Kiszkafa7d1862011-08-22 18:35:25 +02001268 /* wait for initial kick-off after machine start */
Emilio G. Cotac28e3992015-04-27 12:45:28 -04001269 while (first_cpu->stopped) {
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001270 qemu_cond_wait(first_cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001271
1272 /* process any pending work */
Andreas Färberbdc44642013-06-24 23:50:24 +02001273 CPU_FOREACH(cpu) {
Alex Bennée37257942017-02-23 18:29:14 +00001274 current_cpu = cpu;
Andreas Färber182735e2013-05-29 22:29:20 +02001275 qemu_wait_io_event_common(cpu);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001276 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001277 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001278
Alex Bennée65467062017-02-23 18:29:09 +00001279 start_tcg_kick_timer();
1280
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001281 cpu = first_cpu;
1282
Alex Bennéee5143e32017-02-23 18:29:12 +00001283 /* process any pending work */
1284 cpu->exit_request = 1;
1285
Blue Swirl296af7c2010-03-29 19:23:50 +00001286 while (1) {
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001287 /* Account partial waits to QEMU_CLOCK_VIRTUAL. */
1288 qemu_account_warp_timer();
1289
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001290 /* Run the timers here. This is much more efficient than
1291 * waking up the I/O thread and waiting for completion.
1292 */
1293 handle_icount_deadline();
1294
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001295 if (!cpu) {
1296 cpu = first_cpu;
1297 }
1298
Alex Bennéee5143e32017-02-23 18:29:12 +00001299 while (cpu && !cpu->queued_work_first && !cpu->exit_request) {
1300
Alex Bennée791158d2017-02-23 18:29:10 +00001301 atomic_mb_set(&tcg_current_rr_cpu, cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001302 current_cpu = cpu;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001303
1304 qemu_clock_enable(QEMU_CLOCK_VIRTUAL,
1305 (cpu->singlestep_enabled & SSTEP_NOTIMER) == 0);
1306
1307 if (cpu_can_run(cpu)) {
1308 int r;
1309 r = tcg_cpu_exec(cpu);
1310 if (r == EXCP_DEBUG) {
1311 cpu_handle_guest_debug(cpu);
1312 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001313 } else if (r == EXCP_ATOMIC) {
1314 qemu_mutex_unlock_iothread();
1315 cpu_exec_step_atomic(cpu);
1316 qemu_mutex_lock_iothread();
1317 break;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001318 }
Alex Bennée37257942017-02-23 18:29:14 +00001319 } else if (cpu->stop) {
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001320 if (cpu->unplug) {
1321 cpu = CPU_NEXT(cpu);
1322 }
1323 break;
1324 }
1325
Alex Bennéee5143e32017-02-23 18:29:12 +00001326 cpu = CPU_NEXT(cpu);
1327 } /* while (cpu && !cpu->exit_request).. */
1328
Alex Bennée791158d2017-02-23 18:29:10 +00001329 /* Does not need atomic_mb_set because a spurious wakeup is okay. */
1330 atomic_set(&tcg_current_rr_cpu, NULL);
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001331
Alex Bennéee5143e32017-02-23 18:29:12 +00001332 if (cpu && cpu->exit_request) {
1333 atomic_mb_set(&cpu->exit_request, 0);
1334 }
Alex Blighac70aaf2013-08-21 16:02:57 +01001335
Alex Bennée37257942017-02-23 18:29:14 +00001336 qemu_tcg_wait_io_event(cpu ? cpu : QTAILQ_FIRST(&cpus));
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001337 deal_with_unplugged_cpus();
Blue Swirl296af7c2010-03-29 19:23:50 +00001338 }
1339
1340 return NULL;
1341}
1342
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001343static void *qemu_hax_cpu_thread_fn(void *arg)
1344{
1345 CPUState *cpu = arg;
1346 int r;
Vincent Palatinb3d3a422017-03-20 11:15:49 +01001347
1348 qemu_mutex_lock_iothread();
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001349 qemu_thread_get_self(cpu->thread);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001350
1351 cpu->thread_id = qemu_get_thread_id();
1352 cpu->created = true;
1353 cpu->halted = 0;
1354 current_cpu = cpu;
1355
1356 hax_init_vcpu(cpu);
1357 qemu_cond_signal(&qemu_cpu_cond);
1358
1359 while (1) {
1360 if (cpu_can_run(cpu)) {
1361 r = hax_smp_cpu_exec(cpu);
1362 if (r == EXCP_DEBUG) {
1363 cpu_handle_guest_debug(cpu);
1364 }
1365 }
1366
1367 while (cpu_thread_is_idle(cpu)) {
1368 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
1369 }
1370#ifdef _WIN32
1371 SleepEx(0, TRUE);
1372#endif
1373 qemu_wait_io_event_common(cpu);
1374 }
1375 return NULL;
1376}
1377
1378#ifdef _WIN32
1379static void CALLBACK dummy_apc_func(ULONG_PTR unused)
1380{
1381}
1382#endif
1383
Alex Bennée37257942017-02-23 18:29:14 +00001384/* Multi-threaded TCG
1385 *
1386 * In the multi-threaded case each vCPU has its own thread. The TLS
1387 * variable current_cpu can be used deep in the code to find the
1388 * current CPUState for a given thread.
1389 */
1390
1391static void *qemu_tcg_cpu_thread_fn(void *arg)
1392{
1393 CPUState *cpu = arg;
1394
Alex Bennéebf51c722017-03-30 18:32:29 +01001395 g_assert(!use_icount);
1396
Alex Bennée37257942017-02-23 18:29:14 +00001397 rcu_register_thread();
1398
1399 qemu_mutex_lock_iothread();
1400 qemu_thread_get_self(cpu->thread);
1401
1402 cpu->thread_id = qemu_get_thread_id();
1403 cpu->created = true;
1404 cpu->can_do_io = 1;
1405 current_cpu = cpu;
1406 qemu_cond_signal(&qemu_cpu_cond);
1407
1408 /* process any pending work */
1409 cpu->exit_request = 1;
1410
1411 while (1) {
1412 if (cpu_can_run(cpu)) {
1413 int r;
1414 r = tcg_cpu_exec(cpu);
1415 switch (r) {
1416 case EXCP_DEBUG:
1417 cpu_handle_guest_debug(cpu);
1418 break;
1419 case EXCP_HALTED:
1420 /* during start-up the vCPU is reset and the thread is
1421 * kicked several times. If we don't ensure we go back
1422 * to sleep in the halted state we won't cleanly
1423 * start-up when the vCPU is enabled.
1424 *
1425 * cpu->halted should ensure we sleep in wait_io_event
1426 */
1427 g_assert(cpu->halted);
1428 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001429 case EXCP_ATOMIC:
1430 qemu_mutex_unlock_iothread();
1431 cpu_exec_step_atomic(cpu);
1432 qemu_mutex_lock_iothread();
Alex Bennée37257942017-02-23 18:29:14 +00001433 default:
1434 /* Ignore everything else? */
1435 break;
1436 }
1437 }
1438
Alex Bennée37257942017-02-23 18:29:14 +00001439 atomic_mb_set(&cpu->exit_request, 0);
1440 qemu_tcg_wait_io_event(cpu);
1441 }
1442
1443 return NULL;
1444}
1445
Andreas Färber2ff09a42012-05-03 00:23:30 +02001446static void qemu_cpu_kick_thread(CPUState *cpu)
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001447{
1448#ifndef _WIN32
1449 int err;
1450
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001451 if (cpu->thread_kicked) {
1452 return;
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001453 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001454 cpu->thread_kicked = true;
Andreas Färber814e6122012-05-02 17:00:37 +02001455 err = pthread_kill(cpu->thread->thread, SIG_IPI);
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001456 if (err) {
1457 fprintf(stderr, "qemu:%s: %s", __func__, strerror(err));
1458 exit(1);
1459 }
1460#else /* _WIN32 */
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001461 if (!qemu_cpu_is_self(cpu)) {
1462 if (!QueueUserAPC(dummy_apc_func, cpu->hThread, 0)) {
1463 fprintf(stderr, "%s: QueueUserAPC failed with error %lu\n",
1464 __func__, GetLastError());
1465 exit(1);
1466 }
1467 }
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001468#endif
1469}
1470
Andreas Färberc08d7422012-05-03 04:34:15 +02001471void qemu_cpu_kick(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001472{
Andreas Färberf5c121b2012-05-03 01:22:49 +02001473 qemu_cond_broadcast(cpu->halt_cond);
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001474 if (tcg_enabled()) {
Alex Bennée791158d2017-02-23 18:29:10 +00001475 cpu_exit(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001476 /* NOP unless doing single-thread RR */
Alex Bennée791158d2017-02-23 18:29:10 +00001477 qemu_cpu_kick_rr_cpu();
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001478 } else {
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001479 if (hax_enabled()) {
1480 /*
1481 * FIXME: race condition with the exit_request check in
1482 * hax_vcpu_hax_exec
1483 */
1484 cpu->exit_request = 1;
1485 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001486 qemu_cpu_kick_thread(cpu);
1487 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001488}
1489
Jan Kiszka46d62fa2011-02-01 22:15:59 +01001490void qemu_cpu_kick_self(void)
1491{
Andreas Färber4917cf42013-05-27 05:17:50 +02001492 assert(current_cpu);
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001493 qemu_cpu_kick_thread(current_cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001494}
1495
Andreas Färber60e82572012-05-02 22:23:49 +02001496bool qemu_cpu_is_self(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001497{
Andreas Färber814e6122012-05-02 17:00:37 +02001498 return qemu_thread_is_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001499}
1500
Paolo Bonzini79e2b9a2015-01-21 12:09:14 +01001501bool qemu_in_vcpu_thread(void)
Juan Quintelaaa723c22012-09-18 16:30:11 +02001502{
Andreas Färber4917cf42013-05-27 05:17:50 +02001503 return current_cpu && qemu_cpu_is_self(current_cpu);
Juan Quintelaaa723c22012-09-18 16:30:11 +02001504}
1505
/*
 * Per-thread record of whether this thread took the global mutex through
 * qemu_mutex_lock_iothread().  Static storage, so it starts out false.
 */
static __thread bool iothread_locked;

/* Report whether the calling thread currently holds the iothread lock. */
bool qemu_mutex_iothread_locked(void)
{
    return iothread_locked;
}
1512
Blue Swirl296af7c2010-03-29 19:23:50 +00001513void qemu_mutex_lock_iothread(void)
1514{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001515 g_assert(!qemu_mutex_iothread_locked());
1516 qemu_mutex_lock(&qemu_global_mutex);
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001517 iothread_locked = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001518}
1519
1520void qemu_mutex_unlock_iothread(void)
1521{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001522 g_assert(qemu_mutex_iothread_locked());
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001523 iothread_locked = false;
Blue Swirl296af7c2010-03-29 19:23:50 +00001524 qemu_mutex_unlock(&qemu_global_mutex);
1525}
1526
Alex Bennéee8faee02016-10-27 16:09:58 +01001527static bool all_vcpus_paused(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001528{
Andreas Färberbdc44642013-06-24 23:50:24 +02001529 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001530
Andreas Färberbdc44642013-06-24 23:50:24 +02001531 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001532 if (!cpu->stopped) {
Alex Bennéee8faee02016-10-27 16:09:58 +01001533 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001534 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001535 }
1536
Alex Bennéee8faee02016-10-27 16:09:58 +01001537 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001538}
1539
1540void pause_all_vcpus(void)
1541{
Andreas Färberbdc44642013-06-24 23:50:24 +02001542 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001543
Alex Bligh40daca52013-08-21 16:03:02 +01001544 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, false);
Andreas Färberbdc44642013-06-24 23:50:24 +02001545 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001546 cpu->stop = true;
1547 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001548 }
1549
Juan Quintelaaa723c22012-09-18 16:30:11 +02001550 if (qemu_in_vcpu_thread()) {
Jan Kiszkad798e972012-02-17 18:31:16 +01001551 cpu_stop_current();
Jan Kiszkad798e972012-02-17 18:31:16 +01001552 }
1553
Blue Swirl296af7c2010-03-29 19:23:50 +00001554 while (!all_vcpus_paused()) {
Paolo Bonzinibe7d6c52011-03-12 17:44:02 +01001555 qemu_cond_wait(&qemu_pause_cond, &qemu_global_mutex);
Andreas Färberbdc44642013-06-24 23:50:24 +02001556 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001557 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001558 }
1559 }
1560}
1561
Igor Mammedov29936832013-04-23 10:29:37 +02001562void cpu_resume(CPUState *cpu)
1563{
1564 cpu->stop = false;
1565 cpu->stopped = false;
1566 qemu_cpu_kick(cpu);
1567}
1568
Blue Swirl296af7c2010-03-29 19:23:50 +00001569void resume_all_vcpus(void)
1570{
Andreas Färberbdc44642013-06-24 23:50:24 +02001571 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001572
Alex Bligh40daca52013-08-21 16:03:02 +01001573 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, true);
Andreas Färberbdc44642013-06-24 23:50:24 +02001574 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001575 cpu_resume(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001576 }
1577}
1578
Gu Zheng4c055ab2016-05-12 09:18:13 +05301579void cpu_remove(CPUState *cpu)
1580{
1581 cpu->stop = true;
1582 cpu->unplug = true;
1583 qemu_cpu_kick(cpu);
1584}
1585
Bharata B Rao2c579042016-05-12 09:18:14 +05301586void cpu_remove_sync(CPUState *cpu)
1587{
1588 cpu_remove(cpu);
1589 while (cpu->created) {
1590 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1591 }
1592}
1593
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001594/* For temporary buffers for forming a name */
1595#define VCPU_THREAD_NAME_SIZE 16
1596
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001597static void qemu_tcg_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001598{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001599 char thread_name[VCPU_THREAD_NAME_SIZE];
Alex Bennée37257942017-02-23 18:29:14 +00001600 static QemuCond *single_tcg_halt_cond;
1601 static QemuThread *single_tcg_cpu_thread;
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001602
Alex Bennée37257942017-02-23 18:29:14 +00001603 if (qemu_tcg_mttcg_enabled() || !single_tcg_cpu_thread) {
Andreas Färber814e6122012-05-02 17:00:37 +02001604 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001605 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1606 qemu_cond_init(cpu->halt_cond);
Alex Bennée37257942017-02-23 18:29:14 +00001607
1608 if (qemu_tcg_mttcg_enabled()) {
1609 /* create a thread per vCPU with TCG (MTTCG) */
1610 parallel_cpus = true;
1611 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/TCG",
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001612 cpu->cpu_index);
Alex Bennée37257942017-02-23 18:29:14 +00001613
1614 qemu_thread_create(cpu->thread, thread_name, qemu_tcg_cpu_thread_fn,
1615 cpu, QEMU_THREAD_JOINABLE);
1616
1617 } else {
1618 /* share a single thread for all cpus with TCG */
1619 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "ALL CPUs/TCG");
1620 qemu_thread_create(cpu->thread, thread_name,
1621 qemu_tcg_rr_cpu_thread_fn,
1622 cpu, QEMU_THREAD_JOINABLE);
1623
1624 single_tcg_halt_cond = cpu->halt_cond;
1625 single_tcg_cpu_thread = cpu->thread;
1626 }
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001627#ifdef _WIN32
Andreas Färber814e6122012-05-02 17:00:37 +02001628 cpu->hThread = qemu_thread_get_handle(cpu->thread);
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001629#endif
Andreas Färber61a46212012-05-02 22:49:36 +02001630 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001631 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001632 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001633 } else {
Alex Bennée37257942017-02-23 18:29:14 +00001634 /* For non-MTTCG cases we share the thread */
1635 cpu->thread = single_tcg_cpu_thread;
1636 cpu->halt_cond = single_tcg_halt_cond;
Blue Swirl296af7c2010-03-29 19:23:50 +00001637 }
1638}
1639
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001640static void qemu_hax_start_vcpu(CPUState *cpu)
1641{
1642 char thread_name[VCPU_THREAD_NAME_SIZE];
1643
1644 cpu->thread = g_malloc0(sizeof(QemuThread));
1645 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1646 qemu_cond_init(cpu->halt_cond);
1647
1648 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/HAX",
1649 cpu->cpu_index);
1650 qemu_thread_create(cpu->thread, thread_name, qemu_hax_cpu_thread_fn,
1651 cpu, QEMU_THREAD_JOINABLE);
1652#ifdef _WIN32
1653 cpu->hThread = qemu_thread_get_handle(cpu->thread);
1654#endif
1655 while (!cpu->created) {
1656 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1657 }
1658}
1659
Andreas Färber48a106b2013-05-27 02:20:39 +02001660static void qemu_kvm_start_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001661{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001662 char thread_name[VCPU_THREAD_NAME_SIZE];
1663
Andreas Färber814e6122012-05-02 17:00:37 +02001664 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001665 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1666 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001667 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/KVM",
1668 cpu->cpu_index);
1669 qemu_thread_create(cpu->thread, thread_name, qemu_kvm_cpu_thread_fn,
1670 cpu, QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001671 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001672 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001673 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001674}
1675
Andreas Färber10a90212013-05-27 02:24:35 +02001676static void qemu_dummy_start_vcpu(CPUState *cpu)
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001677{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001678 char thread_name[VCPU_THREAD_NAME_SIZE];
1679
Andreas Färber814e6122012-05-02 17:00:37 +02001680 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001681 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1682 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001683 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/DUMMY",
1684 cpu->cpu_index);
1685 qemu_thread_create(cpu->thread, thread_name, qemu_dummy_cpu_thread_fn, cpu,
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001686 QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001687 while (!cpu->created) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001688 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1689 }
1690}
1691
Andreas Färberc643bed2013-05-27 03:23:24 +02001692void qemu_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001693{
Andreas Färberce3960e2012-12-17 03:27:07 +01001694 cpu->nr_cores = smp_cores;
1695 cpu->nr_threads = smp_threads;
Andreas Färberf324e762012-05-02 23:26:21 +02001696 cpu->stopped = true;
Peter Maydell56943e82016-01-21 14:15:04 +00001697
1698 if (!cpu->as) {
1699 /* If the target cpu hasn't set up any address spaces itself,
1700 * give it the default one.
1701 */
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001702 AddressSpace *as = address_space_init_shareable(cpu->memory,
1703 "cpu-memory");
Peter Maydell12ebc9a2016-01-21 14:15:04 +00001704 cpu->num_ases = 1;
Peter Crosthwaite6731d862016-01-21 14:15:06 +00001705 cpu_address_space_init(cpu, as, 0);
Peter Maydell56943e82016-01-21 14:15:04 +00001706 }
1707
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001708 if (kvm_enabled()) {
Andreas Färber48a106b2013-05-27 02:20:39 +02001709 qemu_kvm_start_vcpu(cpu);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001710 } else if (hax_enabled()) {
1711 qemu_hax_start_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001712 } else if (tcg_enabled()) {
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001713 qemu_tcg_init_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001714 } else {
Andreas Färber10a90212013-05-27 02:24:35 +02001715 qemu_dummy_start_vcpu(cpu);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001716 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001717}
1718
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001719void cpu_stop_current(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001720{
Andreas Färber4917cf42013-05-27 05:17:50 +02001721 if (current_cpu) {
1722 current_cpu->stop = false;
1723 current_cpu->stopped = true;
1724 cpu_exit(current_cpu);
Dr. David Alan Gilbert96bce682016-01-25 10:08:18 +00001725 qemu_cond_broadcast(&qemu_pause_cond);
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001726 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001727}
1728
Kevin Wolf56983462013-07-05 13:49:54 +02001729int vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +00001730{
Juan Quintelaaa723c22012-09-18 16:30:11 +02001731 if (qemu_in_vcpu_thread()) {
Paolo Bonzini74892d22014-06-05 14:53:58 +02001732 qemu_system_vmstop_request_prepare();
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -03001733 qemu_system_vmstop_request(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001734 /*
1735 * FIXME: should not return to device code in case
1736 * vm_stop() has been requested.
1737 */
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001738 cpu_stop_current();
Kevin Wolf56983462013-07-05 13:49:54 +02001739 return 0;
Blue Swirl296af7c2010-03-29 19:23:50 +00001740 }
Kevin Wolf56983462013-07-05 13:49:54 +02001741
1742 return do_vm_stop(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001743}
1744
Claudio Imbrenda2d76e822017-02-14 18:07:47 +01001745/**
1746 * Prepare for (re)starting the VM.
1747 * Returns -1 if the vCPUs are not to be restarted (e.g. if they are already
1748 * running or in case of an error condition), 0 otherwise.
1749 */
1750int vm_prepare_start(void)
1751{
1752 RunState requested;
1753 int res = 0;
1754
1755 qemu_vmstop_requested(&requested);
1756 if (runstate_is_running() && requested == RUN_STATE__MAX) {
1757 return -1;
1758 }
1759
1760 /* Ensure that a STOP/RESUME pair of events is emitted if a
1761 * vmstop request was pending. The BLOCK_IO_ERROR event, for
1762 * example, according to documentation is always followed by
1763 * the STOP event.
1764 */
1765 if (runstate_is_running()) {
1766 qapi_event_send_stop(&error_abort);
1767 res = -1;
1768 } else {
1769 replay_enable_events();
1770 cpu_enable_ticks();
1771 runstate_set(RUN_STATE_RUNNING);
1772 vm_state_notify(1, RUN_STATE_RUNNING);
1773 }
1774
1775 /* We are sending this now, but the CPUs will be resumed shortly later */
1776 qapi_event_send_resume(&error_abort);
1777 return res;
1778}
1779
/*
 * Start (or restart) the VM: resume all vCPUs, but only when
 * vm_prepare_start() returns 0.
 */
void vm_start(void)
{
    if (vm_prepare_start() == 0) {
        resume_all_vcpus();
    }
}
1786
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001787/* does a state transition even if the VM is already stopped,
1788 current state is forgotten forever */
Kevin Wolf56983462013-07-05 13:49:54 +02001789int vm_stop_force_state(RunState state)
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001790{
1791 if (runstate_is_running()) {
Kevin Wolf56983462013-07-05 13:49:54 +02001792 return vm_stop(state);
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001793 } else {
1794 runstate_set(state);
Wen Congyangb2780d32015-11-20 17:34:38 +08001795
1796 bdrv_drain_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +02001797 /* Make sure to return an error if the flush in a previous vm_stop()
1798 * failed. */
John Snow22af08e2016-09-22 21:45:51 -04001799 return bdrv_flush_all();
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001800 }
1801}
1802
Stefan Weil9a78eea2010-10-22 23:03:33 +02001803void list_cpus(FILE *f, fprintf_function cpu_fprintf, const char *optarg)
Blue Swirl262353c2010-05-04 19:55:35 +00001804{
1805 /* XXX: implement xxx_cpu_list for targets that still miss it */
Peter Maydelle916cbf2012-09-05 17:41:08 -03001806#if defined(cpu_list)
1807 cpu_list(f, cpu_fprintf);
Blue Swirl262353c2010-05-04 19:55:35 +00001808#endif
1809}
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001810
1811CpuInfoList *qmp_query_cpus(Error **errp)
1812{
1813 CpuInfoList *head = NULL, *cur_item = NULL;
Andreas Färber182735e2013-05-29 22:29:20 +02001814 CPUState *cpu;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001815
Andreas Färberbdc44642013-06-24 23:50:24 +02001816 CPU_FOREACH(cpu) {
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001817 CpuInfoList *info;
Andreas Färber182735e2013-05-29 22:29:20 +02001818#if defined(TARGET_I386)
1819 X86CPU *x86_cpu = X86_CPU(cpu);
1820 CPUX86State *env = &x86_cpu->env;
1821#elif defined(TARGET_PPC)
1822 PowerPCCPU *ppc_cpu = POWERPC_CPU(cpu);
1823 CPUPPCState *env = &ppc_cpu->env;
1824#elif defined(TARGET_SPARC)
1825 SPARCCPU *sparc_cpu = SPARC_CPU(cpu);
1826 CPUSPARCState *env = &sparc_cpu->env;
1827#elif defined(TARGET_MIPS)
1828 MIPSCPU *mips_cpu = MIPS_CPU(cpu);
1829 CPUMIPSState *env = &mips_cpu->env;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001830#elif defined(TARGET_TRICORE)
1831 TriCoreCPU *tricore_cpu = TRICORE_CPU(cpu);
1832 CPUTriCoreState *env = &tricore_cpu->env;
Andreas Färber182735e2013-05-29 22:29:20 +02001833#endif
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001834
Andreas Färbercb446ec2013-05-01 14:24:52 +02001835 cpu_synchronize_state(cpu);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001836
1837 info = g_malloc0(sizeof(*info));
1838 info->value = g_malloc0(sizeof(*info->value));
Andreas Färber55e5c282012-12-17 06:18:02 +01001839 info->value->CPU = cpu->cpu_index;
Andreas Färber182735e2013-05-29 22:29:20 +02001840 info->value->current = (cpu == first_cpu);
Andreas Färber259186a2013-01-17 18:51:17 +01001841 info->value->halted = cpu->halted;
Eduardo Habkost58f88d42015-05-08 16:04:22 -03001842 info->value->qom_path = object_get_canonical_path(OBJECT(cpu));
Andreas Färber9f09e182012-05-03 06:59:07 +02001843 info->value->thread_id = cpu->thread_id;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001844#if defined(TARGET_I386)
Eric Blake86f4b682015-11-18 01:52:59 -07001845 info->value->arch = CPU_INFO_ARCH_X86;
Eric Blake544a3732016-02-17 23:48:27 -07001846 info->value->u.x86.pc = env->eip + env->segs[R_CS].base;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001847#elif defined(TARGET_PPC)
Eric Blake86f4b682015-11-18 01:52:59 -07001848 info->value->arch = CPU_INFO_ARCH_PPC;
Eric Blake544a3732016-02-17 23:48:27 -07001849 info->value->u.ppc.nip = env->nip;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001850#elif defined(TARGET_SPARC)
Eric Blake86f4b682015-11-18 01:52:59 -07001851 info->value->arch = CPU_INFO_ARCH_SPARC;
Eric Blake544a3732016-02-17 23:48:27 -07001852 info->value->u.q_sparc.pc = env->pc;
1853 info->value->u.q_sparc.npc = env->npc;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001854#elif defined(TARGET_MIPS)
Eric Blake86f4b682015-11-18 01:52:59 -07001855 info->value->arch = CPU_INFO_ARCH_MIPS;
Eric Blake544a3732016-02-17 23:48:27 -07001856 info->value->u.q_mips.PC = env->active_tc.PC;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001857#elif defined(TARGET_TRICORE)
Eric Blake86f4b682015-11-18 01:52:59 -07001858 info->value->arch = CPU_INFO_ARCH_TRICORE;
Eric Blake544a3732016-02-17 23:48:27 -07001859 info->value->u.tricore.PC = env->PC;
Eric Blake86f4b682015-11-18 01:52:59 -07001860#else
1861 info->value->arch = CPU_INFO_ARCH_OTHER;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001862#endif
1863
1864 /* XXX: waiting for the qapi to support GSList */
1865 if (!cur_item) {
1866 head = cur_item = info;
1867 } else {
1868 cur_item->next = info;
1869 cur_item = info;
1870 }
1871 }
1872
1873 return head;
1874}
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001875
1876void qmp_memsave(int64_t addr, int64_t size, const char *filename,
1877 bool has_cpu, int64_t cpu_index, Error **errp)
1878{
1879 FILE *f;
1880 uint32_t l;
Andreas Färber55e5c282012-12-17 06:18:02 +01001881 CPUState *cpu;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001882 uint8_t buf[1024];
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001883 int64_t orig_addr = addr, orig_size = size;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001884
1885 if (!has_cpu) {
1886 cpu_index = 0;
1887 }
1888
Andreas Färber151d1322013-02-15 15:41:49 +01001889 cpu = qemu_get_cpu(cpu_index);
1890 if (cpu == NULL) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001891 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "cpu-index",
1892 "a CPU number");
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001893 return;
1894 }
1895
1896 f = fopen(filename, "wb");
1897 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001898 error_setg_file_open(errp, errno, filename);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001899 return;
1900 }
1901
1902 while (size != 0) {
1903 l = sizeof(buf);
1904 if (l > size)
1905 l = size;
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301906 if (cpu_memory_rw_debug(cpu, addr, buf, l, 0) != 0) {
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01001907 error_setg(errp, "Invalid addr 0x%016" PRIx64 "/size %" PRId64
1908 " specified", orig_addr, orig_size);
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301909 goto exit;
1910 }
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001911 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001912 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001913 goto exit;
1914 }
1915 addr += l;
1916 size -= l;
1917 }
1918
1919exit:
1920 fclose(f);
1921}
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001922
1923void qmp_pmemsave(int64_t addr, int64_t size, const char *filename,
1924 Error **errp)
1925{
1926 FILE *f;
1927 uint32_t l;
1928 uint8_t buf[1024];
1929
1930 f = fopen(filename, "wb");
1931 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001932 error_setg_file_open(errp, errno, filename);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001933 return;
1934 }
1935
1936 while (size != 0) {
1937 l = sizeof(buf);
1938 if (l > size)
1939 l = size;
Stefan Weileb6282f2014-04-07 20:28:23 +02001940 cpu_physical_memory_read(addr, buf, l);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001941 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01001942 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001943 goto exit;
1944 }
1945 addr += l;
1946 size -= l;
1947 }
1948
1949exit:
1950 fclose(f);
1951}
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001952
1953void qmp_inject_nmi(Error **errp)
1954{
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +10001955 nmi_monitor_handle(monitor_get_cpu_index(), errp);
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001956}
Sebastian Tanase27498be2014-07-25 11:56:33 +02001957
1958void dump_drift_info(FILE *f, fprintf_function cpu_fprintf)
1959{
1960 if (!use_icount) {
1961 return;
1962 }
1963
1964 cpu_fprintf(f, "Host - Guest clock %"PRIi64" ms\n",
1965 (cpu_get_clock() - cpu_get_icount())/SCALE_MS);
1966 if (icount_align_option) {
1967 cpu_fprintf(f, "Max guest delay %"PRIi64" ms\n", -max_delay/SCALE_MS);
1968 cpu_fprintf(f, "Max guest advance %"PRIi64" ms\n", max_advance/SCALE_MS);
1969 } else {
1970 cpu_fprintf(f, "Max guest delay NA\n");
1971 cpu_fprintf(f, "Max guest advance NA\n");
1972 }
1973}