blob: 0ddeeefc14f18da10a0a76919bccb31f807fb374 [file] [log] [blame]
Blue Swirl296af7c2010-03-29 19:23:50 +00001/*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24
Peter Maydell7b31bbc2016-01-26 18:16:56 +000025#include "qemu/osdep.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000026#include "qemu/config-file.h"
Paolo Bonzini33c11872016-03-15 16:58:45 +010027#include "cpu.h"
Paolo Bonzini83c90892012-12-17 18:19:49 +010028#include "monitor/monitor.h"
Markus Armbrustere688df62018-02-01 12:18:31 +010029#include "qapi/error.h"
Markus Armbruster112ed242018-02-26 17:13:27 -060030#include "qapi/qapi-commands-misc.h"
Markus Armbruster9af23982018-02-11 10:36:01 +010031#include "qapi/qapi-events-run-state.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020032#include "qapi/qmp/qerror.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010033#include "qemu/error-report.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010034#include "sysemu/sysemu.h"
Max Reitzda31d592016-03-16 19:54:32 +010035#include "sysemu/block-backend.h"
Paolo Bonzini022c62c2012-12-17 18:19:49 +010036#include "exec/gdbstub.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010037#include "sysemu/dma.h"
Vincent Palatinb3946622017-01-10 11:59:55 +010038#include "sysemu/hw_accel.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010039#include "sysemu/kvm.h"
Vincent Palatinb0cb0a62017-01-10 11:59:57 +010040#include "sysemu/hax.h"
Sergio Andres Gomez Del Realc97d6d22017-09-13 04:05:09 -050041#include "sysemu/hvf.h"
Justin Terry (VM)19306802018-01-22 13:07:49 -080042#include "sysemu/whpx.h"
Paolo Bonzini63c91552016-03-15 13:18:37 +010043#include "exec/exec-all.h"
Blue Swirl296af7c2010-03-29 19:23:50 +000044
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010045#include "qemu/thread.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010046#include "sysemu/cpus.h"
47#include "sysemu/qtest.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010048#include "qemu/main-loop.h"
Markus Armbruster922a01a2018-02-01 12:18:46 +010049#include "qemu/option.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010050#include "qemu/bitmap.h"
Liu Ping Fancb365642013-09-25 14:20:58 +080051#include "qemu/seqlock.h"
KONRAD Frederic8d4e9142017-02-23 18:29:08 +000052#include "tcg.h"
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +100053#include "hw/nmi.h"
Pavel Dovgalyuk8b427042015-09-17 19:24:05 +030054#include "sysemu/replay.h"
Igor Mammedovafed5a52017-05-10 13:29:55 +020055#include "hw/boards.h"
Jan Kiszka0ff0fc12011-06-23 10:15:55 +020056
Jan Kiszka6d9cb732011-02-01 22:15:58 +010057#ifdef CONFIG_LINUX
58
59#include <sys/prctl.h>
60
Marcelo Tosattic0532a72010-10-11 15:31:21 -030061#ifndef PR_MCE_KILL
62#define PR_MCE_KILL 33
63#endif
64
Jan Kiszka6d9cb732011-02-01 22:15:58 +010065#ifndef PR_MCE_KILL_SET
66#define PR_MCE_KILL_SET 1
67#endif
68
69#ifndef PR_MCE_KILL_EARLY
70#define PR_MCE_KILL_EARLY 1
71#endif
72
73#endif /* CONFIG_LINUX */
74
/*
 * Globals with external linkage, zero-initialised at program start.
 * NOTE(review): presumably the largest delay/advance observed between the
 * guest clock and the host clock -- confirm against the code that updates
 * them.
 */
int64_t max_delay;
int64_t max_advance;
Blue Swirl296af7c2010-03-29 19:23:50 +000077
/* vcpu throttling controls */
static QEMUTimer *throttle_timer;
static unsigned int throttle_percentage;

/*
 * NOTE(review): presumably the inclusive bounds for throttle_percentage and
 * the length of one throttling time slice; the _NS suffix suggests
 * nanoseconds (10000000 ns == 10 ms) -- confirm at the use sites.
 */
#define CPU_THROTTLE_PCT_MIN 1
#define CPU_THROTTLE_PCT_MAX 99
#define CPU_THROTTLE_TIMESLICE_NS 10000000
85
Tiejun Chen321bc0b2013-08-02 09:43:09 +080086bool cpu_is_stopped(CPUState *cpu)
87{
88 return cpu->stopped || !runstate_is_running();
89}
90
Andreas Färbera98ae1d2013-05-26 23:21:08 +020091static bool cpu_thread_is_idle(CPUState *cpu)
Peter Maydellac873f12012-07-19 16:52:27 +010092{
Andreas Färberc64ca812012-05-03 02:11:45 +020093 if (cpu->stop || cpu->queued_work_first) {
Peter Maydellac873f12012-07-19 16:52:27 +010094 return false;
95 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +080096 if (cpu_is_stopped(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +010097 return true;
98 }
Andreas Färber8c2e1b02013-08-25 18:53:55 +020099 if (!cpu->halted || cpu_has_work(cpu) ||
Alexander Graf215e79c2013-04-24 22:24:12 +0200100 kvm_halt_in_kernel()) {
Peter Maydellac873f12012-07-19 16:52:27 +0100101 return false;
102 }
103 return true;
104}
105
106static bool all_cpu_threads_idle(void)
107{
Andreas Färber182735e2013-05-29 22:29:20 +0200108 CPUState *cpu;
Peter Maydellac873f12012-07-19 16:52:27 +0100109
Andreas Färberbdc44642013-06-24 23:50:24 +0200110 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200111 if (!cpu_thread_is_idle(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +0100112 return false;
113 }
114 }
115 return true;
116}
117
Blue Swirl296af7c2010-03-29 19:23:50 +0000118/***********************************************************/
Paolo Bonzini946fb272011-09-12 13:57:37 +0200119/* guest cycle counter */
120
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200121/* Protected by TimersState seqlock */
122
/*
 * Consulted by the warp-timer code in this file: when false, the virtual
 * clock is advanced straight to the next deadline instead of arming the
 * real-time warp timer.
 */
static bool icount_sleep = true;
/* Arbitrarily pick 1MIPS as the minimum allowable speed. */
/* Upper bound for icount_time_shift: one instruction then counts as 1 << 10 ns. */
#define MAX_ICOUNT_SHIFT 10
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200126
Paolo Bonzini946fb272011-09-12 13:57:37 +0200127typedef struct TimersState {
Liu Ping Fancb365642013-09-25 14:20:58 +0800128 /* Protected by BQL. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200129 int64_t cpu_ticks_prev;
130 int64_t cpu_ticks_offset;
Liu Ping Fancb365642013-09-25 14:20:58 +0800131
Paolo Bonzini94377112018-08-14 09:57:16 +0200132 /* Protect fields that can be respectively read outside the
133 * BQL, and written from multiple threads.
Liu Ping Fancb365642013-09-25 14:20:58 +0800134 */
135 QemuSeqLock vm_clock_seqlock;
Paolo Bonzini94377112018-08-14 09:57:16 +0200136 QemuSpin vm_clock_lock;
137
138 int16_t cpu_ticks_enabled;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200139
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200140 /* Conversion factor from emulated instructions to virtual clock ticks. */
Paolo Bonzini94377112018-08-14 09:57:16 +0200141 int16_t icount_time_shift;
142
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200143 /* Compensate for varying guest execution speed. */
144 int64_t qemu_icount_bias;
Paolo Bonzini94377112018-08-14 09:57:16 +0200145
146 int64_t vm_clock_warp_start;
147 int64_t cpu_clock_offset;
148
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200149 /* Only written by TCG thread */
150 int64_t qemu_icount;
Paolo Bonzini94377112018-08-14 09:57:16 +0200151
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300152 /* for adjusting icount */
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300153 QEMUTimer *icount_rt_timer;
154 QEMUTimer *icount_vm_timer;
155 QEMUTimer *icount_warp_timer;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200156} TimersState;
157
/* The file-local TimersState instance used by the clock helpers below. */
static TimersState timers_state;
/* Assigned by qemu_tcg_configure(): true selects multi-threaded TCG. */
bool mttcg_enabled;
160
161/*
162 * We default to false if we know other options have been enabled
163 * which are currently incompatible with MTTCG. Otherwise when each
164 * guest (target) has been updated to support:
165 * - atomic instructions
166 * - memory ordering primitives (barriers)
167 * they can set the appropriate CONFIG flags in ${target}-softmmu.mak
168 *
169 * Once a guest architecture has been converted to the new primitives
170 * there are two remaining limitations to check.
171 *
172 * - The guest can't be oversized (e.g. 64 bit guest on 32 bit host)
173 * - The host must have a stronger memory order than the guest
174 *
175 * It may be possible in future to support strong guests on weak hosts
176 * but that will require tagging all load/stores in a guest with their
177 * implicit memory order requirements which would likely slow things
178 * down a lot.
179 */
180
/*
 * Return true when every memory-ordering bit in TCG_GUEST_DEFAULT_MO is
 * also present in TCG_TARGET_DEFAULT_MO.  If either macro is not defined
 * the answer is false.
 */
static bool check_tcg_memory_orders_compatible(void)
{
    bool compatible = false;

#if defined(TCG_GUEST_DEFAULT_MO) && defined(TCG_TARGET_DEFAULT_MO)
    /* No guest ordering requirement may be missing on the host side. */
    compatible = !(TCG_GUEST_DEFAULT_MO & ~TCG_TARGET_DEFAULT_MO);
#endif
    return compatible;
}
189
190static bool default_mttcg_enabled(void)
191{
Alex Bennée83fd9622017-02-27 17:09:01 +0000192 if (use_icount || TCG_OVERSIZED_GUEST) {
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000193 return false;
194 } else {
195#ifdef TARGET_SUPPORTS_MTTCG
196 return check_tcg_memory_orders_compatible();
197#else
198 return false;
199#endif
200 }
201}
202
203void qemu_tcg_configure(QemuOpts *opts, Error **errp)
204{
205 const char *t = qemu_opt_get(opts, "thread");
206 if (t) {
207 if (strcmp(t, "multi") == 0) {
208 if (TCG_OVERSIZED_GUEST) {
209 error_setg(errp, "No MTTCG when guest word size > hosts");
Alex Bennée83fd9622017-02-27 17:09:01 +0000210 } else if (use_icount) {
211 error_setg(errp, "No MTTCG when icount is enabled");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000212 } else {
Nikunj A Dadhania86953502017-04-10 11:36:55 +0530213#ifndef TARGET_SUPPORTS_MTTCG
Markus Armbruster07656912018-10-17 10:26:28 +0200214 warn_report("Guest not yet converted to MTTCG - "
215 "you may get unexpected results");
Alex Bennéec34c7622017-02-28 14:40:17 +0000216#endif
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000217 if (!check_tcg_memory_orders_compatible()) {
Markus Armbruster07656912018-10-17 10:26:28 +0200218 warn_report("Guest expects a stronger memory ordering "
219 "than the host provides");
Pranith Kumar8cfef892017-03-25 16:19:23 -0400220 error_printf("This may cause strange/hard to debug errors\n");
KONRAD Frederic8d4e9142017-02-23 18:29:08 +0000221 }
222 mttcg_enabled = true;
223 }
224 } else if (strcmp(t, "single") == 0) {
225 mttcg_enabled = false;
226 } else {
227 error_setg(errp, "Invalid 'thread' setting %s", t);
228 }
229 } else {
230 mttcg_enabled = default_mttcg_enabled();
231 }
232}
Paolo Bonzini946fb272011-09-12 13:57:37 +0200233
Alex Bennéee4cd9652017-03-31 16:09:42 +0100234/* The current number of executed instructions is based on what we
235 * originally budgeted minus the current state of the decrementing
236 * icount counters in extra/u16.low.
237 */
238static int64_t cpu_get_icount_executed(CPUState *cpu)
239{
240 return cpu->icount_budget - (cpu->icount_decr.u16.low + cpu->icount_extra);
241}
242
Alex Bennée512d3c82017-04-05 12:32:37 +0100243/*
244 * Update the global shared timer_state.qemu_icount to take into
245 * account executed instructions. This is done by the TCG vCPU
246 * thread so the main-loop can see time has moved forward.
247 */
Paolo Bonzini9b4e6f42018-09-11 13:15:32 +0200248static void cpu_update_icount_locked(CPUState *cpu)
Alex Bennée512d3c82017-04-05 12:32:37 +0100249{
250 int64_t executed = cpu_get_icount_executed(cpu);
251 cpu->icount_budget -= executed;
252
Emilio G. Cota38adcb62018-09-10 19:27:49 -0400253 atomic_set_i64(&timers_state.qemu_icount,
254 timers_state.qemu_icount + executed);
Paolo Bonzini9b4e6f42018-09-11 13:15:32 +0200255}
256
257/*
258 * Update the global shared timer_state.qemu_icount to take into
259 * account executed instructions. This is done by the TCG vCPU
260 * thread so the main-loop can see time has moved forward.
261 */
262void cpu_update_icount(CPUState *cpu)
263{
264 seqlock_write_lock(&timers_state.vm_clock_seqlock,
265 &timers_state.vm_clock_lock);
266 cpu_update_icount_locked(cpu);
Paolo Bonzini94377112018-08-14 09:57:16 +0200267 seqlock_write_unlock(&timers_state.vm_clock_seqlock,
268 &timers_state.vm_clock_lock);
Alex Bennée512d3c82017-04-05 12:32:37 +0100269}
270
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200271static int64_t cpu_get_icount_raw_locked(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200272{
Andreas Färber4917cf42013-05-27 05:17:50 +0200273 CPUState *cpu = current_cpu;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200274
Alex Bennée243c5f72017-03-30 18:49:22 +0100275 if (cpu && cpu->running) {
Paolo Bonzini414b15c2015-06-24 14:16:26 +0200276 if (!cpu->can_do_io) {
Alistair Francis493d89b2018-02-03 09:43:14 +0100277 error_report("Bad icount read");
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300278 exit(1);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200279 }
Alex Bennéee4cd9652017-03-31 16:09:42 +0100280 /* Take into account what has run */
Paolo Bonzini9b4e6f42018-09-11 13:15:32 +0200281 cpu_update_icount_locked(cpu);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200282 }
Emilio G. Cota38adcb62018-09-10 19:27:49 -0400283 /* The read is protected by the seqlock, but needs atomic64 to avoid UB */
284 return atomic_read_i64(&timers_state.qemu_icount);
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200285}
286
287static int64_t cpu_get_icount_locked(void)
288{
289 int64_t icount = cpu_get_icount_raw_locked();
Emilio G. Cotac97595d2018-09-10 19:27:50 -0400290 return atomic_read_i64(&timers_state.qemu_icount_bias) +
291 cpu_icount_to_ns(icount);
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200292}
293
294int64_t cpu_get_icount_raw(void)
295{
296 int64_t icount;
297 unsigned start;
298
299 do {
300 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
301 icount = cpu_get_icount_raw_locked();
302 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
303
304 return icount;
Pavel Dovgalyuk2a629142014-12-08 10:53:45 +0300305}
306
307/* Return the virtual CPU time, based on the instruction counter. */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200308int64_t cpu_get_icount(void)
309{
310 int64_t icount;
311 unsigned start;
312
313 do {
314 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
315 icount = cpu_get_icount_locked();
316 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
317
318 return icount;
319}
320
KONRAD Frederic3f031312014-08-01 01:37:15 +0200321int64_t cpu_icount_to_ns(int64_t icount)
322{
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200323 return icount << atomic_read(&timers_state.icount_time_shift);
KONRAD Frederic3f031312014-08-01 01:37:15 +0200324}
325
Paolo Bonzinif2a4ad62018-08-18 09:36:16 +0200326static int64_t cpu_get_ticks_locked(void)
327{
328 int64_t ticks = timers_state.cpu_ticks_offset;
329 if (timers_state.cpu_ticks_enabled) {
330 ticks += cpu_get_host_ticks();
331 }
332
333 if (timers_state.cpu_ticks_prev > ticks) {
334 /* Non increasing ticks may happen if the host uses software suspend. */
335 timers_state.cpu_ticks_offset += timers_state.cpu_ticks_prev - ticks;
336 ticks = timers_state.cpu_ticks_prev;
337 }
338
339 timers_state.cpu_ticks_prev = ticks;
340 return ticks;
341}
342
Cao jind90f3cc2016-07-29 19:05:38 +0800343/* return the time elapsed in VM between vm_start and vm_stop. Unless
344 * icount is active, cpu_get_ticks() uses units of the host CPU cycle
345 * counter.
Cao jind90f3cc2016-07-29 19:05:38 +0800346 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200347int64_t cpu_get_ticks(void)
348{
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100349 int64_t ticks;
350
Paolo Bonzini946fb272011-09-12 13:57:37 +0200351 if (use_icount) {
352 return cpu_get_icount();
353 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100354
Paolo Bonzinif2a4ad62018-08-18 09:36:16 +0200355 qemu_spin_lock(&timers_state.vm_clock_lock);
356 ticks = cpu_get_ticks_locked();
357 qemu_spin_unlock(&timers_state.vm_clock_lock);
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100358 return ticks;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200359}
360
Liu Ping Fancb365642013-09-25 14:20:58 +0800361static int64_t cpu_get_clock_locked(void)
362{
Cao jin1d45cea2016-07-29 19:05:37 +0800363 int64_t time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800364
Cao jin1d45cea2016-07-29 19:05:37 +0800365 time = timers_state.cpu_clock_offset;
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100366 if (timers_state.cpu_ticks_enabled) {
Cao jin1d45cea2016-07-29 19:05:37 +0800367 time += get_clock();
Liu Ping Fancb365642013-09-25 14:20:58 +0800368 }
369
Cao jin1d45cea2016-07-29 19:05:37 +0800370 return time;
Liu Ping Fancb365642013-09-25 14:20:58 +0800371}
372
Cao jind90f3cc2016-07-29 19:05:38 +0800373/* Return the monotonic time elapsed in VM, i.e.,
Peter Maydell8212ff82016-09-15 10:24:22 +0100374 * the time between vm_start and vm_stop
375 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200376int64_t cpu_get_clock(void)
377{
378 int64_t ti;
Liu Ping Fancb365642013-09-25 14:20:58 +0800379 unsigned start;
380
381 do {
382 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
383 ti = cpu_get_clock_locked();
384 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
385
386 return ti;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200387}
388
Liu Ping Fancb365642013-09-25 14:20:58 +0800389/* enable cpu_get_ticks()
Cao jin3224e872016-07-08 18:31:37 +0800390 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800391 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200392void cpu_enable_ticks(void)
393{
Paolo Bonzini94377112018-08-14 09:57:16 +0200394 seqlock_write_lock(&timers_state.vm_clock_seqlock,
395 &timers_state.vm_clock_lock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200396 if (!timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400397 timers_state.cpu_ticks_offset -= cpu_get_host_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200398 timers_state.cpu_clock_offset -= get_clock();
399 timers_state.cpu_ticks_enabled = 1;
400 }
Paolo Bonzini94377112018-08-14 09:57:16 +0200401 seqlock_write_unlock(&timers_state.vm_clock_seqlock,
402 &timers_state.vm_clock_lock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200403}
404
405/* disable cpu_get_ticks() : the clock is stopped. You must not call
Liu Ping Fancb365642013-09-25 14:20:58 +0800406 * cpu_get_ticks() after that.
Cao jin3224e872016-07-08 18:31:37 +0800407 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
Liu Ping Fancb365642013-09-25 14:20:58 +0800408 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200409void cpu_disable_ticks(void)
410{
Paolo Bonzini94377112018-08-14 09:57:16 +0200411 seqlock_write_lock(&timers_state.vm_clock_seqlock,
412 &timers_state.vm_clock_lock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200413 if (timers_state.cpu_ticks_enabled) {
Christopher Covington4a7428c2015-09-25 10:42:21 -0400414 timers_state.cpu_ticks_offset += cpu_get_host_ticks();
Liu Ping Fancb365642013-09-25 14:20:58 +0800415 timers_state.cpu_clock_offset = cpu_get_clock_locked();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200416 timers_state.cpu_ticks_enabled = 0;
417 }
Paolo Bonzini94377112018-08-14 09:57:16 +0200418 seqlock_write_unlock(&timers_state.vm_clock_seqlock,
419 &timers_state.vm_clock_lock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200420}
421
/* Correlation between real and virtual time is always going to be
   fairly approximate, so ignore small variation.
   When the guest is idle real and virtual time will be aligned in
   the IO wait loop.
   ICOUNT_WOBBLE is the tolerance icount_adjust() applies before it changes
   the icount shift: a tenth of NANOSECONDS_PER_SECOND. */
#define ICOUNT_WOBBLE (NANOSECONDS_PER_SECOND / 10)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200427
428static void icount_adjust(void)
429{
430 int64_t cur_time;
431 int64_t cur_icount;
432 int64_t delta;
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200433
434 /* Protected by TimersState mutex. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200435 static int64_t last_delta;
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200436
Paolo Bonzini946fb272011-09-12 13:57:37 +0200437 /* If the VM is not running, then do nothing. */
438 if (!runstate_is_running()) {
439 return;
440 }
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200441
Paolo Bonzini94377112018-08-14 09:57:16 +0200442 seqlock_write_lock(&timers_state.vm_clock_seqlock,
443 &timers_state.vm_clock_lock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200444 cur_time = cpu_get_clock_locked();
445 cur_icount = cpu_get_icount_locked();
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200446
Paolo Bonzini946fb272011-09-12 13:57:37 +0200447 delta = cur_icount - cur_time;
448 /* FIXME: This is a very crude algorithm, somewhat prone to oscillation. */
449 if (delta > 0
450 && last_delta + ICOUNT_WOBBLE < delta * 2
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200451 && timers_state.icount_time_shift > 0) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200452 /* The guest is getting too far ahead. Slow time down. */
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200453 atomic_set(&timers_state.icount_time_shift,
454 timers_state.icount_time_shift - 1);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200455 }
456 if (delta < 0
457 && last_delta - ICOUNT_WOBBLE > delta * 2
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200458 && timers_state.icount_time_shift < MAX_ICOUNT_SHIFT) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200459 /* The guest is getting too far behind. Speed time up. */
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200460 atomic_set(&timers_state.icount_time_shift,
461 timers_state.icount_time_shift + 1);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200462 }
463 last_delta = delta;
Emilio G. Cotac97595d2018-09-10 19:27:50 -0400464 atomic_set_i64(&timers_state.qemu_icount_bias,
465 cur_icount - (timers_state.qemu_icount
466 << timers_state.icount_time_shift));
Paolo Bonzini94377112018-08-14 09:57:16 +0200467 seqlock_write_unlock(&timers_state.vm_clock_seqlock,
468 &timers_state.vm_clock_lock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200469}
470
471static void icount_adjust_rt(void *opaque)
472{
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300473 timer_mod(timers_state.icount_rt_timer,
Pavel Dovgalyuk1979b902015-01-12 15:00:43 +0300474 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200475 icount_adjust();
476}
477
478static void icount_adjust_vm(void *opaque)
479{
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300480 timer_mod(timers_state.icount_vm_timer,
Alex Bligh40daca52013-08-21 16:03:02 +0100481 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530482 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200483 icount_adjust();
484}
485
486static int64_t qemu_icount_round(int64_t count)
487{
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200488 int shift = atomic_read(&timers_state.icount_time_shift);
489 return (count + (1 << shift) - 1) >> shift;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200490}
491
Pavel Dovgalyukefab87c2015-09-17 19:24:39 +0300492static void icount_warp_rt(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200493{
Alex Bennéeccffff42016-04-04 15:35:48 +0100494 unsigned seq;
495 int64_t warp_start;
496
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200497 /* The icount_warp_timer is rescheduled soon after vm_clock_warp_start
498 * changes from -1 to another value, so the race here is okay.
499 */
Alex Bennéeccffff42016-04-04 15:35:48 +0100500 do {
501 seq = seqlock_read_begin(&timers_state.vm_clock_seqlock);
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300502 warp_start = timers_state.vm_clock_warp_start;
Alex Bennéeccffff42016-04-04 15:35:48 +0100503 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, seq));
504
505 if (warp_start == -1) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200506 return;
507 }
508
Paolo Bonzini94377112018-08-14 09:57:16 +0200509 seqlock_write_lock(&timers_state.vm_clock_seqlock,
510 &timers_state.vm_clock_lock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200511 if (runstate_is_running()) {
Paolo Bonzini74c0b812018-10-08 13:24:14 +0200512 int64_t clock = REPLAY_CLOCK_LOCKED(REPLAY_CLOCK_VIRTUAL_RT,
513 cpu_get_clock_locked());
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200514 int64_t warp_delta;
515
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300516 warp_delta = clock - timers_state.vm_clock_warp_start;
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200517 if (use_icount == 2) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200518 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100519 * In adaptive mode, do not let QEMU_CLOCK_VIRTUAL run too
Paolo Bonzini946fb272011-09-12 13:57:37 +0200520 * far ahead of real time.
521 */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200522 int64_t cur_icount = cpu_get_icount_locked();
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300523 int64_t delta = clock - cur_icount;
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200524 warp_delta = MIN(warp_delta, delta);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200525 }
Emilio G. Cotac97595d2018-09-10 19:27:50 -0400526 atomic_set_i64(&timers_state.qemu_icount_bias,
527 timers_state.qemu_icount_bias + warp_delta);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200528 }
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300529 timers_state.vm_clock_warp_start = -1;
Paolo Bonzini94377112018-08-14 09:57:16 +0200530 seqlock_write_unlock(&timers_state.vm_clock_seqlock,
531 &timers_state.vm_clock_lock);
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200532
533 if (qemu_clock_expired(QEMU_CLOCK_VIRTUAL)) {
534 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
535 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200536}
537
/*
 * Timer callback that accounts for the pending clock warp.
 * @opaque is unused.
 */
static void icount_timer_cb(void *opaque)
{
    (void)opaque;

    /* No need for a checkpoint because the timer already synchronizes
     * with CHECKPOINT_CLOCK_VIRTUAL_RT.
     */
    icount_warp_rt();
}
545
Paolo Bonzini8156be52012-03-28 15:42:04 +0200546void qtest_clock_warp(int64_t dest)
547{
Alex Bligh40daca52013-08-21 16:03:02 +0100548 int64_t clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800549 AioContext *aio_context;
Paolo Bonzini8156be52012-03-28 15:42:04 +0200550 assert(qtest_enabled());
Fam Zhengefef88b2015-01-19 17:51:43 +0800551 aio_context = qemu_get_aio_context();
Paolo Bonzini8156be52012-03-28 15:42:04 +0200552 while (clock < dest) {
Alex Bligh40daca52013-08-21 16:03:02 +0100553 int64_t deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Sergey Fedorovc9299e22014-06-10 13:10:28 +0400554 int64_t warp = qemu_soonest_timeout(dest - clock, deadline);
Fam Zhengefef88b2015-01-19 17:51:43 +0800555
Paolo Bonzini94377112018-08-14 09:57:16 +0200556 seqlock_write_lock(&timers_state.vm_clock_seqlock,
557 &timers_state.vm_clock_lock);
Emilio G. Cotac97595d2018-09-10 19:27:50 -0400558 atomic_set_i64(&timers_state.qemu_icount_bias,
559 timers_state.qemu_icount_bias + warp);
Paolo Bonzini94377112018-08-14 09:57:16 +0200560 seqlock_write_unlock(&timers_state.vm_clock_seqlock,
561 &timers_state.vm_clock_lock);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200562
Alex Bligh40daca52013-08-21 16:03:02 +0100563 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Fam Zhengefef88b2015-01-19 17:51:43 +0800564 timerlist_run_timers(aio_context->tlg.tl[QEMU_CLOCK_VIRTUAL]);
Alex Bligh40daca52013-08-21 16:03:02 +0100565 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200566 }
Alex Bligh40daca52013-08-21 16:03:02 +0100567 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200568}
569
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300570void qemu_start_warp_timer(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200571{
Paolo Bonzinice78d182013-10-07 17:30:02 +0200572 int64_t clock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200573 int64_t deadline;
574
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300575 if (!use_icount) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200576 return;
577 }
578
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300579 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
580 * do not fire, so computing the deadline does not make sense.
581 */
582 if (!runstate_is_running()) {
583 return;
584 }
585
Pavel Dovgalyuk0c081852018-09-12 11:19:45 +0300586 if (replay_mode != REPLAY_MODE_PLAY) {
587 if (!all_cpu_threads_idle()) {
588 return;
589 }
Pavel Dovgalyuk8bd7f712015-09-17 19:24:44 +0300590
Pavel Dovgalyuk0c081852018-09-12 11:19:45 +0300591 if (qtest_enabled()) {
592 /* When testing, qtest commands advance icount. */
593 return;
594 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200595
Pavel Dovgalyuk0c081852018-09-12 11:19:45 +0300596 replay_checkpoint(CHECKPOINT_CLOCK_WARP_START);
597 } else {
598 /* warp clock deterministically in record/replay mode */
599 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_START)) {
600 /* vCPU is sleeping and warp can't be started.
601 It is probably a race condition: notification sent
602 to vCPU was processed in advance and vCPU went to sleep.
603 Therefore we have to wake it up for doing someting. */
604 if (replay_has_checkpoint()) {
605 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
606 }
607 return;
608 }
Paolo Bonzini8156be52012-03-28 15:42:04 +0200609 }
610
Alex Blighac70aaf2013-08-21 16:02:57 +0100611 /* We want to use the earliest deadline from ALL vm_clocks */
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300612 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT);
Alex Bligh40daca52013-08-21 16:03:02 +0100613 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200614 if (deadline < 0) {
Victor CLEMENTd7a0f712015-05-29 17:14:06 +0200615 static bool notified;
616 if (!icount_sleep && !notified) {
Alistair Francis3dc6f862017-07-12 06:57:41 -0700617 warn_report("icount sleep disabled and no active timers");
Victor CLEMENTd7a0f712015-05-29 17:14:06 +0200618 notified = true;
619 }
Paolo Bonzinice78d182013-10-07 17:30:02 +0200620 return;
Alex Blighac70aaf2013-08-21 16:02:57 +0100621 }
622
Paolo Bonzini946fb272011-09-12 13:57:37 +0200623 if (deadline > 0) {
624 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100625 * Ensure QEMU_CLOCK_VIRTUAL proceeds even when the virtual CPU goes to
Paolo Bonzini946fb272011-09-12 13:57:37 +0200626 * sleep. Otherwise, the CPU might be waiting for a future timer
627 * interrupt to wake it up, but the interrupt never comes because
628 * the vCPU isn't running any insns and thus doesn't advance the
Alex Bligh40daca52013-08-21 16:03:02 +0100629 * QEMU_CLOCK_VIRTUAL.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200630 */
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200631 if (!icount_sleep) {
632 /*
633 * We never let VCPUs sleep in no sleep icount mode.
634 * If there is a pending QEMU_CLOCK_VIRTUAL timer we just advance
635 * to the next QEMU_CLOCK_VIRTUAL event and notify it.
636 * It is useful when we want a deterministic execution time,
637 * isolated from host latencies.
638 */
Paolo Bonzini94377112018-08-14 09:57:16 +0200639 seqlock_write_lock(&timers_state.vm_clock_seqlock,
640 &timers_state.vm_clock_lock);
Emilio G. Cotac97595d2018-09-10 19:27:50 -0400641 atomic_set_i64(&timers_state.qemu_icount_bias,
642 timers_state.qemu_icount_bias + deadline);
Paolo Bonzini94377112018-08-14 09:57:16 +0200643 seqlock_write_unlock(&timers_state.vm_clock_seqlock,
644 &timers_state.vm_clock_lock);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200645 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
646 } else {
647 /*
648 * We do stop VCPUs and only advance QEMU_CLOCK_VIRTUAL after some
649 * "real" time, (related to the time left until the next event) has
650 * passed. The QEMU_CLOCK_VIRTUAL_RT clock will do this.
651 * This avoids that the warps are visible externally; for example,
652 * you will not be sending network packets continuously instead of
653 * every 100ms.
654 */
Paolo Bonzini94377112018-08-14 09:57:16 +0200655 seqlock_write_lock(&timers_state.vm_clock_seqlock,
656 &timers_state.vm_clock_lock);
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300657 if (timers_state.vm_clock_warp_start == -1
658 || timers_state.vm_clock_warp_start > clock) {
659 timers_state.vm_clock_warp_start = clock;
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200660 }
Paolo Bonzini94377112018-08-14 09:57:16 +0200661 seqlock_write_unlock(&timers_state.vm_clock_seqlock,
662 &timers_state.vm_clock_lock);
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300663 timer_mod_anticipate(timers_state.icount_warp_timer,
664 clock + deadline);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200665 }
Alex Blighac70aaf2013-08-21 16:02:57 +0100666 } else if (deadline == 0) {
Alex Bligh40daca52013-08-21 16:03:02 +0100667 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200668 }
669}
670
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300671static void qemu_account_warp_timer(void)
672{
673 if (!use_icount || !icount_sleep) {
674 return;
675 }
676
677 /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
678 * do not fire, so computing the deadline does not make sense.
679 */
680 if (!runstate_is_running()) {
681 return;
682 }
683
684 /* warp clock deterministically in record/replay mode */
685 if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_ACCOUNT)) {
686 return;
687 }
688
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300689 timer_del(timers_state.icount_warp_timer);
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300690 icount_warp_rt();
691}
692
/*
 * VMState ".needed" hook for the "timer/icount" subsection: returns true
 * when use_icount is non-zero. The opaque pointer is not used.
 */
static bool icount_state_needed(void *opaque)
{
    return use_icount;
}
697
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300698static bool warp_timer_state_needed(void *opaque)
699{
700 TimersState *s = opaque;
701 return s->icount_warp_timer != NULL;
702}
703
704static bool adjust_timers_state_needed(void *opaque)
705{
706 TimersState *s = opaque;
707 return s->icount_rt_timer != NULL;
708}
709
/*
 * Subsection for warp timer migration. It is optional because the warp
 * timer may not have been created; warp_timer_state_needed() decides
 * whether the subsection is needed.
 */
static const VMStateDescription icount_vmstate_warp_timer = {
    .name = "timer/icount/warp_timer",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = warp_timer_state_needed,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(vm_clock_warp_start, TimersState),
        VMSTATE_TIMER_PTR(icount_warp_timer, TimersState),
        VMSTATE_END_OF_LIST()
    }
};
724
/*
 * Subsection carrying the two icount speed-adjustment timers (realtime and
 * virtual). adjust_timers_state_needed() decides whether it is needed.
 */
static const VMStateDescription icount_vmstate_adjust_timers = {
    .name = "timer/icount/timers",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = adjust_timers_state_needed,
    .fields = (VMStateField[]) {
        VMSTATE_TIMER_PTR(icount_rt_timer, TimersState),
        VMSTATE_TIMER_PTR(icount_vm_timer, TimersState),
        VMSTATE_END_OF_LIST()
    }
};
736
/*
 * This is a subsection for icount migration. It carries the icount bias and
 * the instruction counter, and nests the optional warp timer and adjustment
 * timer subsections. icount_state_needed() decides whether it is needed.
 */
static const VMStateDescription icount_vmstate_timers = {
    .name = "timer/icount",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = icount_state_needed,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(qemu_icount_bias, TimersState),
        VMSTATE_INT64(qemu_icount, TimersState),
        VMSTATE_END_OF_LIST()
    },
    .subsections = (const VMStateDescription*[]) {
        &icount_vmstate_warp_timer,
        &icount_vmstate_adjust_timers,
        NULL
    }
};
756
/*
 * Top-level migration description for TimersState ("timer" section), with
 * the icount state attached as a subsection.
 */
static const VMStateDescription vmstate_timers = {
    .name = "timer",
    .version_id = 2,
    .minimum_version_id = 1,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(cpu_ticks_offset, TimersState),
        /* NOTE(review): 8 unused bytes, presumably a retired field - confirm */
        VMSTATE_UNUSED(8),
        /* Versioned field, tagged with version 2 */
        VMSTATE_INT64_V(cpu_clock_offset, TimersState, 2),
        VMSTATE_END_OF_LIST()
    },
    .subsections = (const VMStateDescription*[]) {
        &icount_vmstate_timers,
        NULL
    }
};
772
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100773static void cpu_throttle_thread(CPUState *cpu, run_on_cpu_data opaque)
Jason J. Herne2adcc852015-09-08 13:12:33 -0400774{
Jason J. Herne2adcc852015-09-08 13:12:33 -0400775 double pct;
776 double throttle_ratio;
777 long sleeptime_ns;
778
779 if (!cpu_throttle_get_percentage()) {
780 return;
781 }
782
783 pct = (double)cpu_throttle_get_percentage()/100;
784 throttle_ratio = pct / (1 - pct);
785 sleeptime_ns = (long)(throttle_ratio * CPU_THROTTLE_TIMESLICE_NS);
786
787 qemu_mutex_unlock_iothread();
Jason J. Herne2adcc852015-09-08 13:12:33 -0400788 g_usleep(sleeptime_ns / 1000); /* Convert ns to us for usleep call */
789 qemu_mutex_lock_iothread();
Felipe Franciosi90bb0c02017-05-19 22:29:50 +0100790 atomic_set(&cpu->throttle_thread_scheduled, 0);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400791}
792
793static void cpu_throttle_timer_tick(void *opaque)
794{
795 CPUState *cpu;
796 double pct;
797
798 /* Stop the timer if needed */
799 if (!cpu_throttle_get_percentage()) {
800 return;
801 }
802 CPU_FOREACH(cpu) {
803 if (!atomic_xchg(&cpu->throttle_thread_scheduled, 1)) {
Paolo Bonzini14e6fe12016-10-31 10:36:08 +0100804 async_run_on_cpu(cpu, cpu_throttle_thread,
805 RUN_ON_CPU_NULL);
Jason J. Herne2adcc852015-09-08 13:12:33 -0400806 }
807 }
808
809 pct = (double)cpu_throttle_get_percentage()/100;
810 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
811 CPU_THROTTLE_TIMESLICE_NS / (1-pct));
812}
813
814void cpu_throttle_set(int new_throttle_pct)
815{
816 /* Ensure throttle percentage is within valid range */
817 new_throttle_pct = MIN(new_throttle_pct, CPU_THROTTLE_PCT_MAX);
818 new_throttle_pct = MAX(new_throttle_pct, CPU_THROTTLE_PCT_MIN);
819
820 atomic_set(&throttle_percentage, new_throttle_pct);
821
822 timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
823 CPU_THROTTLE_TIMESLICE_NS);
824}
825
/*
 * Turn throttling off by setting the throttle percentage to 0.
 * cpu_throttle_timer_tick() stops re-arming the timer once it sees 0.
 */
void cpu_throttle_stop(void)
{
    atomic_set(&throttle_percentage, 0);
}
830
/* Returns true when the current throttle percentage is non-zero. */
bool cpu_throttle_active(void)
{
    int current_pct = cpu_throttle_get_percentage();

    return current_pct != 0;
}
835
/* Returns the current throttle percentage, read atomically. */
int cpu_throttle_get_percentage(void)
{
    return atomic_read(&throttle_percentage);
}
840
/*
 * Initialise the timer state: the vm_clock seqlock and its spinlock, the
 * migration registration for timers_state, and the CPU throttle timer.
 */
void cpu_ticks_init(void)
{
    seqlock_init(&timers_state.vm_clock_seqlock);
    qemu_spin_init(&timers_state.vm_clock_lock);
    vmstate_register(NULL, 0, &vmstate_timers, &timers_state);
    /* The throttle timer is created here but only armed by cpu_throttle_set() */
    throttle_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
                                           cpu_throttle_timer_tick, NULL);
}
849
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200850void configure_icount(QemuOpts *opts, Error **errp)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200851{
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200852 const char *option;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200853 char *rem_str = NULL;
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200854
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200855 option = qemu_opt_get(opts, "shift");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200856 if (!option) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200857 if (qemu_opt_get(opts, "align") != NULL) {
858 error_setg(errp, "Please specify shift option when using align");
859 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200860 return;
861 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200862
863 icount_sleep = qemu_opt_get_bool(opts, "sleep", true);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200864 if (icount_sleep) {
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300865 timers_state.icount_warp_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
Pavel Dovgalyuke76d1792016-03-10 14:56:09 +0300866 icount_timer_cb, NULL);
Victor CLEMENT5045e9d92015-05-29 17:14:04 +0200867 }
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200868
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200869 icount_align_option = qemu_opt_get_bool(opts, "align", false);
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200870
871 if (icount_align_option && !icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500872 error_setg(errp, "align=on and sleep=off are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200873 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200874 if (strcmp(option, "auto") != 0) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200875 errno = 0;
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200876 timers_state.icount_time_shift = strtol(option, &rem_str, 0);
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200877 if (errno != 0 || *rem_str != '\0' || !strlen(option)) {
878 error_setg(errp, "icount: Invalid shift value");
879 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200880 use_icount = 1;
881 return;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200882 } else if (icount_align_option) {
883 error_setg(errp, "shift=auto and align=on are incompatible");
Victor CLEMENTf1f4b572015-05-29 17:14:05 +0200884 } else if (!icount_sleep) {
Pranith Kumar778d9f92016-02-26 10:16:51 -0500885 error_setg(errp, "shift=auto and sleep=off are incompatible");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200886 }
887
888 use_icount = 2;
889
890 /* 125MIPS seems a reasonable initial guess at the guest speed.
891 It will be corrected fairly quickly anyway. */
Paolo Bonzinic1ff0732018-08-14 09:31:58 +0200892 timers_state.icount_time_shift = 3;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200893
894 /* Have both realtime and virtual time triggers for speed adjustment.
895 The realtime trigger catches emulated time passing too slowly,
896 the virtual time trigger catches emulated time passing too fast.
897 Realtime triggers occur even when idle, so use them less frequently
898 than VM triggers. */
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300899 timers_state.vm_clock_warp_start = -1;
900 timers_state.icount_rt_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL_RT,
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300901 icount_adjust_rt, NULL);
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300902 timer_mod(timers_state.icount_rt_timer,
Pavel Dovgalyukbf2a7dd2014-11-26 13:40:55 +0300903 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300904 timers_state.icount_vm_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
Alex Bligh40daca52013-08-21 16:03:02 +0100905 icount_adjust_vm, NULL);
Pavel Dovgalyukb39e3f32018-01-11 11:26:10 +0300906 timer_mod(timers_state.icount_vm_timer,
Alex Bligh40daca52013-08-21 16:03:02 +0100907 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
Rutuja Shah73bcb242016-03-21 21:32:30 +0530908 NANOSECONDS_PER_SECOND / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200909}
910
911/***********************************************************/
/* TCG vCPU kick timer
 *
 * The kick timer is responsible for moving single threaded vCPU
 * emulation on to the next vCPU. If more than one vCPU is running, a
 * timer event will force a cpu->exit so the next vCPU can get
 * scheduled.
 *
 * The timer is removed if all vCPUs are idle and restarted again once
 * idleness is complete.
 */
922
923static QEMUTimer *tcg_kick_vcpu_timer;
Alex Bennée791158d2017-02-23 18:29:10 +0000924static CPUState *tcg_current_rr_cpu;
Alex Bennée65467062017-02-23 18:29:09 +0000925
926#define TCG_KICK_PERIOD (NANOSECONDS_PER_SECOND / 10)
927
/*
 * Returns the QEMU_CLOCK_VIRTUAL time (in ns) at which the next kick is
 * due: the current time plus TCG_KICK_PERIOD.
 */
static inline int64_t qemu_tcg_next_kick(void)
{
    return qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + TCG_KICK_PERIOD;
}
932
/*
 * Kick the currently round-robin scheduled vCPU.
 *
 * tcg_current_rr_cpu is re-read after the kick; if it changed in the
 * meantime the loop runs again so the newly current vCPU (if any) is
 * kicked as well. A NULL value means there is nothing to kick.
 */
static void qemu_cpu_kick_rr_cpu(void)
{
    CPUState *cpu;
    do {
        cpu = atomic_mb_read(&tcg_current_rr_cpu);
        if (cpu) {
            cpu_exit(cpu);
        }
    } while (cpu != atomic_mb_read(&tcg_current_rr_cpu));
}
944
/*
 * Empty work item. qemu_timer_notify_cb() queues it with async_run_on_cpu()
 * purely for the side effect of queuing work on a vCPU.
 */
static void do_nothing(CPUState *cpu, run_on_cpu_data unused)
{
}
948
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100949void qemu_timer_notify_cb(void *opaque, QEMUClockType type)
950{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100951 if (!use_icount || type != QEMU_CLOCK_VIRTUAL) {
952 qemu_notify_event();
953 return;
954 }
955
Peter Maydellc52e7132018-04-10 13:02:25 +0100956 if (qemu_in_vcpu_thread()) {
957 /* A CPU is currently running; kick it back out to the
958 * tcg_cpu_exec() loop so it will recalculate its
959 * icount deadline immediately.
960 */
961 qemu_cpu_kick(current_cpu);
962 } else if (first_cpu) {
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100963 /* qemu_cpu_kick is not enough to kick a halted CPU out of
964 * qemu_tcg_wait_io_event. async_run_on_cpu, instead,
965 * causes cpu_thread_is_idle to return false. This way,
966 * handle_icount_deadline can run.
Peter Maydellc52e7132018-04-10 13:02:25 +0100967 * If we have no CPUs at all for some reason, we don't
968 * need to do anything.
Paolo Bonzini6b8f0182017-03-02 19:56:40 +0100969 */
970 async_run_on_cpu(first_cpu, do_nothing, RUN_ON_CPU_NULL);
971 }
Paolo Bonzini3f53bc62017-03-03 11:50:29 +0100972}
973
/*
 * Kick timer callback: re-arm the timer for the next period, then kick the
 * vCPU that is currently scheduled round-robin. @opaque is unused.
 */
static void kick_tcg_thread(void *opaque)
{
    timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
    qemu_cpu_kick_rr_cpu();
}
979
980static void start_tcg_kick_timer(void)
981{
Paolo Bonzinidb08b682018-01-11 13:53:12 +0100982 assert(!mttcg_enabled);
983 if (!tcg_kick_vcpu_timer && CPU_NEXT(first_cpu)) {
Alex Bennée65467062017-02-23 18:29:09 +0000984 tcg_kick_vcpu_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
985 kick_tcg_thread, NULL);
Alex Bennée1926ab22018-09-27 18:17:24 +0100986 }
987 if (tcg_kick_vcpu_timer && !timer_pending(tcg_kick_vcpu_timer)) {
Alex Bennée65467062017-02-23 18:29:09 +0000988 timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
989 }
990}
991
992static void stop_tcg_kick_timer(void)
993{
Paolo Bonzinidb08b682018-01-11 13:53:12 +0100994 assert(!mttcg_enabled);
Alex Bennée1926ab22018-09-27 18:17:24 +0100995 if (tcg_kick_vcpu_timer && timer_pending(tcg_kick_vcpu_timer)) {
Alex Bennée65467062017-02-23 18:29:09 +0000996 timer_del(tcg_kick_vcpu_timer);
Alex Bennée65467062017-02-23 18:29:09 +0000997 }
998}
999
Alex Bennée65467062017-02-23 18:29:09 +00001000/***********************************************************/
Blue Swirl296af7c2010-03-29 19:23:50 +00001001void hw_error(const char *fmt, ...)
1002{
1003 va_list ap;
Andreas Färber55e5c282012-12-17 06:18:02 +01001004 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001005
1006 va_start(ap, fmt);
1007 fprintf(stderr, "qemu: hardware error: ");
1008 vfprintf(stderr, fmt, ap);
1009 fprintf(stderr, "\n");
Andreas Färberbdc44642013-06-24 23:50:24 +02001010 CPU_FOREACH(cpu) {
Andreas Färber55e5c282012-12-17 06:18:02 +01001011 fprintf(stderr, "CPU #%d:\n", cpu->cpu_index);
Andreas Färber878096e2013-05-27 01:33:50 +02001012 cpu_dump_state(cpu, stderr, fprintf, CPU_DUMP_FPU);
Blue Swirl296af7c2010-03-29 19:23:50 +00001013 }
1014 va_end(ap);
1015 abort();
1016}
1017
1018void cpu_synchronize_all_states(void)
1019{
Andreas Färber182735e2013-05-29 22:29:20 +02001020 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001021
Andreas Färberbdc44642013-06-24 23:50:24 +02001022 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001023 cpu_synchronize_state(cpu);
Sergio Andres Gomez Del Realc97d6d22017-09-13 04:05:09 -05001024 /* TODO: move to cpu_synchronize_state() */
1025 if (hvf_enabled()) {
1026 hvf_cpu_synchronize_state(cpu);
1027 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001028 }
1029}
1030
1031void cpu_synchronize_all_post_reset(void)
1032{
Andreas Färber182735e2013-05-29 22:29:20 +02001033 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001034
Andreas Färberbdc44642013-06-24 23:50:24 +02001035 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001036 cpu_synchronize_post_reset(cpu);
Sergio Andres Gomez Del Realc97d6d22017-09-13 04:05:09 -05001037 /* TODO: move to cpu_synchronize_post_reset() */
1038 if (hvf_enabled()) {
1039 hvf_cpu_synchronize_post_reset(cpu);
1040 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001041 }
1042}
1043
1044void cpu_synchronize_all_post_init(void)
1045{
Andreas Färber182735e2013-05-29 22:29:20 +02001046 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001047
Andreas Färberbdc44642013-06-24 23:50:24 +02001048 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001049 cpu_synchronize_post_init(cpu);
Sergio Andres Gomez Del Realc97d6d22017-09-13 04:05:09 -05001050 /* TODO: move to cpu_synchronize_post_init() */
1051 if (hvf_enabled()) {
1052 hvf_cpu_synchronize_post_init(cpu);
1053 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001054 }
1055}
1056
David Gibson75e972d2017-05-26 14:46:28 +10001057void cpu_synchronize_all_pre_loadvm(void)
1058{
1059 CPUState *cpu;
1060
1061 CPU_FOREACH(cpu) {
1062 cpu_synchronize_pre_loadvm(cpu);
1063 }
1064}
1065
Stefan Hajnoczi4486e892018-03-07 14:42:05 +00001066static int do_vm_stop(RunState state, bool send_stop)
Blue Swirl296af7c2010-03-29 19:23:50 +00001067{
Kevin Wolf56983462013-07-05 13:49:54 +02001068 int ret = 0;
1069
Luiz Capitulino13548692011-07-29 15:36:43 -03001070 if (runstate_is_running()) {
Blue Swirl296af7c2010-03-29 19:23:50 +00001071 cpu_disable_ticks();
Blue Swirl296af7c2010-03-29 19:23:50 +00001072 pause_all_vcpus();
Luiz Capitulinof5bbfba2011-07-29 15:04:45 -03001073 runstate_set(state);
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -03001074 vm_state_notify(0, state);
Stefan Hajnoczi4486e892018-03-07 14:42:05 +00001075 if (send_stop) {
Peter Xu3ab72382018-08-15 21:37:37 +08001076 qapi_event_send_stop();
Stefan Hajnoczi4486e892018-03-07 14:42:05 +00001077 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001078 }
Kevin Wolf56983462013-07-05 13:49:54 +02001079
Kevin Wolf594a45c2013-07-18 14:52:19 +02001080 bdrv_drain_all();
Pavel Dovgalyuk6d0ceb82016-09-26 11:08:16 +03001081 replay_disable_events();
John Snow22af08e2016-09-22 21:45:51 -04001082 ret = bdrv_flush_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +02001083
Kevin Wolf56983462013-07-05 13:49:54 +02001084 return ret;
Blue Swirl296af7c2010-03-29 19:23:50 +00001085}
1086
/* Special vm_stop() variant for terminating the process.  Historically clients
 * did not expect a QMP STOP event and so we need to retain compatibility.
 *
 * Switches to RUN_STATE_SHUTDOWN without sending the STOP event and returns
 * the result of do_vm_stop().
 */
int vm_shutdown(void)
{
    return do_vm_stop(RUN_STATE_SHUTDOWN, false);
}
1094
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001095static bool cpu_can_run(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001096{
Andreas Färber4fdeee72012-05-02 23:10:09 +02001097 if (cpu->stop) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001098 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001099 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +08001100 if (cpu_is_stopped(cpu)) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001101 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001102 }
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001103 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001104}
1105
/*
 * Handle a guest debug exit on @cpu: record it as the gdb stop CPU, raise a
 * system debug request and mark the vCPU as stopped.
 */
static void cpu_handle_guest_debug(CPUState *cpu)
{
    gdb_set_stop_cpu(cpu);
    qemu_system_debug_request();
    cpu->stopped = true;
}
1112
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001113#ifdef CONFIG_LINUX
1114static void sigbus_reraise(void)
1115{
1116 sigset_t set;
1117 struct sigaction action;
1118
1119 memset(&action, 0, sizeof(action));
1120 action.sa_handler = SIG_DFL;
1121 if (!sigaction(SIGBUS, &action, NULL)) {
1122 raise(SIGBUS);
1123 sigemptyset(&set);
1124 sigaddset(&set, SIGBUS);
Peter Maydella2d17612016-05-16 18:33:59 +01001125 pthread_sigmask(SIG_UNBLOCK, &set, NULL);
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001126 }
1127 perror("Failed to re-raise SIGBUS!\n");
1128 abort();
1129}
1130
Paolo Bonzinid98d4072017-02-08 13:22:12 +01001131static void sigbus_handler(int n, siginfo_t *siginfo, void *ctx)
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001132{
Paolo Bonzinia16fc072017-02-09 09:50:02 +01001133 if (siginfo->si_code != BUS_MCEERR_AO && siginfo->si_code != BUS_MCEERR_AR) {
1134 sigbus_reraise();
1135 }
1136
Paolo Bonzini2ae41db2017-02-08 12:48:54 +01001137 if (current_cpu) {
1138 /* Called asynchronously in VCPU thread. */
1139 if (kvm_on_sigbus_vcpu(current_cpu, siginfo->si_code, siginfo->si_addr)) {
1140 sigbus_reraise();
1141 }
1142 } else {
1143 /* Called synchronously (via signalfd) in main thread. */
1144 if (kvm_on_sigbus(siginfo->si_code, siginfo->si_addr)) {
1145 sigbus_reraise();
1146 }
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001147 }
1148}
1149
1150static void qemu_init_sigbus(void)
1151{
1152 struct sigaction action;
1153
1154 memset(&action, 0, sizeof(action));
1155 action.sa_flags = SA_SIGINFO;
Paolo Bonzinid98d4072017-02-08 13:22:12 +01001156 action.sa_sigaction = sigbus_handler;
Jan Kiszka6d9cb732011-02-01 22:15:58 +01001157 sigaction(SIGBUS, &action, NULL);
1158
1159 prctl(PR_MCE_KILL, PR_MCE_KILL_SET, PR_MCE_KILL_EARLY, 0, 0);
1160}
Paolo Bonzinia16fc072017-02-09 09:50:02 +01001161#else /* !CONFIG_LINUX */
/* No SIGBUS setup is done when CONFIG_LINUX is not defined. */
static void qemu_init_sigbus(void)
{
}
Paolo Bonzinia16fc072017-02-09 09:50:02 +01001165#endif /* !CONFIG_LINUX */
Blue Swirl296af7c2010-03-29 19:23:50 +00001166
Stefan Weilb2532d82012-09-27 07:41:42 +02001167static QemuMutex qemu_global_mutex;
Blue Swirl296af7c2010-03-29 19:23:50 +00001168
1169static QemuThread io_thread;
1170
Blue Swirl296af7c2010-03-29 19:23:50 +00001171/* cpu creation */
1172static QemuCond qemu_cpu_cond;
1173/* system init */
Blue Swirl296af7c2010-03-29 19:23:50 +00001174static QemuCond qemu_pause_cond;
1175
/*
 * Initialise the state shared by the CPU loops: SIGBUS handling, the CPU
 * creation and pause condition variables, and the global mutex. The calling
 * thread is recorded as the I/O thread.
 */
void qemu_init_cpu_loop(void)
{
    qemu_init_sigbus();
    qemu_cond_init(&qemu_cpu_cond);
    qemu_cond_init(&qemu_pause_cond);
    qemu_mutex_init(&qemu_global_mutex);

    qemu_thread_get_self(&io_thread);
}
1185
/*
 * Run @func with @data on @cpu by delegating to do_run_on_cpu(), passing
 * the global mutex.
 */
void run_on_cpu(CPUState *cpu, run_on_cpu_func func, run_on_cpu_data data)
{
    do_run_on_cpu(cpu, func, data, &qemu_global_mutex);
}
1190
Gu Zheng4c055ab2016-05-12 09:18:13 +05301191static void qemu_kvm_destroy_vcpu(CPUState *cpu)
1192{
1193 if (kvm_destroy_vcpu(cpu) < 0) {
1194 error_report("kvm_destroy_vcpu failed");
1195 exit(EXIT_FAILURE);
1196 }
1197}
1198
/* TCG counterpart of qemu_kvm_destroy_vcpu(); intentionally does nothing. */
static void qemu_tcg_destroy_vcpu(CPUState *cpu)
{
}
1202
/*
 * Move @cpu from "stop requested" to "stopped" and wake up everyone waiting
 * on the pause condition.
 *
 * @cpu:  the vCPU to stop; asserted to be the calling thread's own vCPU.
 * @exit: when true, also call cpu_exit() on the vCPU.
 */
static void qemu_cpu_stop(CPUState *cpu, bool exit)
{
    g_assert(qemu_cpu_is_self(cpu));
    cpu->stop = false;
    cpu->stopped = true;
    if (exit) {
        cpu_exit(cpu);
    }
    qemu_cond_broadcast(&qemu_pause_cond);
}
1213
/*
 * Common tail of the wait-for-I/O-event paths: clear the "kicked" flag,
 * honour a pending stop request, then run the work queued for @cpu.
 */
static void qemu_wait_io_event_common(CPUState *cpu)
{
    atomic_mb_set(&cpu->thread_kicked, false);
    if (cpu->stop) {
        qemu_cpu_stop(cpu, false);
    }
    process_queued_cpu_work(cpu);
}
1222
Paolo Bonzinia8efa602018-11-14 12:36:57 +01001223static void qemu_tcg_rr_wait_io_event(void)
Alex Bennée37257942017-02-23 18:29:14 +00001224{
Paolo Bonzinia8efa602018-11-14 12:36:57 +01001225 CPUState *cpu;
1226
Paolo Bonzinidb08b682018-01-11 13:53:12 +01001227 while (all_cpu_threads_idle()) {
Alex Bennée65467062017-02-23 18:29:09 +00001228 stop_tcg_kick_timer();
Paolo Bonzinia8efa602018-11-14 12:36:57 +01001229 qemu_cond_wait(first_cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +01001230 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001231
Alex Bennée65467062017-02-23 18:29:09 +00001232 start_tcg_kick_timer();
1233
Paolo Bonzinia8efa602018-11-14 12:36:57 +01001234 CPU_FOREACH(cpu) {
1235 qemu_wait_io_event_common(cpu);
1236 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001237}
1238
/*
 * Wait on @cpu's halt condition (with the global mutex) for as long as its
 * thread is idle, then run the common event handling.
 */
static void qemu_wait_io_event(CPUState *cpu)
{
    while (cpu_thread_is_idle(cpu)) {
        qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
    }

#ifdef _WIN32
    /* Eat dummy APC queued by qemu_cpu_kick_thread.  */
    if (!tcg_enabled()) {
        SleepEx(0, TRUE);
    }
#endif
    qemu_wait_io_event_common(cpu);
}
1253
/*
 * Thread function for a KVM vCPU.
 *
 * @arg: the CPUState this thread drives.
 *
 * Registers the thread with RCU, takes the iothread lock, initialises the
 * KVM vCPU (exiting the process on failure) and its signals, and signals
 * qemu_cpu_cond once the CPU is marked created. It then alternates between
 * running the guest and waiting for I/O events. When the loop ends the vCPU
 * is destroyed, the CPU is marked as no longer created, and the lock and
 * the RCU registration are released.
 *
 * Always returns NULL.
 */
static void *qemu_kvm_cpu_thread_fn(void *arg)
{
    CPUState *cpu = arg;
    int r;

    rcu_register_thread();

    qemu_mutex_lock_iothread();
    qemu_thread_get_self(cpu->thread);
    cpu->thread_id = qemu_get_thread_id();
    cpu->can_do_io = 1;
    current_cpu = cpu;

    r = kvm_init_vcpu(cpu);
    if (r < 0) {
        error_report("kvm_init_vcpu failed: %s", strerror(-r));
        exit(1);
    }

    kvm_init_cpu_signals(cpu);

    /* signal CPU creation */
    cpu->created = true;
    qemu_cond_signal(&qemu_cpu_cond);

    do {
        if (cpu_can_run(cpu)) {
            r = kvm_cpu_exec(cpu);
            if (r == EXCP_DEBUG) {
                cpu_handle_guest_debug(cpu);
            }
        }
        qemu_wait_io_event(cpu);
        /* Keep going until an unplug is requested and the CPU cannot run */
    } while (!cpu->unplug || cpu_can_run(cpu));

    qemu_kvm_destroy_vcpu(cpu);
    /* signal CPU destruction to whoever waits on qemu_cpu_cond */
    cpu->created = false;
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_mutex_unlock_iothread();
    rcu_unregister_thread();
    return NULL;
}
1296
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001297static void *qemu_dummy_cpu_thread_fn(void *arg)
1298{
1299#ifdef _WIN32
Alistair Francis493d89b2018-02-03 09:43:14 +01001300 error_report("qtest is not supported under Windows");
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001301 exit(1);
1302#else
Andreas Färber10a90212013-05-27 02:24:35 +02001303 CPUState *cpu = arg;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001304 sigset_t waitset;
1305 int r;
1306
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001307 rcu_register_thread();
1308
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001309 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001310 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +02001311 cpu->thread_id = qemu_get_thread_id();
Pavel Dovgalyuk626cf8f2014-12-08 10:53:17 +03001312 cpu->can_do_io = 1;
Alex Bennée37257942017-02-23 18:29:14 +00001313 current_cpu = cpu;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001314
1315 sigemptyset(&waitset);
1316 sigaddset(&waitset, SIG_IPI);
1317
1318 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +02001319 cpu->created = true;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001320 qemu_cond_signal(&qemu_cpu_cond);
1321
Paolo Bonzinid2831ab2018-01-30 11:04:53 -05001322 do {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001323 qemu_mutex_unlock_iothread();
1324 do {
1325 int sig;
1326 r = sigwait(&waitset, &sig);
1327 } while (r == -1 && (errno == EAGAIN || errno == EINTR));
1328 if (r == -1) {
1329 perror("sigwait");
1330 exit(1);
1331 }
1332 qemu_mutex_lock_iothread();
Paolo Bonzinidb08b682018-01-11 13:53:12 +01001333 qemu_wait_io_event(cpu);
Paolo Bonzinid2831ab2018-01-30 11:04:53 -05001334 } while (!cpu->unplug);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001335
Paolo Bonzinid2831ab2018-01-30 11:04:53 -05001336 rcu_unregister_thread();
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001337 return NULL;
1338#endif
1339}
1340
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001341static int64_t tcg_get_icount_limit(void)
1342{
1343 int64_t deadline;
1344
1345 if (replay_mode != REPLAY_MODE_PLAY) {
1346 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1347
1348 /* Maintain prior (possibly buggy) behaviour where if no deadline
1349 * was set (as there is no QEMU_CLOCK_VIRTUAL timer) or it is more than
1350 * INT32_MAX nanoseconds ahead, we still use INT32_MAX
1351 * nanoseconds.
1352 */
1353 if ((deadline < 0) || (deadline > INT32_MAX)) {
1354 deadline = INT32_MAX;
1355 }
1356
1357 return qemu_icount_round(deadline);
1358 } else {
1359 return replay_get_instructions();
1360 }
1361}
1362
Alex Bennée12e97002016-10-27 16:10:14 +01001363static void handle_icount_deadline(void)
1364{
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001365 assert(qemu_in_vcpu_thread());
Alex Bennée12e97002016-10-27 16:10:14 +01001366 if (use_icount) {
1367 int64_t deadline =
1368 qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
1369
1370 if (deadline == 0) {
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001371 /* Wake up other AioContexts. */
Alex Bennée12e97002016-10-27 16:10:14 +01001372 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001373 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
Alex Bennée12e97002016-10-27 16:10:14 +01001374 }
1375 }
1376}
1377
Alex Bennée05248382017-03-29 16:46:59 +01001378static void prepare_icount_for_run(CPUState *cpu)
1379{
1380 if (use_icount) {
Alex Bennéeeda5f7c2017-04-05 12:35:48 +01001381 int insns_left;
Alex Bennée05248382017-03-29 16:46:59 +01001382
1383 /* These should always be cleared by process_icount_data after
1384 * each vCPU execution. However u16.high can be raised
1385 * asynchronously by cpu_exit/cpu_interrupt/tcg_handle_interrupt
1386 */
1387 g_assert(cpu->icount_decr.u16.low == 0);
1388 g_assert(cpu->icount_extra == 0);
1389
Alex Bennéeeda5f7c2017-04-05 12:35:48 +01001390 cpu->icount_budget = tcg_get_icount_limit();
1391 insns_left = MIN(0xffff, cpu->icount_budget);
1392 cpu->icount_decr.u16.low = insns_left;
1393 cpu->icount_extra = cpu->icount_budget - insns_left;
Alex Bennéed759c952018-02-27 12:52:48 +03001394
1395 replay_mutex_lock();
Alex Bennée05248382017-03-29 16:46:59 +01001396 }
1397}
1398
1399static void process_icount_data(CPUState *cpu)
1400{
1401 if (use_icount) {
Alex Bennéee4cd9652017-03-31 16:09:42 +01001402 /* Account for executed instructions */
Alex Bennée512d3c82017-04-05 12:32:37 +01001403 cpu_update_icount(cpu);
Alex Bennée05248382017-03-29 16:46:59 +01001404
1405 /* Reset the counters */
1406 cpu->icount_decr.u16.low = 0;
1407 cpu->icount_extra = 0;
Alex Bennéee4cd9652017-03-31 16:09:42 +01001408 cpu->icount_budget = 0;
1409
Alex Bennée05248382017-03-29 16:46:59 +01001410 replay_account_executed_instructions();
Alex Bennéed759c952018-02-27 12:52:48 +03001411
1412 replay_mutex_unlock();
Alex Bennée05248382017-03-29 16:46:59 +01001413 }
1414}
1415
1416
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001417static int tcg_cpu_exec(CPUState *cpu)
1418{
1419 int ret;
1420#ifdef CONFIG_PROFILER
1421 int64_t ti;
1422#endif
1423
Emilio G. Cotaf28d0df2018-06-22 13:45:31 -04001424 assert(tcg_enabled());
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001425#ifdef CONFIG_PROFILER
1426 ti = profile_getclock();
1427#endif
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001428 cpu_exec_start(cpu);
1429 ret = cpu_exec(cpu);
1430 cpu_exec_end(cpu);
1431#ifdef CONFIG_PROFILER
Emilio G. Cota72fd2ef2018-10-10 10:48:53 -04001432 atomic_set(&tcg_ctx->prof.cpu_exec_time,
1433 tcg_ctx->prof.cpu_exec_time + profile_getclock() - ti);
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001434#endif
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001435 return ret;
1436}
1437
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001438/* Destroy any remaining vCPUs which have been unplugged and have
1439 * finished running
1440 */
1441static void deal_with_unplugged_cpus(void)
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001442{
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001443 CPUState *cpu;
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001444
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001445 CPU_FOREACH(cpu) {
1446 if (cpu->unplug && !cpu_can_run(cpu)) {
1447 qemu_tcg_destroy_vcpu(cpu);
1448 cpu->created = false;
1449 qemu_cond_signal(&qemu_cpu_cond);
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001450 break;
1451 }
1452 }
Alex Bennée1be7fcb2016-10-27 16:10:08 +01001453}
Jan Kiszkabdb7ca62011-09-26 09:40:39 +02001454
Alex Bennée65467062017-02-23 18:29:09 +00001455/* Single-threaded TCG
1456 *
1457 * In the single-threaded case each vCPU is simulated in turn. If
1458 * there is more than a single vCPU we create a simple timer to kick
1459 * the vCPU and ensure we don't get stuck in a tight loop in one vCPU.
1460 * This is done explicitly rather than relying on side-effects
1461 * elsewhere.
1462 */
1463
Alex Bennée37257942017-02-23 18:29:14 +00001464static void *qemu_tcg_rr_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001465{
Andreas Färberc3586ba2012-05-03 01:41:24 +02001466 CPUState *cpu = arg;
Blue Swirl296af7c2010-03-29 19:23:50 +00001467
Emilio G. Cotaf28d0df2018-06-22 13:45:31 -04001468 assert(tcg_enabled());
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001469 rcu_register_thread();
Emilio G. Cota3468b592017-07-19 18:57:58 -04001470 tcg_register_thread();
Paolo Bonziniab28bd22015-07-09 08:55:38 +02001471
Paolo Bonzini2e7f7a32015-06-18 18:47:18 +02001472 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +02001473 qemu_thread_get_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001474
David Hildenbrand5a9c9732018-02-09 20:52:39 +01001475 cpu->thread_id = qemu_get_thread_id();
1476 cpu->created = true;
1477 cpu->can_do_io = 1;
Blue Swirl296af7c2010-03-29 19:23:50 +00001478 qemu_cond_signal(&qemu_cpu_cond);
1479
Jan Kiszkafa7d1862011-08-22 18:35:25 +02001480 /* wait for initial kick-off after machine start */
Emilio G. Cotac28e3992015-04-27 12:45:28 -04001481 while (first_cpu->stopped) {
KONRAD Fredericd5f8d612015-08-10 17:27:06 +02001482 qemu_cond_wait(first_cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001483
1484 /* process any pending work */
Andreas Färberbdc44642013-06-24 23:50:24 +02001485 CPU_FOREACH(cpu) {
Alex Bennée37257942017-02-23 18:29:14 +00001486 current_cpu = cpu;
Andreas Färber182735e2013-05-29 22:29:20 +02001487 qemu_wait_io_event_common(cpu);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001488 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001489 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001490
Alex Bennée65467062017-02-23 18:29:09 +00001491 start_tcg_kick_timer();
1492
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001493 cpu = first_cpu;
1494
Alex Bennéee5143e32017-02-23 18:29:12 +00001495 /* process any pending work */
1496 cpu->exit_request = 1;
1497
Blue Swirl296af7c2010-03-29 19:23:50 +00001498 while (1) {
Alex Bennéed759c952018-02-27 12:52:48 +03001499 qemu_mutex_unlock_iothread();
1500 replay_mutex_lock();
1501 qemu_mutex_lock_iothread();
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001502 /* Account partial waits to QEMU_CLOCK_VIRTUAL. */
1503 qemu_account_warp_timer();
1504
Paolo Bonzini6b8f0182017-03-02 19:56:40 +01001505 /* Run the timers here. This is much more efficient than
1506 * waking up the I/O thread and waiting for completion.
1507 */
1508 handle_icount_deadline();
1509
Alex Bennéed759c952018-02-27 12:52:48 +03001510 replay_mutex_unlock();
1511
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001512 if (!cpu) {
1513 cpu = first_cpu;
1514 }
1515
Alex Bennéee5143e32017-02-23 18:29:12 +00001516 while (cpu && !cpu->queued_work_first && !cpu->exit_request) {
1517
Alex Bennée791158d2017-02-23 18:29:10 +00001518 atomic_mb_set(&tcg_current_rr_cpu, cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001519 current_cpu = cpu;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001520
1521 qemu_clock_enable(QEMU_CLOCK_VIRTUAL,
1522 (cpu->singlestep_enabled & SSTEP_NOTIMER) == 0);
1523
1524 if (cpu_can_run(cpu)) {
1525 int r;
Alex Bennée05248382017-03-29 16:46:59 +01001526
Alex Bennéed759c952018-02-27 12:52:48 +03001527 qemu_mutex_unlock_iothread();
Alex Bennée05248382017-03-29 16:46:59 +01001528 prepare_icount_for_run(cpu);
1529
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001530 r = tcg_cpu_exec(cpu);
Alex Bennée05248382017-03-29 16:46:59 +01001531
1532 process_icount_data(cpu);
Alex Bennéed759c952018-02-27 12:52:48 +03001533 qemu_mutex_lock_iothread();
Alex Bennée05248382017-03-29 16:46:59 +01001534
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001535 if (r == EXCP_DEBUG) {
1536 cpu_handle_guest_debug(cpu);
1537 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001538 } else if (r == EXCP_ATOMIC) {
1539 qemu_mutex_unlock_iothread();
1540 cpu_exec_step_atomic(cpu);
1541 qemu_mutex_lock_iothread();
1542 break;
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001543 }
Alex Bennée37257942017-02-23 18:29:14 +00001544 } else if (cpu->stop) {
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001545 if (cpu->unplug) {
1546 cpu = CPU_NEXT(cpu);
1547 }
1548 break;
1549 }
1550
Alex Bennéee5143e32017-02-23 18:29:12 +00001551 cpu = CPU_NEXT(cpu);
1552 } /* while (cpu && !cpu->exit_request).. */
1553
Alex Bennée791158d2017-02-23 18:29:10 +00001554 /* Does not need atomic_mb_set because a spurious wakeup is okay. */
1555 atomic_set(&tcg_current_rr_cpu, NULL);
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001556
Alex Bennéee5143e32017-02-23 18:29:12 +00001557 if (cpu && cpu->exit_request) {
1558 atomic_mb_set(&cpu->exit_request, 0);
1559 }
Alex Blighac70aaf2013-08-21 16:02:57 +01001560
Clement Deschamps013aabd2018-10-21 16:21:03 +02001561 if (use_icount && all_cpu_threads_idle()) {
1562 /*
1563 * When all cpus are sleeping (e.g in WFI), to avoid a deadlock
1564 * in the main_loop, wake it up in order to start the warp timer.
1565 */
1566 qemu_notify_event();
1567 }
1568
Paolo Bonzinia8efa602018-11-14 12:36:57 +01001569 qemu_tcg_rr_wait_io_event();
Alex Bennéec93bbbe2016-10-27 16:10:09 +01001570 deal_with_unplugged_cpus();
Blue Swirl296af7c2010-03-29 19:23:50 +00001571 }
1572
Paolo Bonzini9b0605f2018-01-30 11:05:06 -05001573 rcu_unregister_thread();
Blue Swirl296af7c2010-03-29 19:23:50 +00001574 return NULL;
1575}
1576
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001577static void *qemu_hax_cpu_thread_fn(void *arg)
1578{
1579 CPUState *cpu = arg;
1580 int r;
Vincent Palatinb3d3a422017-03-20 11:15:49 +01001581
Paolo Bonzini9857c2d2018-01-30 16:28:49 +01001582 rcu_register_thread();
Vincent Palatinb3d3a422017-03-20 11:15:49 +01001583 qemu_mutex_lock_iothread();
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001584 qemu_thread_get_self(cpu->thread);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001585
1586 cpu->thread_id = qemu_get_thread_id();
1587 cpu->created = true;
1588 cpu->halted = 0;
1589 current_cpu = cpu;
1590
1591 hax_init_vcpu(cpu);
1592 qemu_cond_signal(&qemu_cpu_cond);
1593
Paolo Bonzini9857c2d2018-01-30 16:28:49 +01001594 do {
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001595 if (cpu_can_run(cpu)) {
1596 r = hax_smp_cpu_exec(cpu);
1597 if (r == EXCP_DEBUG) {
1598 cpu_handle_guest_debug(cpu);
1599 }
1600 }
1601
Paolo Bonzinidb08b682018-01-11 13:53:12 +01001602 qemu_wait_io_event(cpu);
Paolo Bonzini9857c2d2018-01-30 16:28:49 +01001603 } while (!cpu->unplug || cpu_can_run(cpu));
1604 rcu_unregister_thread();
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001605 return NULL;
1606}
1607
Sergio Andres Gomez Del Realc97d6d22017-09-13 04:05:09 -05001608/* The HVF-specific vCPU thread function. This one should only run when the host
1609 * CPU supports the VMX "unrestricted guest" feature. */
1610static void *qemu_hvf_cpu_thread_fn(void *arg)
1611{
1612 CPUState *cpu = arg;
1613
1614 int r;
1615
1616 assert(hvf_enabled());
1617
1618 rcu_register_thread();
1619
1620 qemu_mutex_lock_iothread();
1621 qemu_thread_get_self(cpu->thread);
1622
1623 cpu->thread_id = qemu_get_thread_id();
1624 cpu->can_do_io = 1;
1625 current_cpu = cpu;
1626
1627 hvf_init_vcpu(cpu);
1628
1629 /* signal CPU creation */
1630 cpu->created = true;
1631 qemu_cond_signal(&qemu_cpu_cond);
1632
1633 do {
1634 if (cpu_can_run(cpu)) {
1635 r = hvf_vcpu_exec(cpu);
1636 if (r == EXCP_DEBUG) {
1637 cpu_handle_guest_debug(cpu);
1638 }
1639 }
Paolo Bonzinidb08b682018-01-11 13:53:12 +01001640 qemu_wait_io_event(cpu);
Sergio Andres Gomez Del Realc97d6d22017-09-13 04:05:09 -05001641 } while (!cpu->unplug || cpu_can_run(cpu));
1642
1643 hvf_vcpu_destroy(cpu);
1644 cpu->created = false;
1645 qemu_cond_signal(&qemu_cpu_cond);
1646 qemu_mutex_unlock_iothread();
Paolo Bonzini8178e632018-01-30 11:05:21 -05001647 rcu_unregister_thread();
Sergio Andres Gomez Del Realc97d6d22017-09-13 04:05:09 -05001648 return NULL;
1649}
1650
Justin Terry (VM)19306802018-01-22 13:07:49 -08001651static void *qemu_whpx_cpu_thread_fn(void *arg)
1652{
1653 CPUState *cpu = arg;
1654 int r;
1655
1656 rcu_register_thread();
1657
1658 qemu_mutex_lock_iothread();
1659 qemu_thread_get_self(cpu->thread);
1660 cpu->thread_id = qemu_get_thread_id();
1661 current_cpu = cpu;
1662
1663 r = whpx_init_vcpu(cpu);
1664 if (r < 0) {
1665 fprintf(stderr, "whpx_init_vcpu failed: %s\n", strerror(-r));
1666 exit(1);
1667 }
1668
1669 /* signal CPU creation */
1670 cpu->created = true;
1671 qemu_cond_signal(&qemu_cpu_cond);
1672
1673 do {
1674 if (cpu_can_run(cpu)) {
1675 r = whpx_vcpu_exec(cpu);
1676 if (r == EXCP_DEBUG) {
1677 cpu_handle_guest_debug(cpu);
1678 }
1679 }
1680 while (cpu_thread_is_idle(cpu)) {
1681 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
1682 }
1683 qemu_wait_io_event_common(cpu);
1684 } while (!cpu->unplug || cpu_can_run(cpu));
1685
1686 whpx_destroy_vcpu(cpu);
1687 cpu->created = false;
1688 qemu_cond_signal(&qemu_cpu_cond);
1689 qemu_mutex_unlock_iothread();
1690 rcu_unregister_thread();
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001691 return NULL;
1692}
1693
#if defined(_WIN32)
/* APC routine that intentionally does nothing; qemu_cpu_kick_thread()
 * queues it on a vCPU thread with QueueUserAPC().
 */
static void CALLBACK dummy_apc_func(ULONG_PTR unused)
{
    /* nothing to do */
}
#endif /* _WIN32 */
1699
Alex Bennée37257942017-02-23 18:29:14 +00001700/* Multi-threaded TCG
1701 *
1702 * In the multi-threaded case each vCPU has its own thread. The TLS
1703 * variable current_cpu can be used deep in the code to find the
1704 * current CPUState for a given thread.
1705 */
1706
1707static void *qemu_tcg_cpu_thread_fn(void *arg)
1708{
1709 CPUState *cpu = arg;
1710
Emilio G. Cotaf28d0df2018-06-22 13:45:31 -04001711 assert(tcg_enabled());
Alex Bennéebf51c722017-03-30 18:32:29 +01001712 g_assert(!use_icount);
1713
Alex Bennée37257942017-02-23 18:29:14 +00001714 rcu_register_thread();
Emilio G. Cota3468b592017-07-19 18:57:58 -04001715 tcg_register_thread();
Alex Bennée37257942017-02-23 18:29:14 +00001716
1717 qemu_mutex_lock_iothread();
1718 qemu_thread_get_self(cpu->thread);
1719
1720 cpu->thread_id = qemu_get_thread_id();
1721 cpu->created = true;
1722 cpu->can_do_io = 1;
1723 current_cpu = cpu;
1724 qemu_cond_signal(&qemu_cpu_cond);
1725
1726 /* process any pending work */
1727 cpu->exit_request = 1;
1728
Cédric Le Goater54961aa2018-04-25 15:18:28 +02001729 do {
Alex Bennée37257942017-02-23 18:29:14 +00001730 if (cpu_can_run(cpu)) {
1731 int r;
Alex Bennéed759c952018-02-27 12:52:48 +03001732 qemu_mutex_unlock_iothread();
Alex Bennée37257942017-02-23 18:29:14 +00001733 r = tcg_cpu_exec(cpu);
Alex Bennéed759c952018-02-27 12:52:48 +03001734 qemu_mutex_lock_iothread();
Alex Bennée37257942017-02-23 18:29:14 +00001735 switch (r) {
1736 case EXCP_DEBUG:
1737 cpu_handle_guest_debug(cpu);
1738 break;
1739 case EXCP_HALTED:
1740 /* during start-up the vCPU is reset and the thread is
1741 * kicked several times. If we don't ensure we go back
1742 * to sleep in the halted state we won't cleanly
1743 * start-up when the vCPU is enabled.
1744 *
1745 * cpu->halted should ensure we sleep in wait_io_event
1746 */
1747 g_assert(cpu->halted);
1748 break;
Pranith Kumar08e73c42017-02-23 18:29:15 +00001749 case EXCP_ATOMIC:
1750 qemu_mutex_unlock_iothread();
1751 cpu_exec_step_atomic(cpu);
1752 qemu_mutex_lock_iothread();
Alex Bennée37257942017-02-23 18:29:14 +00001753 default:
1754 /* Ignore everything else? */
1755 break;
1756 }
1757 }
1758
Alex Bennée37257942017-02-23 18:29:14 +00001759 atomic_mb_set(&cpu->exit_request, 0);
Paolo Bonzinidb08b682018-01-11 13:53:12 +01001760 qemu_wait_io_event(cpu);
Paolo Bonzini9b0605f2018-01-30 11:05:06 -05001761 } while (!cpu->unplug || cpu_can_run(cpu));
Alex Bennée37257942017-02-23 18:29:14 +00001762
Paolo Bonzini9b0605f2018-01-30 11:05:06 -05001763 qemu_tcg_destroy_vcpu(cpu);
1764 cpu->created = false;
1765 qemu_cond_signal(&qemu_cpu_cond);
1766 qemu_mutex_unlock_iothread();
1767 rcu_unregister_thread();
Alex Bennée37257942017-02-23 18:29:14 +00001768 return NULL;
1769}
1770
Andreas Färber2ff09a42012-05-03 00:23:30 +02001771static void qemu_cpu_kick_thread(CPUState *cpu)
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001772{
1773#ifndef _WIN32
1774 int err;
1775
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001776 if (cpu->thread_kicked) {
1777 return;
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001778 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001779 cpu->thread_kicked = true;
Andreas Färber814e6122012-05-02 17:00:37 +02001780 err = pthread_kill(cpu->thread->thread, SIG_IPI);
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001781 if (err) {
1782 fprintf(stderr, "qemu:%s: %s", __func__, strerror(err));
1783 exit(1);
1784 }
1785#else /* _WIN32 */
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001786 if (!qemu_cpu_is_self(cpu)) {
Justin Terry (VM)19306802018-01-22 13:07:49 -08001787 if (whpx_enabled()) {
1788 whpx_vcpu_kick(cpu);
1789 } else if (!QueueUserAPC(dummy_apc_func, cpu->hThread, 0)) {
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001790 fprintf(stderr, "%s: QueueUserAPC failed with error %lu\n",
1791 __func__, GetLastError());
1792 exit(1);
1793 }
1794 }
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001795#endif
1796}
1797
Andreas Färberc08d7422012-05-03 04:34:15 +02001798void qemu_cpu_kick(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001799{
Andreas Färberf5c121b2012-05-03 01:22:49 +02001800 qemu_cond_broadcast(cpu->halt_cond);
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001801 if (tcg_enabled()) {
Alex Bennée791158d2017-02-23 18:29:10 +00001802 cpu_exit(cpu);
Alex Bennée37257942017-02-23 18:29:14 +00001803 /* NOP unless doing single-thread RR */
Alex Bennée791158d2017-02-23 18:29:10 +00001804 qemu_cpu_kick_rr_cpu();
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001805 } else {
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001806 if (hax_enabled()) {
1807 /*
1808 * FIXME: race condition with the exit_request check in
1809 * hax_vcpu_hax_exec
1810 */
1811 cpu->exit_request = 1;
1812 }
Paolo Bonzinie0c38212015-08-26 00:19:19 +02001813 qemu_cpu_kick_thread(cpu);
1814 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001815}
1816
Jan Kiszka46d62fa2011-02-01 22:15:59 +01001817void qemu_cpu_kick_self(void)
1818{
Andreas Färber4917cf42013-05-27 05:17:50 +02001819 assert(current_cpu);
Paolo Bonzini9102ded2015-08-18 06:52:09 -07001820 qemu_cpu_kick_thread(current_cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001821}
1822
Andreas Färber60e82572012-05-02 22:23:49 +02001823bool qemu_cpu_is_self(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001824{
Andreas Färber814e6122012-05-02 17:00:37 +02001825 return qemu_thread_is_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001826}
1827
Paolo Bonzini79e2b9a2015-01-21 12:09:14 +01001828bool qemu_in_vcpu_thread(void)
Juan Quintelaaa723c22012-09-18 16:30:11 +02001829{
Andreas Färber4917cf42013-05-27 05:17:50 +02001830 return current_cpu && qemu_cpu_is_self(current_cpu);
Juan Quintelaaa723c22012-09-18 16:30:11 +02001831}
1832
/* Per-thread flag: set while this thread holds the iothread lock (BQL). */
static __thread bool iothread_locked;

/* Report whether the calling thread currently holds the iothread lock. */
bool qemu_mutex_iothread_locked(void)
{
    return iothread_locked;
}
1839
Emilio G. Cotacb764d02017-10-28 02:16:41 -04001840/*
1841 * The BQL is taken from so many places that it is worth profiling the
1842 * callers directly, instead of funneling them all through a single function.
1843 */
1844void qemu_mutex_lock_iothread_impl(const char *file, int line)
Blue Swirl296af7c2010-03-29 19:23:50 +00001845{
Emilio G. Cotacb764d02017-10-28 02:16:41 -04001846 QemuMutexLockFunc bql_lock = atomic_read(&qemu_bql_mutex_lock_func);
1847
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001848 g_assert(!qemu_mutex_iothread_locked());
Emilio G. Cotacb764d02017-10-28 02:16:41 -04001849 bql_lock(&qemu_global_mutex, file, line);
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001850 iothread_locked = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001851}
1852
1853void qemu_mutex_unlock_iothread(void)
1854{
Jan Kiszka8d04fb52017-02-23 18:29:11 +00001855 g_assert(qemu_mutex_iothread_locked());
Paolo Bonziniafbe7052015-06-18 18:47:19 +02001856 iothread_locked = false;
Blue Swirl296af7c2010-03-29 19:23:50 +00001857 qemu_mutex_unlock(&qemu_global_mutex);
1858}
1859
Alex Bennéee8faee02016-10-27 16:09:58 +01001860static bool all_vcpus_paused(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001861{
Andreas Färberbdc44642013-06-24 23:50:24 +02001862 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001863
Andreas Färberbdc44642013-06-24 23:50:24 +02001864 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001865 if (!cpu->stopped) {
Alex Bennéee8faee02016-10-27 16:09:58 +01001866 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001867 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001868 }
1869
Alex Bennéee8faee02016-10-27 16:09:58 +01001870 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001871}
1872
1873void pause_all_vcpus(void)
1874{
Andreas Färberbdc44642013-06-24 23:50:24 +02001875 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001876
Alex Bligh40daca52013-08-21 16:03:02 +01001877 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, false);
Andreas Färberbdc44642013-06-24 23:50:24 +02001878 CPU_FOREACH(cpu) {
David Hildenbrandebd05fe2017-11-29 20:12:15 +01001879 if (qemu_cpu_is_self(cpu)) {
1880 qemu_cpu_stop(cpu, true);
1881 } else {
1882 cpu->stop = true;
1883 qemu_cpu_kick(cpu);
1884 }
Jan Kiszkad798e972012-02-17 18:31:16 +01001885 }
1886
Alex Bennéed759c952018-02-27 12:52:48 +03001887 /* We need to drop the replay_lock so any vCPU threads woken up
1888 * can finish their replay tasks
1889 */
1890 replay_mutex_unlock();
1891
Blue Swirl296af7c2010-03-29 19:23:50 +00001892 while (!all_vcpus_paused()) {
Paolo Bonzinibe7d6c52011-03-12 17:44:02 +01001893 qemu_cond_wait(&qemu_pause_cond, &qemu_global_mutex);
Andreas Färberbdc44642013-06-24 23:50:24 +02001894 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001895 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001896 }
1897 }
Alex Bennéed759c952018-02-27 12:52:48 +03001898
1899 qemu_mutex_unlock_iothread();
1900 replay_mutex_lock();
1901 qemu_mutex_lock_iothread();
Blue Swirl296af7c2010-03-29 19:23:50 +00001902}
1903
Igor Mammedov29936832013-04-23 10:29:37 +02001904void cpu_resume(CPUState *cpu)
1905{
1906 cpu->stop = false;
1907 cpu->stopped = false;
1908 qemu_cpu_kick(cpu);
1909}
1910
Blue Swirl296af7c2010-03-29 19:23:50 +00001911void resume_all_vcpus(void)
1912{
Andreas Färberbdc44642013-06-24 23:50:24 +02001913 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001914
Alex Bligh40daca52013-08-21 16:03:02 +01001915 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, true);
Andreas Färberbdc44642013-06-24 23:50:24 +02001916 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001917 cpu_resume(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001918 }
1919}
1920
Paolo Bonzinidbadee42018-01-30 16:40:12 +01001921void cpu_remove_sync(CPUState *cpu)
Gu Zheng4c055ab2016-05-12 09:18:13 +05301922{
1923 cpu->stop = true;
1924 cpu->unplug = true;
1925 qemu_cpu_kick(cpu);
Paolo Bonzinidbadee42018-01-30 16:40:12 +01001926 qemu_mutex_unlock_iothread();
1927 qemu_thread_join(cpu->thread);
1928 qemu_mutex_lock_iothread();
Bharata B Rao2c579042016-05-12 09:18:14 +05301929}
1930
/* Size in bytes (terminating NUL included) of the temporary buffers used
 * to form vCPU thread names.
 */
#define VCPU_THREAD_NAME_SIZE 16
1933
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001934static void qemu_tcg_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001935{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001936 char thread_name[VCPU_THREAD_NAME_SIZE];
Alex Bennée37257942017-02-23 18:29:14 +00001937 static QemuCond *single_tcg_halt_cond;
1938 static QemuThread *single_tcg_cpu_thread;
Emilio G. Cotae8feb962017-07-07 19:24:20 -04001939 static int tcg_region_inited;
1940
Emilio G. Cotaf28d0df2018-06-22 13:45:31 -04001941 assert(tcg_enabled());
Emilio G. Cotae8feb962017-07-07 19:24:20 -04001942 /*
1943 * Initialize TCG regions--once. Now is a good time, because:
1944 * (1) TCG's init context, prologue and target globals have been set up.
1945 * (2) qemu_tcg_mttcg_enabled() works now (TCG init code runs before the
1946 * -accel flag is processed, so the check doesn't work then).
1947 */
1948 if (!tcg_region_inited) {
1949 tcg_region_inited = 1;
1950 tcg_region_init();
1951 }
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001952
Alex Bennée37257942017-02-23 18:29:14 +00001953 if (qemu_tcg_mttcg_enabled() || !single_tcg_cpu_thread) {
Andreas Färber814e6122012-05-02 17:00:37 +02001954 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001955 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1956 qemu_cond_init(cpu->halt_cond);
Alex Bennée37257942017-02-23 18:29:14 +00001957
1958 if (qemu_tcg_mttcg_enabled()) {
1959 /* create a thread per vCPU with TCG (MTTCG) */
1960 parallel_cpus = true;
1961 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/TCG",
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001962 cpu->cpu_index);
Alex Bennée37257942017-02-23 18:29:14 +00001963
1964 qemu_thread_create(cpu->thread, thread_name, qemu_tcg_cpu_thread_fn,
1965 cpu, QEMU_THREAD_JOINABLE);
1966
1967 } else {
1968 /* share a single thread for all cpus with TCG */
1969 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "ALL CPUs/TCG");
1970 qemu_thread_create(cpu->thread, thread_name,
1971 qemu_tcg_rr_cpu_thread_fn,
1972 cpu, QEMU_THREAD_JOINABLE);
1973
1974 single_tcg_halt_cond = cpu->halt_cond;
1975 single_tcg_cpu_thread = cpu->thread;
1976 }
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001977#ifdef _WIN32
Andreas Färber814e6122012-05-02 17:00:37 +02001978 cpu->hThread = qemu_thread_get_handle(cpu->thread);
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001979#endif
Blue Swirl296af7c2010-03-29 19:23:50 +00001980 } else {
Alex Bennée37257942017-02-23 18:29:14 +00001981 /* For non-MTTCG cases we share the thread */
1982 cpu->thread = single_tcg_cpu_thread;
1983 cpu->halt_cond = single_tcg_halt_cond;
David Hildenbranda3421732018-02-09 20:52:37 +01001984 cpu->thread_id = first_cpu->thread_id;
1985 cpu->can_do_io = 1;
1986 cpu->created = true;
Blue Swirl296af7c2010-03-29 19:23:50 +00001987 }
1988}
1989
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01001990static void qemu_hax_start_vcpu(CPUState *cpu)
1991{
1992 char thread_name[VCPU_THREAD_NAME_SIZE];
1993
1994 cpu->thread = g_malloc0(sizeof(QemuThread));
1995 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1996 qemu_cond_init(cpu->halt_cond);
1997
1998 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/HAX",
1999 cpu->cpu_index);
2000 qemu_thread_create(cpu->thread, thread_name, qemu_hax_cpu_thread_fn,
2001 cpu, QEMU_THREAD_JOINABLE);
2002#ifdef _WIN32
2003 cpu->hThread = qemu_thread_get_handle(cpu->thread);
2004#endif
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01002005}
2006
Andreas Färber48a106b2013-05-27 02:20:39 +02002007static void qemu_kvm_start_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00002008{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00002009 char thread_name[VCPU_THREAD_NAME_SIZE];
2010
Andreas Färber814e6122012-05-02 17:00:37 +02002011 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02002012 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
2013 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00002014 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/KVM",
2015 cpu->cpu_index);
2016 qemu_thread_create(cpu->thread, thread_name, qemu_kvm_cpu_thread_fn,
2017 cpu, QEMU_THREAD_JOINABLE);
Blue Swirl296af7c2010-03-29 19:23:50 +00002018}
2019
Sergio Andres Gomez Del Realc97d6d22017-09-13 04:05:09 -05002020static void qemu_hvf_start_vcpu(CPUState *cpu)
2021{
2022 char thread_name[VCPU_THREAD_NAME_SIZE];
2023
2024 /* HVF currently does not support TCG, and only runs in
2025 * unrestricted-guest mode. */
2026 assert(hvf_enabled());
2027
2028 cpu->thread = g_malloc0(sizeof(QemuThread));
2029 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
2030 qemu_cond_init(cpu->halt_cond);
2031
2032 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/HVF",
2033 cpu->cpu_index);
2034 qemu_thread_create(cpu->thread, thread_name, qemu_hvf_cpu_thread_fn,
2035 cpu, QEMU_THREAD_JOINABLE);
Sergio Andres Gomez Del Realc97d6d22017-09-13 04:05:09 -05002036}
2037
Justin Terry (VM)19306802018-01-22 13:07:49 -08002038static void qemu_whpx_start_vcpu(CPUState *cpu)
2039{
2040 char thread_name[VCPU_THREAD_NAME_SIZE];
2041
2042 cpu->thread = g_malloc0(sizeof(QemuThread));
2043 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
2044 qemu_cond_init(cpu->halt_cond);
2045 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/WHPX",
2046 cpu->cpu_index);
2047 qemu_thread_create(cpu->thread, thread_name, qemu_whpx_cpu_thread_fn,
2048 cpu, QEMU_THREAD_JOINABLE);
2049#ifdef _WIN32
2050 cpu->hThread = qemu_thread_get_handle(cpu->thread);
2051#endif
Justin Terry (VM)19306802018-01-22 13:07:49 -08002052}
2053
Andreas Färber10a90212013-05-27 02:24:35 +02002054static void qemu_dummy_start_vcpu(CPUState *cpu)
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02002055{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00002056 char thread_name[VCPU_THREAD_NAME_SIZE];
2057
Andreas Färber814e6122012-05-02 17:00:37 +02002058 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02002059 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
2060 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00002061 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/DUMMY",
2062 cpu->cpu_index);
2063 qemu_thread_create(cpu->thread, thread_name, qemu_dummy_cpu_thread_fn, cpu,
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02002064 QEMU_THREAD_JOINABLE);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02002065}
2066
Andreas Färberc643bed2013-05-27 03:23:24 +02002067void qemu_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00002068{
Andreas Färberce3960e2012-12-17 03:27:07 +01002069 cpu->nr_cores = smp_cores;
2070 cpu->nr_threads = smp_threads;
Andreas Färberf324e762012-05-02 23:26:21 +02002071 cpu->stopped = true;
Peter Maydell56943e82016-01-21 14:15:04 +00002072
2073 if (!cpu->as) {
2074 /* If the target cpu hasn't set up any address spaces itself,
2075 * give it the default one.
2076 */
Peter Maydell12ebc9a2016-01-21 14:15:04 +00002077 cpu->num_ases = 1;
Peter Xu80ceb072017-11-23 17:23:32 +08002078 cpu_address_space_init(cpu, 0, "cpu-memory", cpu->memory);
Peter Maydell56943e82016-01-21 14:15:04 +00002079 }
2080
Jan Kiszka0ab07c62011-02-07 12:19:14 +01002081 if (kvm_enabled()) {
Andreas Färber48a106b2013-05-27 02:20:39 +02002082 qemu_kvm_start_vcpu(cpu);
Vincent Palatinb0cb0a62017-01-10 11:59:57 +01002083 } else if (hax_enabled()) {
2084 qemu_hax_start_vcpu(cpu);
Sergio Andres Gomez Del Realc97d6d22017-09-13 04:05:09 -05002085 } else if (hvf_enabled()) {
2086 qemu_hvf_start_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02002087 } else if (tcg_enabled()) {
Andreas Färbere5ab30a2012-05-03 01:50:44 +02002088 qemu_tcg_init_vcpu(cpu);
Justin Terry (VM)19306802018-01-22 13:07:49 -08002089 } else if (whpx_enabled()) {
2090 qemu_whpx_start_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02002091 } else {
Andreas Färber10a90212013-05-27 02:24:35 +02002092 qemu_dummy_start_vcpu(cpu);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01002093 }
David Hildenbrand81e96312018-02-09 20:52:38 +01002094
2095 while (!cpu->created) {
2096 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
2097 }
Blue Swirl296af7c2010-03-29 19:23:50 +00002098}
2099
Jan Kiszkab4a3d962011-02-01 22:15:43 +01002100void cpu_stop_current(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00002101{
Andreas Färber4917cf42013-05-27 05:17:50 +02002102 if (current_cpu) {
David Hildenbrandebd05fe2017-11-29 20:12:15 +01002103 qemu_cpu_stop(current_cpu, true);
Jan Kiszkab4a3d962011-02-01 22:15:43 +01002104 }
Blue Swirl296af7c2010-03-29 19:23:50 +00002105}
2106
Kevin Wolf56983462013-07-05 13:49:54 +02002107int vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +00002108{
Juan Quintelaaa723c22012-09-18 16:30:11 +02002109 if (qemu_in_vcpu_thread()) {
Paolo Bonzini74892d22014-06-05 14:53:58 +02002110 qemu_system_vmstop_request_prepare();
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -03002111 qemu_system_vmstop_request(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00002112 /*
2113 * FIXME: should not return to device code in case
2114 * vm_stop() has been requested.
2115 */
Jan Kiszkab4a3d962011-02-01 22:15:43 +01002116 cpu_stop_current();
Kevin Wolf56983462013-07-05 13:49:54 +02002117 return 0;
Blue Swirl296af7c2010-03-29 19:23:50 +00002118 }
Kevin Wolf56983462013-07-05 13:49:54 +02002119
Stefan Hajnoczi4486e892018-03-07 14:42:05 +00002120 return do_vm_stop(state, true);
Blue Swirl296af7c2010-03-29 19:23:50 +00002121}
2122
Claudio Imbrenda2d76e822017-02-14 18:07:47 +01002123/**
2124 * Prepare for (re)starting the VM.
2125 * Returns -1 if the vCPUs are not to be restarted (e.g. if they are already
2126 * running or in case of an error condition), 0 otherwise.
2127 */
2128int vm_prepare_start(void)
2129{
2130 RunState requested;
Claudio Imbrenda2d76e822017-02-14 18:07:47 +01002131
2132 qemu_vmstop_requested(&requested);
2133 if (runstate_is_running() && requested == RUN_STATE__MAX) {
2134 return -1;
2135 }
2136
2137 /* Ensure that a STOP/RESUME pair of events is emitted if a
2138 * vmstop request was pending. The BLOCK_IO_ERROR event, for
2139 * example, according to documentation is always followed by
2140 * the STOP event.
2141 */
2142 if (runstate_is_running()) {
Peter Xu3ab72382018-08-15 21:37:37 +08002143 qapi_event_send_stop();
2144 qapi_event_send_resume();
Markus Armbrusterf0561582018-04-23 10:45:18 +02002145 return -1;
Claudio Imbrenda2d76e822017-02-14 18:07:47 +01002146 }
2147
2148 /* We are sending this now, but the CPUs will be resumed shortly later */
Peter Xu3ab72382018-08-15 21:37:37 +08002149 qapi_event_send_resume();
Markus Armbrusterf0561582018-04-23 10:45:18 +02002150
2151 replay_enable_events();
2152 cpu_enable_ticks();
2153 runstate_set(RUN_STATE_RUNNING);
2154 vm_state_notify(1, RUN_STATE_RUNNING);
2155 return 0;
Claudio Imbrenda2d76e822017-02-14 18:07:47 +01002156}
2157
/*
 * Start (or restart) the VM: resume all vCPUs, but only when
 * vm_prepare_start() reports success by returning 0.
 */
void vm_start(void)
{
    if (vm_prepare_start() != 0) {
        return;
    }

    resume_all_vcpus();
}
2164
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03002165/* does a state transition even if the VM is already stopped,
2166 current state is forgotten forever */
Kevin Wolf56983462013-07-05 13:49:54 +02002167int vm_stop_force_state(RunState state)
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03002168{
2169 if (runstate_is_running()) {
Kevin Wolf56983462013-07-05 13:49:54 +02002170 return vm_stop(state);
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03002171 } else {
2172 runstate_set(state);
Wen Congyangb2780d32015-11-20 17:34:38 +08002173
2174 bdrv_drain_all();
Kevin Wolf594a45c2013-07-18 14:52:19 +02002175 /* Make sure to return an error if the flush in a previous vm_stop()
2176 * failed. */
John Snow22af08e2016-09-22 21:45:51 -04002177 return bdrv_flush_all();
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03002178 }
2179}
2180
Stefan Weil9a78eea2010-10-22 23:03:33 +02002181void list_cpus(FILE *f, fprintf_function cpu_fprintf, const char *optarg)
Blue Swirl262353c2010-05-04 19:55:35 +00002182{
2183 /* XXX: implement xxx_cpu_list for targets that still miss it */
Peter Maydelle916cbf2012-09-05 17:41:08 -03002184#if defined(cpu_list)
2185 cpu_list(f, cpu_fprintf);
Blue Swirl262353c2010-05-04 19:55:35 +00002186#endif
2187}
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002188
2189CpuInfoList *qmp_query_cpus(Error **errp)
2190{
Igor Mammedovafed5a52017-05-10 13:29:55 +02002191 MachineState *ms = MACHINE(qdev_get_machine());
2192 MachineClass *mc = MACHINE_GET_CLASS(ms);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002193 CpuInfoList *head = NULL, *cur_item = NULL;
Andreas Färber182735e2013-05-29 22:29:20 +02002194 CPUState *cpu;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002195
Andreas Färberbdc44642013-06-24 23:50:24 +02002196 CPU_FOREACH(cpu) {
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002197 CpuInfoList *info;
Andreas Färber182735e2013-05-29 22:29:20 +02002198#if defined(TARGET_I386)
2199 X86CPU *x86_cpu = X86_CPU(cpu);
2200 CPUX86State *env = &x86_cpu->env;
2201#elif defined(TARGET_PPC)
2202 PowerPCCPU *ppc_cpu = POWERPC_CPU(cpu);
2203 CPUPPCState *env = &ppc_cpu->env;
2204#elif defined(TARGET_SPARC)
2205 SPARCCPU *sparc_cpu = SPARC_CPU(cpu);
2206 CPUSPARCState *env = &sparc_cpu->env;
Michael Clark25fa1942018-03-03 01:32:59 +13002207#elif defined(TARGET_RISCV)
2208 RISCVCPU *riscv_cpu = RISCV_CPU(cpu);
2209 CPURISCVState *env = &riscv_cpu->env;
Andreas Färber182735e2013-05-29 22:29:20 +02002210#elif defined(TARGET_MIPS)
2211 MIPSCPU *mips_cpu = MIPS_CPU(cpu);
2212 CPUMIPSState *env = &mips_cpu->env;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01002213#elif defined(TARGET_TRICORE)
2214 TriCoreCPU *tricore_cpu = TRICORE_CPU(cpu);
2215 CPUTriCoreState *env = &tricore_cpu->env;
Viktor Mihajlovski9d0306d2018-02-16 17:08:37 +01002216#elif defined(TARGET_S390X)
2217 S390CPU *s390_cpu = S390_CPU(cpu);
2218 CPUS390XState *env = &s390_cpu->env;
Andreas Färber182735e2013-05-29 22:29:20 +02002219#endif
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002220
Andreas Färbercb446ec2013-05-01 14:24:52 +02002221 cpu_synchronize_state(cpu);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002222
2223 info = g_malloc0(sizeof(*info));
2224 info->value = g_malloc0(sizeof(*info->value));
Andreas Färber55e5c282012-12-17 06:18:02 +01002225 info->value->CPU = cpu->cpu_index;
Andreas Färber182735e2013-05-29 22:29:20 +02002226 info->value->current = (cpu == first_cpu);
Andreas Färber259186a2013-01-17 18:51:17 +01002227 info->value->halted = cpu->halted;
Eduardo Habkost58f88d42015-05-08 16:04:22 -03002228 info->value->qom_path = object_get_canonical_path(OBJECT(cpu));
Andreas Färber9f09e182012-05-03 06:59:07 +02002229 info->value->thread_id = cpu->thread_id;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002230#if defined(TARGET_I386)
Eric Blake86f4b682015-11-18 01:52:59 -07002231 info->value->arch = CPU_INFO_ARCH_X86;
Eric Blake544a3732016-02-17 23:48:27 -07002232 info->value->u.x86.pc = env->eip + env->segs[R_CS].base;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002233#elif defined(TARGET_PPC)
Eric Blake86f4b682015-11-18 01:52:59 -07002234 info->value->arch = CPU_INFO_ARCH_PPC;
Eric Blake544a3732016-02-17 23:48:27 -07002235 info->value->u.ppc.nip = env->nip;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002236#elif defined(TARGET_SPARC)
Eric Blake86f4b682015-11-18 01:52:59 -07002237 info->value->arch = CPU_INFO_ARCH_SPARC;
Eric Blake544a3732016-02-17 23:48:27 -07002238 info->value->u.q_sparc.pc = env->pc;
2239 info->value->u.q_sparc.npc = env->npc;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002240#elif defined(TARGET_MIPS)
Eric Blake86f4b682015-11-18 01:52:59 -07002241 info->value->arch = CPU_INFO_ARCH_MIPS;
Eric Blake544a3732016-02-17 23:48:27 -07002242 info->value->u.q_mips.PC = env->active_tc.PC;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01002243#elif defined(TARGET_TRICORE)
Eric Blake86f4b682015-11-18 01:52:59 -07002244 info->value->arch = CPU_INFO_ARCH_TRICORE;
Eric Blake544a3732016-02-17 23:48:27 -07002245 info->value->u.tricore.PC = env->PC;
Viktor Mihajlovski9d0306d2018-02-16 17:08:37 +01002246#elif defined(TARGET_S390X)
2247 info->value->arch = CPU_INFO_ARCH_S390;
2248 info->value->u.s390.cpu_state = env->cpu_state;
Michael Clark25fa1942018-03-03 01:32:59 +13002249#elif defined(TARGET_RISCV)
2250 info->value->arch = CPU_INFO_ARCH_RISCV;
2251 info->value->u.riscv.pc = env->pc;
Eric Blake86f4b682015-11-18 01:52:59 -07002252#else
2253 info->value->arch = CPU_INFO_ARCH_OTHER;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002254#endif
Igor Mammedovafed5a52017-05-10 13:29:55 +02002255 info->value->has_props = !!mc->cpu_index_to_instance_props;
2256 if (info->value->has_props) {
2257 CpuInstanceProperties *props;
2258 props = g_malloc0(sizeof(*props));
2259 *props = mc->cpu_index_to_instance_props(ms, cpu->cpu_index);
2260 info->value->props = props;
2261 }
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03002262
2263 /* XXX: waiting for the qapi to support GSList */
2264 if (!cur_item) {
2265 head = cur_item = info;
2266 } else {
2267 cur_item->next = info;
2268 cur_item = info;
2269 }
2270 }
2271
2272 return head;
2273}
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02002274
Laszlo Ersekdaa9d2b2018-04-27 21:28:51 +02002275static CpuInfoArch sysemu_target_to_cpuinfo_arch(SysEmuTarget target)
2276{
2277 /*
2278 * The @SysEmuTarget -> @CpuInfoArch mapping below is based on the
2279 * TARGET_ARCH -> TARGET_BASE_ARCH mapping in the "configure" script.
2280 */
2281 switch (target) {
2282 case SYS_EMU_TARGET_I386:
2283 case SYS_EMU_TARGET_X86_64:
2284 return CPU_INFO_ARCH_X86;
2285
2286 case SYS_EMU_TARGET_PPC:
Laszlo Ersekdaa9d2b2018-04-27 21:28:51 +02002287 case SYS_EMU_TARGET_PPC64:
2288 return CPU_INFO_ARCH_PPC;
2289
2290 case SYS_EMU_TARGET_SPARC:
2291 case SYS_EMU_TARGET_SPARC64:
2292 return CPU_INFO_ARCH_SPARC;
2293
2294 case SYS_EMU_TARGET_MIPS:
2295 case SYS_EMU_TARGET_MIPSEL:
2296 case SYS_EMU_TARGET_MIPS64:
2297 case SYS_EMU_TARGET_MIPS64EL:
2298 return CPU_INFO_ARCH_MIPS;
2299
2300 case SYS_EMU_TARGET_TRICORE:
2301 return CPU_INFO_ARCH_TRICORE;
2302
2303 case SYS_EMU_TARGET_S390X:
2304 return CPU_INFO_ARCH_S390;
2305
2306 case SYS_EMU_TARGET_RISCV32:
2307 case SYS_EMU_TARGET_RISCV64:
2308 return CPU_INFO_ARCH_RISCV;
2309
2310 default:
2311 return CPU_INFO_ARCH_OTHER;
2312 }
2313}
2314
2315static void cpustate_to_cpuinfo_s390(CpuInfoS390 *info, const CPUState *cpu)
2316{
2317#ifdef TARGET_S390X
2318 S390CPU *s390_cpu = S390_CPU(cpu);
2319 CPUS390XState *env = &s390_cpu->env;
2320
2321 info->cpu_state = env->cpu_state;
2322#else
2323 abort();
2324#endif
2325}
2326
Luiz Capitulinoce74ee32018-02-16 17:08:38 +01002327/*
2328 * fast means: we NEVER interrupt vCPU threads to retrieve
2329 * information from KVM.
2330 */
2331CpuInfoFastList *qmp_query_cpus_fast(Error **errp)
2332{
2333 MachineState *ms = MACHINE(qdev_get_machine());
2334 MachineClass *mc = MACHINE_GET_CLASS(ms);
2335 CpuInfoFastList *head = NULL, *cur_item = NULL;
Laszlo Ersekdaa9d2b2018-04-27 21:28:51 +02002336 SysEmuTarget target = qapi_enum_parse(&SysEmuTarget_lookup, TARGET_NAME,
2337 -1, &error_abort);
Luiz Capitulinoce74ee32018-02-16 17:08:38 +01002338 CPUState *cpu;
2339
2340 CPU_FOREACH(cpu) {
2341 CpuInfoFastList *info = g_malloc0(sizeof(*info));
2342 info->value = g_malloc0(sizeof(*info->value));
2343
2344 info->value->cpu_index = cpu->cpu_index;
2345 info->value->qom_path = object_get_canonical_path(OBJECT(cpu));
2346 info->value->thread_id = cpu->thread_id;
2347
2348 info->value->has_props = !!mc->cpu_index_to_instance_props;
2349 if (info->value->has_props) {
2350 CpuInstanceProperties *props;
2351 props = g_malloc0(sizeof(*props));
2352 *props = mc->cpu_index_to_instance_props(ms, cpu->cpu_index);
2353 info->value->props = props;
2354 }
2355
Laszlo Ersekdaa9d2b2018-04-27 21:28:51 +02002356 info->value->arch = sysemu_target_to_cpuinfo_arch(target);
2357 info->value->target = target;
2358 if (target == SYS_EMU_TARGET_S390X) {
2359 cpustate_to_cpuinfo_s390(&info->value->u.s390x, cpu);
Laszlo Ersekdaa9d2b2018-04-27 21:28:51 +02002360 }
2361
Luiz Capitulinoce74ee32018-02-16 17:08:38 +01002362 if (!cur_item) {
2363 head = cur_item = info;
2364 } else {
2365 cur_item->next = info;
2366 cur_item = info;
2367 }
2368 }
2369
2370 return head;
2371}
2372
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02002373void qmp_memsave(int64_t addr, int64_t size, const char *filename,
2374 bool has_cpu, int64_t cpu_index, Error **errp)
2375{
2376 FILE *f;
2377 uint32_t l;
Andreas Färber55e5c282012-12-17 06:18:02 +01002378 CPUState *cpu;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02002379 uint8_t buf[1024];
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01002380 int64_t orig_addr = addr, orig_size = size;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02002381
2382 if (!has_cpu) {
2383 cpu_index = 0;
2384 }
2385
Andreas Färber151d1322013-02-15 15:41:49 +01002386 cpu = qemu_get_cpu(cpu_index);
2387 if (cpu == NULL) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01002388 error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "cpu-index",
2389 "a CPU number");
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02002390 return;
2391 }
2392
2393 f = fopen(filename, "wb");
2394 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04002395 error_setg_file_open(errp, errno, filename);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02002396 return;
2397 }
2398
2399 while (size != 0) {
2400 l = sizeof(buf);
2401 if (l > size)
2402 l = size;
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05302403 if (cpu_memory_rw_debug(cpu, addr, buf, l, 0) != 0) {
Borislav Petkov0dc9daf2015-02-08 13:14:38 +01002404 error_setg(errp, "Invalid addr 0x%016" PRIx64 "/size %" PRId64
2405 " specified", orig_addr, orig_size);
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05302406 goto exit;
2407 }
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02002408 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01002409 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02002410 goto exit;
2411 }
2412 addr += l;
2413 size -= l;
2414 }
2415
2416exit:
2417 fclose(f);
2418}
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02002419
2420void qmp_pmemsave(int64_t addr, int64_t size, const char *filename,
2421 Error **errp)
2422{
2423 FILE *f;
2424 uint32_t l;
2425 uint8_t buf[1024];
2426
2427 f = fopen(filename, "wb");
2428 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04002429 error_setg_file_open(errp, errno, filename);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02002430 return;
2431 }
2432
2433 while (size != 0) {
2434 l = sizeof(buf);
2435 if (l > size)
2436 l = size;
Stefan Weileb6282f2014-04-07 20:28:23 +02002437 cpu_physical_memory_read(addr, buf, l);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02002438 if (fwrite(buf, 1, l, f) != l) {
Markus Armbrusterc6bd8c72015-03-17 11:54:50 +01002439 error_setg(errp, QERR_IO_ERROR);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02002440 goto exit;
2441 }
2442 addr += l;
2443 size -= l;
2444 }
2445
2446exit:
2447 fclose(f);
2448}
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02002449
2450void qmp_inject_nmi(Error **errp)
2451{
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +10002452 nmi_monitor_handle(monitor_get_cpu_index(), errp);
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02002453}
Sebastian Tanase27498be2014-07-25 11:56:33 +02002454
2455void dump_drift_info(FILE *f, fprintf_function cpu_fprintf)
2456{
2457 if (!use_icount) {
2458 return;
2459 }
2460
2461 cpu_fprintf(f, "Host - Guest clock %"PRIi64" ms\n",
2462 (cpu_get_clock() - cpu_get_icount())/SCALE_MS);
2463 if (icount_align_option) {
2464 cpu_fprintf(f, "Max guest delay %"PRIi64" ms\n", -max_delay/SCALE_MS);
2465 cpu_fprintf(f, "Max guest advance %"PRIi64" ms\n", max_advance/SCALE_MS);
2466 } else {
2467 cpu_fprintf(f, "Max guest delay NA\n");
2468 cpu_fprintf(f, "Max guest advance NA\n");
2469 }
2470}