/*
 * QEMU System Emulator
 *
 * Copyright (c) 2003-2008 Fabrice Bellard
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */

#include "qemu/osdep.h"
#include "qemu/config-file.h"
#include "cpu.h"
#include "monitor/monitor.h"
#include "qapi/error.h"
#include "qapi/qapi-commands-misc.h"
#include "qapi/qapi-events-run-state.h"
#include "qapi/qmp/qerror.h"
#include "qemu/error-report.h"
#include "qemu/qemu-print.h"
#include "sysemu/sysemu.h"
#include "sysemu/tcg.h"
#include "sysemu/block-backend.h"
#include "exec/gdbstub.h"
#include "sysemu/dma.h"
#include "sysemu/hw_accel.h"
#include "sysemu/kvm.h"
#include "sysemu/hax.h"
#include "sysemu/hvf.h"
#include "sysemu/whpx.h"
#include "exec/exec-all.h"

#include "qemu/thread.h"
#include "sysemu/cpus.h"
#include "sysemu/qtest.h"
#include "qemu/main-loop.h"
#include "qemu/option.h"
#include "qemu/bitmap.h"
#include "qemu/seqlock.h"
#include "qemu/guest-random.h"
#include "tcg.h"
#include "hw/nmi.h"
#include "sysemu/replay.h"
#include "hw/boards.h"

#ifdef CONFIG_LINUX

#include <sys/prctl.h>

#ifndef PR_MCE_KILL
#define PR_MCE_KILL 33
#endif

#ifndef PR_MCE_KILL_SET
#define PR_MCE_KILL_SET 1
#endif

#ifndef PR_MCE_KILL_EARLY
#define PR_MCE_KILL_EARLY 1
#endif

#endif /* CONFIG_LINUX */

int64_t max_delay;
int64_t max_advance;

/* vcpu throttling controls */
static QEMUTimer *throttle_timer;
static unsigned int throttle_percentage;

#define CPU_THROTTLE_PCT_MIN 1
#define CPU_THROTTLE_PCT_MAX 99
#define CPU_THROTTLE_TIMESLICE_NS 10000000

bool cpu_is_stopped(CPUState *cpu)
{
    return cpu->stopped || !runstate_is_running();
}

static bool cpu_thread_is_idle(CPUState *cpu)
{
    if (cpu->stop || cpu->queued_work_first) {
        return false;
    }
    if (cpu_is_stopped(cpu)) {
        return true;
    }
    if (!cpu->halted || cpu_has_work(cpu) ||
        kvm_halt_in_kernel()) {
        return false;
    }
    return true;
}

static bool all_cpu_threads_idle(void)
{
    CPUState *cpu;

    CPU_FOREACH(cpu) {
        if (!cpu_thread_is_idle(cpu)) {
            return false;
        }
    }
    return true;
}

/***********************************************************/
/* guest cycle counter */

/* Protected by TimersState seqlock */

static bool icount_sleep = true;
/* Arbitrarily pick 1MIPS as the minimum allowable speed.  */
#define MAX_ICOUNT_SHIFT 10

typedef struct TimersState {
    /* Protected by BQL.  */
    int64_t cpu_ticks_prev;
    int64_t cpu_ticks_offset;

    /* Protect fields that can be respectively read outside the
     * BQL, and written from multiple threads.
     */
    QemuSeqLock vm_clock_seqlock;
    QemuSpin vm_clock_lock;

    int16_t cpu_ticks_enabled;

    /* Conversion factor from emulated instructions to virtual clock ticks.  */
    int16_t icount_time_shift;

    /* Compensate for varying guest execution speed.  */
    int64_t qemu_icount_bias;

    int64_t vm_clock_warp_start;
    int64_t cpu_clock_offset;

    /* Only written by TCG thread */
    int64_t qemu_icount;

    /* for adjusting icount */
    QEMUTimer *icount_rt_timer;
    QEMUTimer *icount_vm_timer;
    QEMUTimer *icount_warp_timer;
} TimersState;

static TimersState timers_state;
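
/*
 * Locking discipline for TimersState, as used throughout this file:
 * the fields above vm_clock_seqlock are only touched under the BQL,
 * while the cross-thread fields are read with a seqlock retry loop:
 *
 *     do {
 *         start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
 *         ... read fields ...
 *     } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
 *
 * Writers take both halves with seqlock_write_lock(&vm_clock_seqlock,
 * &vm_clock_lock), so concurrent writers serialize on the spinlock and
 * readers retry while a write is in flight.
 */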
bool mttcg_enabled;

/*
 * We default to false if we know other options have been enabled
 * which are currently incompatible with MTTCG. Otherwise when each
 * guest (target) has been updated to support:
 *   - atomic instructions
 *   - memory ordering primitives (barriers)
 * they can set the appropriate CONFIG flags in ${target}-softmmu.mak
 *
 * Once a guest architecture has been converted to the new primitives
 * there are two remaining limitations to check.
 *
 * - The guest can't be oversized (e.g. 64 bit guest on 32 bit host)
 * - The host must have a stronger memory order than the guest
 *
 * It may be possible in future to support strong guests on weak hosts
 * but that will require tagging all load/stores in a guest with their
 * implicit memory order requirements which would likely slow things
 * down a lot.
 */

static bool check_tcg_memory_orders_compatible(void)
{
#if defined(TCG_GUEST_DEFAULT_MO) && defined(TCG_TARGET_DEFAULT_MO)
    return (TCG_GUEST_DEFAULT_MO & ~TCG_TARGET_DEFAULT_MO) == 0;
#else
    return false;
#endif
}
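
/*
 * TCG_GUEST_DEFAULT_MO and TCG_TARGET_DEFAULT_MO are bitmasks of the
 * memory-ordering guarantees the guest expects and the host provides.
 * The expression above passes only when every ordering bit the guest
 * relies on is also present in the host mask, i.e. the guest mask is a
 * subset of the host's.
 */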

static bool default_mttcg_enabled(void)
{
    if (use_icount || TCG_OVERSIZED_GUEST) {
        return false;
    } else {
#ifdef TARGET_SUPPORTS_MTTCG
        return check_tcg_memory_orders_compatible();
#else
        return false;
#endif
    }
}

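/*
 * qemu_tcg_configure() below consumes the "thread" suboption of the
 * accelerator options; a typical invocation would be, e.g.:
 *
 *     qemu-system-x86_64 -accel tcg,thread=multi ...
 *
 * When thread= is omitted, default_mttcg_enabled() above picks the mode.
 */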
void qemu_tcg_configure(QemuOpts *opts, Error **errp)
{
    const char *t = qemu_opt_get(opts, "thread");
    if (t) {
        if (strcmp(t, "multi") == 0) {
            if (TCG_OVERSIZED_GUEST) {
                error_setg(errp, "No MTTCG when guest word size > hosts");
            } else if (use_icount) {
                error_setg(errp, "No MTTCG when icount is enabled");
            } else {
#ifndef TARGET_SUPPORTS_MTTCG
                warn_report("Guest not yet converted to MTTCG - "
                            "you may get unexpected results");
#endif
                if (!check_tcg_memory_orders_compatible()) {
                    warn_report("Guest expects a stronger memory ordering "
                                "than the host provides");
                    error_printf("This may cause strange/hard to debug errors\n");
                }
                mttcg_enabled = true;
            }
        } else if (strcmp(t, "single") == 0) {
            mttcg_enabled = false;
        } else {
            error_setg(errp, "Invalid 'thread' setting %s", t);
        }
    } else {
        mttcg_enabled = default_mttcg_enabled();
    }
}

/* The current number of executed instructions is based on what we
 * originally budgeted minus the current state of the decrementing
 * icount counters in extra/u16.low.
 */
static int64_t cpu_get_icount_executed(CPUState *cpu)
{
    return (cpu->icount_budget -
            (cpu_neg(cpu)->icount_decr.u16.low + cpu->icount_extra));
}

/*
 * Update the global shared timer_state.qemu_icount to take into
 * account executed instructions. This is done by the TCG vCPU
 * thread so the main-loop can see time has moved forward.
 */
static void cpu_update_icount_locked(CPUState *cpu)
{
    int64_t executed = cpu_get_icount_executed(cpu);
    cpu->icount_budget -= executed;

    atomic_set_i64(&timers_state.qemu_icount,
                   timers_state.qemu_icount + executed);
}

/*
 * Update the global shared timer_state.qemu_icount to take into
 * account executed instructions. This is done by the TCG vCPU
 * thread so the main-loop can see time has moved forward.
 */
void cpu_update_icount(CPUState *cpu)
{
    seqlock_write_lock(&timers_state.vm_clock_seqlock,
                       &timers_state.vm_clock_lock);
    cpu_update_icount_locked(cpu);
    seqlock_write_unlock(&timers_state.vm_clock_seqlock,
                         &timers_state.vm_clock_lock);
}

static int64_t cpu_get_icount_raw_locked(void)
{
    CPUState *cpu = current_cpu;

    if (cpu && cpu->running) {
        if (!cpu->can_do_io) {
            error_report("Bad icount read");
            exit(1);
        }
        /* Take into account what has run */
        cpu_update_icount_locked(cpu);
    }
    /* The read is protected by the seqlock, but needs atomic64 to avoid UB */
    return atomic_read_i64(&timers_state.qemu_icount);
}

static int64_t cpu_get_icount_locked(void)
{
    int64_t icount = cpu_get_icount_raw_locked();
    return atomic_read_i64(&timers_state.qemu_icount_bias) +
           cpu_icount_to_ns(icount);
}

int64_t cpu_get_icount_raw(void)
{
    int64_t icount;
    unsigned start;

    do {
        start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
        icount = cpu_get_icount_raw_locked();
    } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));

    return icount;
}

/* Return the virtual CPU time, based on the instruction counter.  */
int64_t cpu_get_icount(void)
{
    int64_t icount;
    unsigned start;

    do {
        start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
        icount = cpu_get_icount_locked();
    } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));

    return icount;
}

int64_t cpu_icount_to_ns(int64_t icount)
{
    return icount << atomic_read(&timers_state.icount_time_shift);
}
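
/*
 * With the default icount_time_shift of 3 (set in configure_icount()
 * below), every emulated instruction is credited 2^3 = 8 ns of virtual
 * time, i.e. the guest appears to run at 125 MIPS; "-icount shift=0"
 * would credit 1 ns per instruction (1000 MIPS).
 */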

static int64_t cpu_get_ticks_locked(void)
{
    int64_t ticks = timers_state.cpu_ticks_offset;
    if (timers_state.cpu_ticks_enabled) {
        ticks += cpu_get_host_ticks();
    }

    if (timers_state.cpu_ticks_prev > ticks) {
        /* Non increasing ticks may happen if the host uses software suspend.  */
        timers_state.cpu_ticks_offset += timers_state.cpu_ticks_prev - ticks;
        ticks = timers_state.cpu_ticks_prev;
    }

    timers_state.cpu_ticks_prev = ticks;
    return ticks;
}

/* return the time elapsed in VM between vm_start and vm_stop.  Unless
 * icount is active, cpu_get_ticks() uses units of the host CPU cycle
 * counter.
 */
int64_t cpu_get_ticks(void)
{
    int64_t ticks;

    if (use_icount) {
        return cpu_get_icount();
    }

    qemu_spin_lock(&timers_state.vm_clock_lock);
    ticks = cpu_get_ticks_locked();
    qemu_spin_unlock(&timers_state.vm_clock_lock);
    return ticks;
}

static int64_t cpu_get_clock_locked(void)
{
    int64_t time;

    time = timers_state.cpu_clock_offset;
    if (timers_state.cpu_ticks_enabled) {
        time += get_clock();
    }

    return time;
}

/* Return the monotonic time elapsed in VM, i.e.,
 * the time between vm_start and vm_stop
 */
int64_t cpu_get_clock(void)
{
    int64_t ti;
    unsigned start;

    do {
        start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
        ti = cpu_get_clock_locked();
    } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));

    return ti;
}

/* enable cpu_get_ticks()
 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
 */
void cpu_enable_ticks(void)
{
    seqlock_write_lock(&timers_state.vm_clock_seqlock,
                       &timers_state.vm_clock_lock);
    if (!timers_state.cpu_ticks_enabled) {
        timers_state.cpu_ticks_offset -= cpu_get_host_ticks();
        timers_state.cpu_clock_offset -= get_clock();
        timers_state.cpu_ticks_enabled = 1;
    }
    seqlock_write_unlock(&timers_state.vm_clock_seqlock,
                         &timers_state.vm_clock_lock);
}

/* disable cpu_get_ticks() : the clock is stopped. You must not call
 * cpu_get_ticks() after that.
 * Caller must hold BQL which serves as mutex for vm_clock_seqlock.
 */
void cpu_disable_ticks(void)
{
    seqlock_write_lock(&timers_state.vm_clock_seqlock,
                       &timers_state.vm_clock_lock);
    if (timers_state.cpu_ticks_enabled) {
        timers_state.cpu_ticks_offset += cpu_get_host_ticks();
        timers_state.cpu_clock_offset = cpu_get_clock_locked();
        timers_state.cpu_ticks_enabled = 0;
    }
    seqlock_write_unlock(&timers_state.vm_clock_seqlock,
                         &timers_state.vm_clock_lock);
}

/* Correlation between real and virtual time is always going to be
   fairly approximate, so ignore small variation.
   When the guest is idle real and virtual time will be aligned in
   the IO wait loop.  */
#define ICOUNT_WOBBLE (NANOSECONDS_PER_SECOND / 10)

static void icount_adjust(void)
{
    int64_t cur_time;
    int64_t cur_icount;
    int64_t delta;

    /* Protected by TimersState mutex.  */
    static int64_t last_delta;

    /* If the VM is not running, then do nothing.  */
    if (!runstate_is_running()) {
        return;
    }

    seqlock_write_lock(&timers_state.vm_clock_seqlock,
                       &timers_state.vm_clock_lock);
    cur_time = cpu_get_clock_locked();
    cur_icount = cpu_get_icount_locked();

    delta = cur_icount - cur_time;
    /* FIXME: This is a very crude algorithm, somewhat prone to oscillation.  */
    if (delta > 0
        && last_delta + ICOUNT_WOBBLE < delta * 2
        && timers_state.icount_time_shift > 0) {
        /* The guest is getting too far ahead.  Slow time down.  */
        atomic_set(&timers_state.icount_time_shift,
                   timers_state.icount_time_shift - 1);
    }
    if (delta < 0
        && last_delta - ICOUNT_WOBBLE > delta * 2
        && timers_state.icount_time_shift < MAX_ICOUNT_SHIFT) {
        /* The guest is getting too far behind.  Speed time up.  */
        atomic_set(&timers_state.icount_time_shift,
                   timers_state.icount_time_shift + 1);
    }
    last_delta = delta;
    atomic_set_i64(&timers_state.qemu_icount_bias,
                   cur_icount - (timers_state.qemu_icount
                                 << timers_state.icount_time_shift));
    seqlock_write_unlock(&timers_state.vm_clock_seqlock,
                         &timers_state.vm_clock_lock);
}

static void icount_adjust_rt(void *opaque)
{
    timer_mod(timers_state.icount_rt_timer,
              qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
    icount_adjust();
}

static void icount_adjust_vm(void *opaque)
{
    timer_mod(timers_state.icount_vm_timer,
              qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
              NANOSECONDS_PER_SECOND / 10);
    icount_adjust();
}

static int64_t qemu_icount_round(int64_t count)
{
    int shift = atomic_read(&timers_state.icount_time_shift);
    return (count + (1 << shift) - 1) >> shift;
}
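
/*
 * qemu_icount_round() converts a nanosecond deadline into an instruction
 * budget, rounding up: with shift = 3, a 100 ns deadline becomes
 * (100 + 7) >> 3 = 13 instructions rather than 12, so the budget always
 * covers the whole interval.
 */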

static void icount_warp_rt(void)
{
    unsigned seq;
    int64_t warp_start;

    /* The icount_warp_timer is rescheduled soon after vm_clock_warp_start
     * changes from -1 to another value, so the race here is okay.
     */
    do {
        seq = seqlock_read_begin(&timers_state.vm_clock_seqlock);
        warp_start = timers_state.vm_clock_warp_start;
    } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, seq));

    if (warp_start == -1) {
        return;
    }

    seqlock_write_lock(&timers_state.vm_clock_seqlock,
                       &timers_state.vm_clock_lock);
    if (runstate_is_running()) {
        int64_t clock = REPLAY_CLOCK_LOCKED(REPLAY_CLOCK_VIRTUAL_RT,
                                            cpu_get_clock_locked());
        int64_t warp_delta;

        warp_delta = clock - timers_state.vm_clock_warp_start;
        if (use_icount == 2) {
            /*
             * In adaptive mode, do not let QEMU_CLOCK_VIRTUAL run too
             * far ahead of real time.
             */
            int64_t cur_icount = cpu_get_icount_locked();
            int64_t delta = clock - cur_icount;
            warp_delta = MIN(warp_delta, delta);
        }
        atomic_set_i64(&timers_state.qemu_icount_bias,
                       timers_state.qemu_icount_bias + warp_delta);
    }
    timers_state.vm_clock_warp_start = -1;
    seqlock_write_unlock(&timers_state.vm_clock_seqlock,
                         &timers_state.vm_clock_lock);

    if (qemu_clock_expired(QEMU_CLOCK_VIRTUAL)) {
        qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
    }
}

static void icount_timer_cb(void *opaque)
{
    /* No need for a checkpoint because the timer already synchronizes
     * with CHECKPOINT_CLOCK_VIRTUAL_RT.
     */
    icount_warp_rt();
}

void qtest_clock_warp(int64_t dest)
{
    int64_t clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
    AioContext *aio_context;
    assert(qtest_enabled());
    aio_context = qemu_get_aio_context();
    while (clock < dest) {
        int64_t deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
        int64_t warp = qemu_soonest_timeout(dest - clock, deadline);

        seqlock_write_lock(&timers_state.vm_clock_seqlock,
                           &timers_state.vm_clock_lock);
        atomic_set_i64(&timers_state.qemu_icount_bias,
                       timers_state.qemu_icount_bias + warp);
        seqlock_write_unlock(&timers_state.vm_clock_seqlock,
                             &timers_state.vm_clock_lock);

        qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
        timerlist_run_timers(aio_context->tlg.tl[QEMU_CLOCK_VIRTUAL]);
        clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
    }
    qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
}

void qemu_start_warp_timer(void)
{
    int64_t clock;
    int64_t deadline;

    if (!use_icount) {
        return;
    }

    /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
     * do not fire, so computing the deadline does not make sense.
     */
    if (!runstate_is_running()) {
        return;
    }

    if (replay_mode != REPLAY_MODE_PLAY) {
        if (!all_cpu_threads_idle()) {
            return;
        }

        if (qtest_enabled()) {
            /* When testing, qtest commands advance icount.  */
            return;
        }

        replay_checkpoint(CHECKPOINT_CLOCK_WARP_START);
    } else {
        /* warp clock deterministically in record/replay mode */
        if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_START)) {
            /* vCPU is sleeping and warp can't be started.
               It is probably a race condition: notification sent
               to vCPU was processed in advance and vCPU went to sleep.
               Therefore we have to wake it up for doing something. */
            if (replay_has_checkpoint()) {
                qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
            }
            return;
        }
    }

    /* We want to use the earliest deadline from ALL vm_clocks */
    clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT);
    deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
    if (deadline < 0) {
        static bool notified;
        if (!icount_sleep && !notified) {
            warn_report("icount sleep disabled and no active timers");
            notified = true;
        }
        return;
    }

    if (deadline > 0) {
        /*
         * Ensure QEMU_CLOCK_VIRTUAL proceeds even when the virtual CPU goes to
         * sleep.  Otherwise, the CPU might be waiting for a future timer
         * interrupt to wake it up, but the interrupt never comes because
         * the vCPU isn't running any insns and thus doesn't advance the
         * QEMU_CLOCK_VIRTUAL.
         */
        if (!icount_sleep) {
            /*
             * We never let VCPUs sleep in no sleep icount mode.
             * If there is a pending QEMU_CLOCK_VIRTUAL timer we just advance
             * to the next QEMU_CLOCK_VIRTUAL event and notify it.
             * It is useful when we want a deterministic execution time,
             * isolated from host latencies.
             */
            seqlock_write_lock(&timers_state.vm_clock_seqlock,
                               &timers_state.vm_clock_lock);
            atomic_set_i64(&timers_state.qemu_icount_bias,
                           timers_state.qemu_icount_bias + deadline);
            seqlock_write_unlock(&timers_state.vm_clock_seqlock,
                                 &timers_state.vm_clock_lock);
            qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
        } else {
            /*
             * We do stop VCPUs and only advance QEMU_CLOCK_VIRTUAL after some
             * "real" time, (related to the time left until the next event) has
             * passed. The QEMU_CLOCK_VIRTUAL_RT clock will do this.
             * This avoids that the warps are visible externally; for example,
             * you will not be sending network packets continuously instead of
             * every 100ms.
             */
            seqlock_write_lock(&timers_state.vm_clock_seqlock,
                               &timers_state.vm_clock_lock);
            if (timers_state.vm_clock_warp_start == -1
                || timers_state.vm_clock_warp_start > clock) {
                timers_state.vm_clock_warp_start = clock;
            }
            seqlock_write_unlock(&timers_state.vm_clock_seqlock,
                                 &timers_state.vm_clock_lock);
            timer_mod_anticipate(timers_state.icount_warp_timer,
                                 clock + deadline);
        }
    } else if (deadline == 0) {
        qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
    }
}

static void qemu_account_warp_timer(void)
{
    if (!use_icount || !icount_sleep) {
        return;
    }

    /* Nothing to do if the VM is stopped: QEMU_CLOCK_VIRTUAL timers
     * do not fire, so computing the deadline does not make sense.
     */
    if (!runstate_is_running()) {
        return;
    }

    /* warp clock deterministically in record/replay mode */
    if (!replay_checkpoint(CHECKPOINT_CLOCK_WARP_ACCOUNT)) {
        return;
    }

    timer_del(timers_state.icount_warp_timer);
    icount_warp_rt();
}

static bool icount_state_needed(void *opaque)
{
    return use_icount;
}

static bool warp_timer_state_needed(void *opaque)
{
    TimersState *s = opaque;
    return s->icount_warp_timer != NULL;
}

static bool adjust_timers_state_needed(void *opaque)
{
    TimersState *s = opaque;
    return s->icount_rt_timer != NULL;
}

/*
 * Subsection for warp timer migration is optional, because the timer
 * may not be created.
 */
static const VMStateDescription icount_vmstate_warp_timer = {
    .name = "timer/icount/warp_timer",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = warp_timer_state_needed,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(vm_clock_warp_start, TimersState),
        VMSTATE_TIMER_PTR(icount_warp_timer, TimersState),
        VMSTATE_END_OF_LIST()
    }
};

static const VMStateDescription icount_vmstate_adjust_timers = {
    .name = "timer/icount/timers",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = adjust_timers_state_needed,
    .fields = (VMStateField[]) {
        VMSTATE_TIMER_PTR(icount_rt_timer, TimersState),
        VMSTATE_TIMER_PTR(icount_vm_timer, TimersState),
        VMSTATE_END_OF_LIST()
    }
};

/*
 * This is a subsection for icount migration.
 */
static const VMStateDescription icount_vmstate_timers = {
    .name = "timer/icount",
    .version_id = 1,
    .minimum_version_id = 1,
    .needed = icount_state_needed,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(qemu_icount_bias, TimersState),
        VMSTATE_INT64(qemu_icount, TimersState),
        VMSTATE_END_OF_LIST()
    },
    .subsections = (const VMStateDescription*[]) {
        &icount_vmstate_warp_timer,
        &icount_vmstate_adjust_timers,
        NULL
    }
};

static const VMStateDescription vmstate_timers = {
    .name = "timer",
    .version_id = 2,
    .minimum_version_id = 1,
    .fields = (VMStateField[]) {
        VMSTATE_INT64(cpu_ticks_offset, TimersState),
        VMSTATE_UNUSED(8),
        VMSTATE_INT64_V(cpu_clock_offset, TimersState, 2),
        VMSTATE_END_OF_LIST()
    },
    .subsections = (const VMStateDescription*[]) {
        &icount_vmstate_timers,
        NULL
    }
};

static void cpu_throttle_thread(CPUState *cpu, run_on_cpu_data opaque)
{
    double pct;
    double throttle_ratio;
    long sleeptime_ns;

    if (!cpu_throttle_get_percentage()) {
        return;
    }

    pct = (double)cpu_throttle_get_percentage() / 100;
    throttle_ratio = pct / (1 - pct);
    sleeptime_ns = (long)(throttle_ratio * CPU_THROTTLE_TIMESLICE_NS);

    qemu_mutex_unlock_iothread();
    g_usleep(sleeptime_ns / 1000); /* Convert ns to us for usleep call */
    qemu_mutex_lock_iothread();
    atomic_set(&cpu->throttle_thread_scheduled, 0);
}
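
/*
 * The sleep time above is chosen so the vCPU is idle for pct of wall-clock
 * time per throttle timeslice: at 50% throttle, pct = 0.5, throttle_ratio
 * = 1, and the thread sleeps 10 ms for every 10 ms timeslice it runs; at
 * 99% it sleeps 99 timeslices (990 ms) for each one it runs.
 */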

static void cpu_throttle_timer_tick(void *opaque)
{
    CPUState *cpu;
    double pct;

    /* Stop the timer if needed */
    if (!cpu_throttle_get_percentage()) {
        return;
    }
    CPU_FOREACH(cpu) {
        if (!atomic_xchg(&cpu->throttle_thread_scheduled, 1)) {
            async_run_on_cpu(cpu, cpu_throttle_thread,
                             RUN_ON_CPU_NULL);
        }
    }

    pct = (double)cpu_throttle_get_percentage() / 100;
    timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
                              CPU_THROTTLE_TIMESLICE_NS / (1 - pct));
}

void cpu_throttle_set(int new_throttle_pct)
{
    /* Ensure throttle percentage is within valid range */
    new_throttle_pct = MIN(new_throttle_pct, CPU_THROTTLE_PCT_MAX);
    new_throttle_pct = MAX(new_throttle_pct, CPU_THROTTLE_PCT_MIN);

    atomic_set(&throttle_percentage, new_throttle_pct);

    timer_mod(throttle_timer, qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL_RT) +
                              CPU_THROTTLE_TIMESLICE_NS);
}

void cpu_throttle_stop(void)
{
    atomic_set(&throttle_percentage, 0);
}

bool cpu_throttle_active(void)
{
    return (cpu_throttle_get_percentage() != 0);
}

int cpu_throttle_get_percentage(void)
{
    return atomic_read(&throttle_percentage);
}

void cpu_ticks_init(void)
{
    seqlock_init(&timers_state.vm_clock_seqlock);
    qemu_spin_init(&timers_state.vm_clock_lock);
    vmstate_register(NULL, 0, &vmstate_timers, &timers_state);
    throttle_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
                                  cpu_throttle_timer_tick, NULL);
}

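/*
 * Parse the "-icount" option group.  Typical invocations would be, e.g.:
 *
 *     -icount shift=7,align=on
 *     -icount shift=auto,sleep=off
 *
 * shift=N fixes the cost of an instruction at 2^N ns (use_icount == 1),
 * while shift=auto enables the self-tuning mode (use_icount == 2) driven
 * by the icount_adjust timers above.
 */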
void configure_icount(QemuOpts *opts, Error **errp)
{
    const char *option;
    char *rem_str = NULL;

    option = qemu_opt_get(opts, "shift");
    if (!option) {
        if (qemu_opt_get(opts, "align") != NULL) {
            error_setg(errp, "Please specify shift option when using align");
        }
        return;
    }

    icount_sleep = qemu_opt_get_bool(opts, "sleep", true);
    if (icount_sleep) {
        timers_state.icount_warp_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL_RT,
                                                      icount_timer_cb, NULL);
    }

    icount_align_option = qemu_opt_get_bool(opts, "align", false);

    if (icount_align_option && !icount_sleep) {
        error_setg(errp, "align=on and sleep=off are incompatible");
    }
    if (strcmp(option, "auto") != 0) {
        errno = 0;
        timers_state.icount_time_shift = strtol(option, &rem_str, 0);
        if (errno != 0 || *rem_str != '\0' || !strlen(option)) {
            error_setg(errp, "icount: Invalid shift value");
        }
        use_icount = 1;
        return;
    } else if (icount_align_option) {
        error_setg(errp, "shift=auto and align=on are incompatible");
    } else if (!icount_sleep) {
        error_setg(errp, "shift=auto and sleep=off are incompatible");
    }

    use_icount = 2;

    /* 125MIPS seems a reasonable initial guess at the guest speed.
       It will be corrected fairly quickly anyway.  */
    timers_state.icount_time_shift = 3;

    /* Have both realtime and virtual time triggers for speed adjustment.
       The realtime trigger catches emulated time passing too slowly,
       the virtual time trigger catches emulated time passing too fast.
       Realtime triggers occur even when idle, so use them less frequently
       than VM triggers.  */
    timers_state.vm_clock_warp_start = -1;
    timers_state.icount_rt_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL_RT,
                                                icount_adjust_rt, NULL);
    timer_mod(timers_state.icount_rt_timer,
              qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL_RT) + 1000);
    timers_state.icount_vm_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
                                                icount_adjust_vm, NULL);
    timer_mod(timers_state.icount_vm_timer,
              qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
              NANOSECONDS_PER_SECOND / 10);
}

/***********************************************************/
/* TCG vCPU kick timer
 *
 * The kick timer is responsible for moving single threaded vCPU
 * emulation on to the next vCPU. If more than one vCPU is running a
 * timer event will force a cpu->exit so the next vCPU can get
 * scheduled.
 *
 * The timer is removed if all vCPUs are idle and restarted again once
 * idleness is complete.
 */

static QEMUTimer *tcg_kick_vcpu_timer;
static CPUState *tcg_current_rr_cpu;

#define TCG_KICK_PERIOD (NANOSECONDS_PER_SECOND / 10)

static inline int64_t qemu_tcg_next_kick(void)
{
    return qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + TCG_KICK_PERIOD;
}

/* Kick the currently round-robin scheduled vCPU */
static void qemu_cpu_kick_rr_cpu(void)
{
    CPUState *cpu;
    do {
        cpu = atomic_mb_read(&tcg_current_rr_cpu);
        if (cpu) {
            cpu_exit(cpu);
        }
    } while (cpu != atomic_mb_read(&tcg_current_rr_cpu));
}
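
/*
 * The do/while above re-reads tcg_current_rr_cpu after kicking: if the
 * round-robin thread switched to another vCPU between the read and the
 * cpu_exit() call, the kick is retried against the new vCPU, so the
 * currently executing vCPU is never missed.
 */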

static void do_nothing(CPUState *cpu, run_on_cpu_data unused)
{
}

void qemu_timer_notify_cb(void *opaque, QEMUClockType type)
{
    if (!use_icount || type != QEMU_CLOCK_VIRTUAL) {
        qemu_notify_event();
        return;
    }

    if (qemu_in_vcpu_thread()) {
        /* A CPU is currently running; kick it back out to the
         * tcg_cpu_exec() loop so it will recalculate its
         * icount deadline immediately.
         */
        qemu_cpu_kick(current_cpu);
    } else if (first_cpu) {
        /* qemu_cpu_kick is not enough to kick a halted CPU out of
         * qemu_tcg_wait_io_event.  async_run_on_cpu, instead,
         * causes cpu_thread_is_idle to return false.  This way,
         * handle_icount_deadline can run.
         * If we have no CPUs at all for some reason, we don't
         * need to do anything.
         */
        async_run_on_cpu(first_cpu, do_nothing, RUN_ON_CPU_NULL);
    }
}

static void kick_tcg_thread(void *opaque)
{
    timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
    qemu_cpu_kick_rr_cpu();
}

static void start_tcg_kick_timer(void)
{
    assert(!mttcg_enabled);
    if (!tcg_kick_vcpu_timer && CPU_NEXT(first_cpu)) {
        tcg_kick_vcpu_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
                                           kick_tcg_thread, NULL);
    }
    if (tcg_kick_vcpu_timer && !timer_pending(tcg_kick_vcpu_timer)) {
        timer_mod(tcg_kick_vcpu_timer, qemu_tcg_next_kick());
    }
}

static void stop_tcg_kick_timer(void)
{
    assert(!mttcg_enabled);
    if (tcg_kick_vcpu_timer && timer_pending(tcg_kick_vcpu_timer)) {
        timer_del(tcg_kick_vcpu_timer);
    }
}

/***********************************************************/
void hw_error(const char *fmt, ...)
{
    va_list ap;
    CPUState *cpu;

    va_start(ap, fmt);
    fprintf(stderr, "qemu: hardware error: ");
    vfprintf(stderr, fmt, ap);
    fprintf(stderr, "\n");
    CPU_FOREACH(cpu) {
        fprintf(stderr, "CPU #%d:\n", cpu->cpu_index);
        cpu_dump_state(cpu, stderr, CPU_DUMP_FPU);
    }
    va_end(ap);
    abort();
}

void cpu_synchronize_all_states(void)
{
    CPUState *cpu;

    CPU_FOREACH(cpu) {
        cpu_synchronize_state(cpu);
        /* TODO: move to cpu_synchronize_state() */
        if (hvf_enabled()) {
            hvf_cpu_synchronize_state(cpu);
        }
    }
}

void cpu_synchronize_all_post_reset(void)
{
    CPUState *cpu;

    CPU_FOREACH(cpu) {
        cpu_synchronize_post_reset(cpu);
        /* TODO: move to cpu_synchronize_post_reset() */
        if (hvf_enabled()) {
            hvf_cpu_synchronize_post_reset(cpu);
        }
    }
}

void cpu_synchronize_all_post_init(void)
{
    CPUState *cpu;

    CPU_FOREACH(cpu) {
        cpu_synchronize_post_init(cpu);
        /* TODO: move to cpu_synchronize_post_init() */
        if (hvf_enabled()) {
            hvf_cpu_synchronize_post_init(cpu);
        }
    }
}

void cpu_synchronize_all_pre_loadvm(void)
{
    CPUState *cpu;

    CPU_FOREACH(cpu) {
        cpu_synchronize_pre_loadvm(cpu);
    }
}

static int do_vm_stop(RunState state, bool send_stop)
{
    int ret = 0;

    if (runstate_is_running()) {
        cpu_disable_ticks();
        pause_all_vcpus();
        runstate_set(state);
        vm_state_notify(0, state);
        if (send_stop) {
            qapi_event_send_stop();
        }
    }

    bdrv_drain_all();
    replay_disable_events();
    ret = bdrv_flush_all();

    return ret;
}
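
/*
 * do_vm_stop() pauses every vCPU before draining and flushing the block
 * layer, so no vCPU can submit new I/O while the final bdrv_flush_all()
 * pushes pending writes out; its return value is that of the flush.
 */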

/* Special vm_stop() variant for terminating the process.  Historically clients
 * did not expect a QMP STOP event and so we need to retain compatibility.
 */
int vm_shutdown(void)
{
    return do_vm_stop(RUN_STATE_SHUTDOWN, false);
}

static bool cpu_can_run(CPUState *cpu)
{
    if (cpu->stop) {
        return false;
    }
    if (cpu_is_stopped(cpu)) {
        return false;
    }
    return true;
}

static void cpu_handle_guest_debug(CPUState *cpu)
{
    gdb_set_stop_cpu(cpu);
    qemu_system_debug_request();
    cpu->stopped = true;
}

#ifdef CONFIG_LINUX
static void sigbus_reraise(void)
{
    sigset_t set;
    struct sigaction action;

    memset(&action, 0, sizeof(action));
    action.sa_handler = SIG_DFL;
    if (!sigaction(SIGBUS, &action, NULL)) {
        raise(SIGBUS);
        sigemptyset(&set);
        sigaddset(&set, SIGBUS);
        pthread_sigmask(SIG_UNBLOCK, &set, NULL);
    }
    perror("Failed to re-raise SIGBUS!\n");
    abort();
}

static void sigbus_handler(int n, siginfo_t *siginfo, void *ctx)
{
    if (siginfo->si_code != BUS_MCEERR_AO && siginfo->si_code != BUS_MCEERR_AR) {
        sigbus_reraise();
    }

    if (current_cpu) {
        /* Called asynchronously in VCPU thread.  */
        if (kvm_on_sigbus_vcpu(current_cpu, siginfo->si_code, siginfo->si_addr)) {
            sigbus_reraise();
        }
    } else {
        /* Called synchronously (via signalfd) in main thread.  */
        if (kvm_on_sigbus(siginfo->si_code, siginfo->si_addr)) {
            sigbus_reraise();
        }
    }
}
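
/*
 * BUS_MCEERR_AO ("action optional") and BUS_MCEERR_AR ("action required")
 * are the si_code values the kernel uses to report poisoned memory; any
 * other SIGBUS cause is re-raised fatally above.  The code and faulting
 * address are forwarded to KVM, which may inject a machine check into
 * the guest.
 */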

static void qemu_init_sigbus(void)
{
    struct sigaction action;

    memset(&action, 0, sizeof(action));
    action.sa_flags = SA_SIGINFO;
    action.sa_sigaction = sigbus_handler;
    sigaction(SIGBUS, &action, NULL);

    prctl(PR_MCE_KILL, PR_MCE_KILL_SET, PR_MCE_KILL_EARLY, 0, 0);
}
#else /* !CONFIG_LINUX */
static void qemu_init_sigbus(void)
{
}
#endif /* !CONFIG_LINUX */

static QemuMutex qemu_global_mutex;

static QemuThread io_thread;

/* cpu creation */
static QemuCond qemu_cpu_cond;
/* system init */
static QemuCond qemu_pause_cond;

void qemu_init_cpu_loop(void)
{
    qemu_init_sigbus();
    qemu_cond_init(&qemu_cpu_cond);
    qemu_cond_init(&qemu_pause_cond);
    qemu_mutex_init(&qemu_global_mutex);

    qemu_thread_get_self(&io_thread);
}

void run_on_cpu(CPUState *cpu, run_on_cpu_func func, run_on_cpu_data data)
{
    do_run_on_cpu(cpu, func, data, &qemu_global_mutex);
}

static void qemu_kvm_destroy_vcpu(CPUState *cpu)
{
    if (kvm_destroy_vcpu(cpu) < 0) {
        error_report("kvm_destroy_vcpu failed");
        exit(EXIT_FAILURE);
    }
}

static void qemu_tcg_destroy_vcpu(CPUState *cpu)
{
}

static void qemu_cpu_stop(CPUState *cpu, bool exit)
{
    g_assert(qemu_cpu_is_self(cpu));
    cpu->stop = false;
    cpu->stopped = true;
    if (exit) {
        cpu_exit(cpu);
    }
    qemu_cond_broadcast(&qemu_pause_cond);
}

static void qemu_wait_io_event_common(CPUState *cpu)
{
    atomic_mb_set(&cpu->thread_kicked, false);
    if (cpu->stop) {
        qemu_cpu_stop(cpu, false);
    }
    process_queued_cpu_work(cpu);
}

static void qemu_tcg_rr_wait_io_event(void)
{
    CPUState *cpu;

    while (all_cpu_threads_idle()) {
        stop_tcg_kick_timer();
        qemu_cond_wait(first_cpu->halt_cond, &qemu_global_mutex);
    }

    start_tcg_kick_timer();

    CPU_FOREACH(cpu) {
        qemu_wait_io_event_common(cpu);
    }
}

static void qemu_wait_io_event(CPUState *cpu)
{
    while (cpu_thread_is_idle(cpu)) {
        qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
    }

#ifdef _WIN32
    /* Eat dummy APC queued by qemu_cpu_kick_thread.  */
    if (!tcg_enabled()) {
        SleepEx(0, TRUE);
    }
#endif
    qemu_wait_io_event_common(cpu);
}

static void *qemu_kvm_cpu_thread_fn(void *arg)
{
    CPUState *cpu = arg;
    int r;

    rcu_register_thread();

    qemu_mutex_lock_iothread();
    qemu_thread_get_self(cpu->thread);
    cpu->thread_id = qemu_get_thread_id();
    cpu->can_do_io = 1;
    current_cpu = cpu;

    r = kvm_init_vcpu(cpu);
    if (r < 0) {
        error_report("kvm_init_vcpu failed: %s", strerror(-r));
        exit(1);
    }

    kvm_init_cpu_signals(cpu);

    /* signal CPU creation */
    cpu->created = true;
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_guest_random_seed_thread_part2(cpu->random_seed);

    do {
        if (cpu_can_run(cpu)) {
            r = kvm_cpu_exec(cpu);
            if (r == EXCP_DEBUG) {
                cpu_handle_guest_debug(cpu);
            }
        }
        qemu_wait_io_event(cpu);
    } while (!cpu->unplug || cpu_can_run(cpu));

    qemu_kvm_destroy_vcpu(cpu);
    cpu->created = false;
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_mutex_unlock_iothread();
    rcu_unregister_thread();
    return NULL;
}

static void *qemu_dummy_cpu_thread_fn(void *arg)
{
#ifdef _WIN32
    error_report("qtest is not supported under Windows");
    exit(1);
#else
    CPUState *cpu = arg;
    sigset_t waitset;
    int r;

    rcu_register_thread();

    qemu_mutex_lock_iothread();
    qemu_thread_get_self(cpu->thread);
    cpu->thread_id = qemu_get_thread_id();
    cpu->can_do_io = 1;
    current_cpu = cpu;

    sigemptyset(&waitset);
    sigaddset(&waitset, SIG_IPI);

    /* signal CPU creation */
    cpu->created = true;
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_guest_random_seed_thread_part2(cpu->random_seed);

    do {
        qemu_mutex_unlock_iothread();
        do {
            int sig;
            r = sigwait(&waitset, &sig);
        } while (r == -1 && (errno == EAGAIN || errno == EINTR));
        if (r == -1) {
            perror("sigwait");
            exit(1);
        }
        qemu_mutex_lock_iothread();
        qemu_wait_io_event(cpu);
    } while (!cpu->unplug);

    qemu_mutex_unlock_iothread();
    rcu_unregister_thread();
    return NULL;
#endif
}

static int64_t tcg_get_icount_limit(void)
{
    int64_t deadline;

    if (replay_mode != REPLAY_MODE_PLAY) {
        deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);

        /* Maintain prior (possibly buggy) behaviour where if no deadline
         * was set (as there is no QEMU_CLOCK_VIRTUAL timer) or it is more than
         * INT32_MAX nanoseconds ahead, we still use INT32_MAX
         * nanoseconds.
         */
        if ((deadline < 0) || (deadline > INT32_MAX)) {
            deadline = INT32_MAX;
        }

        return qemu_icount_round(deadline);
    } else {
        return replay_get_instructions();
    }
}

static void handle_icount_deadline(void)
{
    assert(qemu_in_vcpu_thread());
    if (use_icount) {
        int64_t deadline =
            qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);

        if (deadline == 0) {
            /* Wake up other AioContexts.  */
            qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
            qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
        }
    }
}

static void prepare_icount_for_run(CPUState *cpu)
{
    if (use_icount) {
        int insns_left;

        /* These should always be cleared by process_icount_data after
         * each vCPU execution. However u16.high can be raised
         * asynchronously by cpu_exit/cpu_interrupt/tcg_handle_interrupt
         */
        g_assert(cpu_neg(cpu)->icount_decr.u16.low == 0);
        g_assert(cpu->icount_extra == 0);

        cpu->icount_budget = tcg_get_icount_limit();
        insns_left = MIN(0xffff, cpu->icount_budget);
        cpu_neg(cpu)->icount_decr.u16.low = insns_left;
        cpu->icount_extra = cpu->icount_budget - insns_left;

        replay_mutex_lock();
    }
}

static void process_icount_data(CPUState *cpu)
{
    if (use_icount) {
        /* Account for executed instructions */
        cpu_update_icount(cpu);

        /* Reset the counters */
        cpu_neg(cpu)->icount_decr.u16.low = 0;
        cpu->icount_extra = 0;
        cpu->icount_budget = 0;

        replay_account_executed_instructions();

        replay_mutex_unlock();
    }
}
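
/*
 * prepare_icount_for_run() above splits the budget between the 16-bit
 * fast-path counter (icount_decr.u16.low, decremented by generated code)
 * and the spill-over in cpu->icount_extra: e.g. a budget of 100000
 * instructions becomes u16.low = 0xffff (65535) with icount_extra = 34465,
 * refilled as the low counter reaches zero.
 */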

static int tcg_cpu_exec(CPUState *cpu)
{
    int ret;
#ifdef CONFIG_PROFILER
    int64_t ti;
#endif

    assert(tcg_enabled());
#ifdef CONFIG_PROFILER
    ti = profile_getclock();
#endif
    cpu_exec_start(cpu);
    ret = cpu_exec(cpu);
    cpu_exec_end(cpu);
#ifdef CONFIG_PROFILER
    atomic_set(&tcg_ctx->prof.cpu_exec_time,
               tcg_ctx->prof.cpu_exec_time + profile_getclock() - ti);
#endif
    return ret;
}

/* Destroy any remaining vCPUs which have been unplugged and have
 * finished running
 */
static void deal_with_unplugged_cpus(void)
{
    CPUState *cpu;

    CPU_FOREACH(cpu) {
        if (cpu->unplug && !cpu_can_run(cpu)) {
            qemu_tcg_destroy_vcpu(cpu);
            cpu->created = false;
            qemu_cond_signal(&qemu_cpu_cond);
            break;
        }
    }
}

/* Single-threaded TCG
 *
 * In the single-threaded case each vCPU is simulated in turn. If
 * there is more than a single vCPU we create a simple timer to kick
 * the vCPU and ensure we don't get stuck in a tight loop in one vCPU.
 * This is done explicitly rather than relying on side-effects
 * elsewhere.
 */

static void *qemu_tcg_rr_cpu_thread_fn(void *arg)
{
    CPUState *cpu = arg;

    assert(tcg_enabled());
    rcu_register_thread();
    tcg_register_thread();

    qemu_mutex_lock_iothread();
    qemu_thread_get_self(cpu->thread);

    cpu->thread_id = qemu_get_thread_id();
    cpu->created = true;
    cpu->can_do_io = 1;
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_guest_random_seed_thread_part2(cpu->random_seed);

    /* wait for initial kick-off after machine start */
    while (first_cpu->stopped) {
        qemu_cond_wait(first_cpu->halt_cond, &qemu_global_mutex);

        /* process any pending work */
        CPU_FOREACH(cpu) {
            current_cpu = cpu;
            qemu_wait_io_event_common(cpu);
        }
    }

    start_tcg_kick_timer();

    cpu = first_cpu;

    /* process any pending work */
    cpu->exit_request = 1;

    while (1) {
        qemu_mutex_unlock_iothread();
        replay_mutex_lock();
        qemu_mutex_lock_iothread();
        /* Account partial waits to QEMU_CLOCK_VIRTUAL.  */
        qemu_account_warp_timer();

        /* Run the timers here.  This is much more efficient than
         * waking up the I/O thread and waiting for completion.
         */
        handle_icount_deadline();

        replay_mutex_unlock();

        if (!cpu) {
            cpu = first_cpu;
        }

        while (cpu && !cpu->queued_work_first && !cpu->exit_request) {

            atomic_mb_set(&tcg_current_rr_cpu, cpu);
            current_cpu = cpu;

            qemu_clock_enable(QEMU_CLOCK_VIRTUAL,
                              (cpu->singlestep_enabled & SSTEP_NOTIMER) == 0);

            if (cpu_can_run(cpu)) {
                int r;

                qemu_mutex_unlock_iothread();
                prepare_icount_for_run(cpu);

                r = tcg_cpu_exec(cpu);

                process_icount_data(cpu);
                qemu_mutex_lock_iothread();

                if (r == EXCP_DEBUG) {
                    cpu_handle_guest_debug(cpu);
                    break;
                } else if (r == EXCP_ATOMIC) {
                    qemu_mutex_unlock_iothread();
                    cpu_exec_step_atomic(cpu);
                    qemu_mutex_lock_iothread();
                    break;
                }
            } else if (cpu->stop) {
                if (cpu->unplug) {
                    cpu = CPU_NEXT(cpu);
                }
                break;
            }

            cpu = CPU_NEXT(cpu);
        } /* while (cpu && !cpu->exit_request).. */

        /* Does not need atomic_mb_set because a spurious wakeup is okay.  */
        atomic_set(&tcg_current_rr_cpu, NULL);

        if (cpu && cpu->exit_request) {
            atomic_mb_set(&cpu->exit_request, 0);
        }

        if (use_icount && all_cpu_threads_idle()) {
            /*
             * When all cpus are sleeping (e.g in WFI), to avoid a deadlock
             * in the main_loop, wake it up in order to start the warp timer.
             */
            qemu_notify_event();
        }

        qemu_tcg_rr_wait_io_event();
        deal_with_unplugged_cpus();
    }

    rcu_unregister_thread();
    return NULL;
}

static void *qemu_hax_cpu_thread_fn(void *arg)
{
    CPUState *cpu = arg;
    int r;

    rcu_register_thread();
    qemu_mutex_lock_iothread();
    qemu_thread_get_self(cpu->thread);

    cpu->thread_id = qemu_get_thread_id();
    cpu->created = true;
    cpu->halted = 0;
    current_cpu = cpu;

    hax_init_vcpu(cpu);
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_guest_random_seed_thread_part2(cpu->random_seed);

    do {
        if (cpu_can_run(cpu)) {
            r = hax_smp_cpu_exec(cpu);
            if (r == EXCP_DEBUG) {
                cpu_handle_guest_debug(cpu);
            }
        }

        qemu_wait_io_event(cpu);
    } while (!cpu->unplug || cpu_can_run(cpu));
    rcu_unregister_thread();
    return NULL;
}

/* The HVF-specific vCPU thread function. This one should only run when the host
 * CPU supports the VMX "unrestricted guest" feature. */
static void *qemu_hvf_cpu_thread_fn(void *arg)
{
    CPUState *cpu = arg;

    int r;

    assert(hvf_enabled());

    rcu_register_thread();

    qemu_mutex_lock_iothread();
    qemu_thread_get_self(cpu->thread);

    cpu->thread_id = qemu_get_thread_id();
    cpu->can_do_io = 1;
    current_cpu = cpu;

    hvf_init_vcpu(cpu);

    /* signal CPU creation */
    cpu->created = true;
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_guest_random_seed_thread_part2(cpu->random_seed);

    do {
        if (cpu_can_run(cpu)) {
            r = hvf_vcpu_exec(cpu);
            if (r == EXCP_DEBUG) {
                cpu_handle_guest_debug(cpu);
            }
        }
        qemu_wait_io_event(cpu);
    } while (!cpu->unplug || cpu_can_run(cpu));

    hvf_vcpu_destroy(cpu);
    cpu->created = false;
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_mutex_unlock_iothread();
    rcu_unregister_thread();
    return NULL;
}

static void *qemu_whpx_cpu_thread_fn(void *arg)
{
    CPUState *cpu = arg;
    int r;

    rcu_register_thread();

    qemu_mutex_lock_iothread();
    qemu_thread_get_self(cpu->thread);
    cpu->thread_id = qemu_get_thread_id();
    current_cpu = cpu;

    r = whpx_init_vcpu(cpu);
    if (r < 0) {
        fprintf(stderr, "whpx_init_vcpu failed: %s\n", strerror(-r));
        exit(1);
    }

    /* signal CPU creation */
    cpu->created = true;
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_guest_random_seed_thread_part2(cpu->random_seed);

    do {
        if (cpu_can_run(cpu)) {
            r = whpx_vcpu_exec(cpu);
            if (r == EXCP_DEBUG) {
                cpu_handle_guest_debug(cpu);
            }
        }
        while (cpu_thread_is_idle(cpu)) {
            qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
        }
        qemu_wait_io_event_common(cpu);
    } while (!cpu->unplug || cpu_can_run(cpu));

    whpx_destroy_vcpu(cpu);
    cpu->created = false;
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_mutex_unlock_iothread();
    rcu_unregister_thread();
    return NULL;
}

#ifdef _WIN32
static void CALLBACK dummy_apc_func(ULONG_PTR unused)
{
}
#endif

/* Multi-threaded TCG
 *
 * In the multi-threaded case each vCPU has its own thread. The TLS
 * variable current_cpu can be used deep in the code to find the
 * current CPUState for a given thread.
 */

static void *qemu_tcg_cpu_thread_fn(void *arg)
{
    CPUState *cpu = arg;

    assert(tcg_enabled());
    g_assert(!use_icount);

    rcu_register_thread();
    tcg_register_thread();

    qemu_mutex_lock_iothread();
    qemu_thread_get_self(cpu->thread);

    cpu->thread_id = qemu_get_thread_id();
    cpu->created = true;
    cpu->can_do_io = 1;
    current_cpu = cpu;
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_guest_random_seed_thread_part2(cpu->random_seed);

    /* process any pending work */
    cpu->exit_request = 1;

    do {
        if (cpu_can_run(cpu)) {
            int r;
            qemu_mutex_unlock_iothread();
            r = tcg_cpu_exec(cpu);
            qemu_mutex_lock_iothread();
            switch (r) {
            case EXCP_DEBUG:
                cpu_handle_guest_debug(cpu);
                break;
            case EXCP_HALTED:
                /* during start-up the vCPU is reset and the thread is
                 * kicked several times. If we don't ensure we go back
                 * to sleep in the halted state we won't cleanly
                 * start-up when the vCPU is enabled.
                 *
                 * cpu->halted should ensure we sleep in wait_io_event
                 */
                g_assert(cpu->halted);
                break;
            case EXCP_ATOMIC:
                qemu_mutex_unlock_iothread();
                cpu_exec_step_atomic(cpu);
                qemu_mutex_lock_iothread();
            default:
                /* Ignore everything else? */
                break;
            }
        }

        atomic_mb_set(&cpu->exit_request, 0);
        qemu_wait_io_event(cpu);
    } while (!cpu->unplug || cpu_can_run(cpu));

    qemu_tcg_destroy_vcpu(cpu);
    cpu->created = false;
    qemu_cond_signal(&qemu_cpu_cond);
    qemu_mutex_unlock_iothread();
    rcu_unregister_thread();
    return NULL;
}

static void qemu_cpu_kick_thread(CPUState *cpu)
{
#ifndef _WIN32
    int err;

    if (cpu->thread_kicked) {
        return;
    }
    cpu->thread_kicked = true;
    err = pthread_kill(cpu->thread->thread, SIG_IPI);
    if (err && err != ESRCH) {
        fprintf(stderr, "qemu:%s: %s", __func__, strerror(err));
        exit(1);
    }
#else /* _WIN32 */
    if (!qemu_cpu_is_self(cpu)) {
        if (whpx_enabled()) {
            whpx_vcpu_kick(cpu);
        } else if (!QueueUserAPC(dummy_apc_func, cpu->hThread, 0)) {
            fprintf(stderr, "%s: QueueUserAPC failed with error %lu\n",
                    __func__, GetLastError());
            exit(1);
        }
    }
#endif
}

void qemu_cpu_kick(CPUState *cpu)
{
    qemu_cond_broadcast(cpu->halt_cond);
    if (tcg_enabled()) {
        cpu_exit(cpu);
        /* NOP unless doing single-thread RR */
        qemu_cpu_kick_rr_cpu();
    } else {
        if (hax_enabled()) {
            /*
             * FIXME: race condition with the exit_request check in
             * hax_vcpu_hax_exec
             */
            cpu->exit_request = 1;
        }
        qemu_cpu_kick_thread(cpu);
    }
}

void qemu_cpu_kick_self(void)
{
    assert(current_cpu);
    qemu_cpu_kick_thread(current_cpu);
}

bool qemu_cpu_is_self(CPUState *cpu)
{
    return qemu_thread_is_self(cpu->thread);
}

bool qemu_in_vcpu_thread(void)
{
    return current_cpu && qemu_cpu_is_self(current_cpu);
}

static __thread bool iothread_locked = false;

bool qemu_mutex_iothread_locked(void)
{
    return iothread_locked;
}

/*
 * The BQL is taken from so many places that it is worth profiling the
 * callers directly, instead of funneling them all through a single function.
 */
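/*
 * A minimal usage sketch (assuming the usual arrangement where callers
 * go through the qemu_mutex_lock_iothread() wrapper rather than calling
 * the _impl function directly):
 *
 *     if (!qemu_mutex_iothread_locked()) {
 *         qemu_mutex_lock_iothread();
 *         ... touch BQL-protected state ...
 *         qemu_mutex_unlock_iothread();
 *     }
 */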
void qemu_mutex_lock_iothread_impl(const char *file, int line)
{
    QemuMutexLockFunc bql_lock = atomic_read(&qemu_bql_mutex_lock_func);

    g_assert(!qemu_mutex_iothread_locked());
    bql_lock(&qemu_global_mutex, file, line);
    iothread_locked = true;
}

void qemu_mutex_unlock_iothread(void)
{
    g_assert(qemu_mutex_iothread_locked());
    iothread_locked = false;
    qemu_mutex_unlock(&qemu_global_mutex);
}

static bool all_vcpus_paused(void)
{
    CPUState *cpu;

    CPU_FOREACH(cpu) {
        if (!cpu->stopped) {
            return false;
        }
    }

    return true;
}

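/* Stop every vCPU and wait until all of them have acknowledged the
 * stop.  Called with the BQL held.  A typical caller pairs it with
 * resume_all_vcpus(), e.g. (sketch):
 *
 *     pause_all_vcpus();
 *     ... modify state that must not race with running vCPUs ...
 *     resume_all_vcpus();
 */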
void pause_all_vcpus(void)
{
    CPUState *cpu;

    qemu_clock_enable(QEMU_CLOCK_VIRTUAL, false);
    CPU_FOREACH(cpu) {
        if (qemu_cpu_is_self(cpu)) {
            qemu_cpu_stop(cpu, true);
        } else {
            cpu->stop = true;
            qemu_cpu_kick(cpu);
        }
    }

    /* We need to drop the replay_lock so any vCPU threads woken up
     * can finish their replay tasks
     */
    replay_mutex_unlock();

    while (!all_vcpus_paused()) {
        qemu_cond_wait(&qemu_pause_cond, &qemu_global_mutex);
        CPU_FOREACH(cpu) {
            qemu_cpu_kick(cpu);
        }
    }

    qemu_mutex_unlock_iothread();
    replay_mutex_lock();
    qemu_mutex_lock_iothread();
}

void cpu_resume(CPUState *cpu)
{
    cpu->stop = false;
    cpu->stopped = false;
    qemu_cpu_kick(cpu);
}

void resume_all_vcpus(void)
{
    CPUState *cpu;

    qemu_clock_enable(QEMU_CLOCK_VIRTUAL, true);
    CPU_FOREACH(cpu) {
        cpu_resume(cpu);
    }
}

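/* Unplug @cpu and synchronously wait for its thread to finish.  The
 * BQL is dropped across the join so the vCPU thread can take it while
 * shutting down. */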
void cpu_remove_sync(CPUState *cpu)
{
    cpu->stop = true;
    cpu->unplug = true;
    qemu_cpu_kick(cpu);
    qemu_mutex_unlock_iothread();
    qemu_thread_join(cpu->thread);
    qemu_mutex_lock_iothread();
}

/* Size of the temporary buffer used when forming a vCPU thread name */
#define VCPU_THREAD_NAME_SIZE 16

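/* With MTTCG each vCPU gets its own thread; with single-threaded
 * (round-robin) TCG the first vCPU creates the shared thread and
 * every later vCPU attaches to it. */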
static void qemu_tcg_init_vcpu(CPUState *cpu)
{
    char thread_name[VCPU_THREAD_NAME_SIZE];
    static QemuCond *single_tcg_halt_cond;
    static QemuThread *single_tcg_cpu_thread;
    static int tcg_region_inited;

    assert(tcg_enabled());
    /*
     * Initialize TCG regions once. Now is a good time, because:
     * (1) TCG's init context, prologue and target globals have been set up.
     * (2) qemu_tcg_mttcg_enabled() works now (TCG init code runs before the
     *     -accel flag is processed, so the check doesn't work then).
     */
    if (!tcg_region_inited) {
        tcg_region_inited = 1;
        tcg_region_init();
    }

    if (qemu_tcg_mttcg_enabled() || !single_tcg_cpu_thread) {
        cpu->thread = g_malloc0(sizeof(QemuThread));
        cpu->halt_cond = g_malloc0(sizeof(QemuCond));
        qemu_cond_init(cpu->halt_cond);

        if (qemu_tcg_mttcg_enabled()) {
            /* create a thread per vCPU with TCG (MTTCG) */
            parallel_cpus = true;
            snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/TCG",
                     cpu->cpu_index);

            qemu_thread_create(cpu->thread, thread_name, qemu_tcg_cpu_thread_fn,
                               cpu, QEMU_THREAD_JOINABLE);

        } else {
            /* share a single thread for all cpus with TCG */
            snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "ALL CPUs/TCG");
            qemu_thread_create(cpu->thread, thread_name,
                               qemu_tcg_rr_cpu_thread_fn,
                               cpu, QEMU_THREAD_JOINABLE);

            single_tcg_halt_cond = cpu->halt_cond;
            single_tcg_cpu_thread = cpu->thread;
        }
#ifdef _WIN32
        cpu->hThread = qemu_thread_get_handle(cpu->thread);
#endif
    } else {
        /* For non-MTTCG cases we share the thread */
        cpu->thread = single_tcg_cpu_thread;
        cpu->halt_cond = single_tcg_halt_cond;
        cpu->thread_id = first_cpu->thread_id;
        cpu->can_do_io = 1;
        cpu->created = true;
    }
}

static void qemu_hax_start_vcpu(CPUState *cpu)
{
    char thread_name[VCPU_THREAD_NAME_SIZE];

    cpu->thread = g_malloc0(sizeof(QemuThread));
    cpu->halt_cond = g_malloc0(sizeof(QemuCond));
    qemu_cond_init(cpu->halt_cond);

    snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/HAX",
             cpu->cpu_index);
    qemu_thread_create(cpu->thread, thread_name, qemu_hax_cpu_thread_fn,
                       cpu, QEMU_THREAD_JOINABLE);
#ifdef _WIN32
    cpu->hThread = qemu_thread_get_handle(cpu->thread);
#endif
}

static void qemu_kvm_start_vcpu(CPUState *cpu)
{
    char thread_name[VCPU_THREAD_NAME_SIZE];

    cpu->thread = g_malloc0(sizeof(QemuThread));
    cpu->halt_cond = g_malloc0(sizeof(QemuCond));
    qemu_cond_init(cpu->halt_cond);
    snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/KVM",
             cpu->cpu_index);
    qemu_thread_create(cpu->thread, thread_name, qemu_kvm_cpu_thread_fn,
                       cpu, QEMU_THREAD_JOINABLE);
}

static void qemu_hvf_start_vcpu(CPUState *cpu)
{
    char thread_name[VCPU_THREAD_NAME_SIZE];

    /* HVF currently does not support TCG, and only runs in
     * unrestricted-guest mode. */
    assert(hvf_enabled());

    cpu->thread = g_malloc0(sizeof(QemuThread));
    cpu->halt_cond = g_malloc0(sizeof(QemuCond));
    qemu_cond_init(cpu->halt_cond);

    snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/HVF",
             cpu->cpu_index);
    qemu_thread_create(cpu->thread, thread_name, qemu_hvf_cpu_thread_fn,
                       cpu, QEMU_THREAD_JOINABLE);
}

static void qemu_whpx_start_vcpu(CPUState *cpu)
{
    char thread_name[VCPU_THREAD_NAME_SIZE];

    cpu->thread = g_malloc0(sizeof(QemuThread));
    cpu->halt_cond = g_malloc0(sizeof(QemuCond));
    qemu_cond_init(cpu->halt_cond);
    snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/WHPX",
             cpu->cpu_index);
    qemu_thread_create(cpu->thread, thread_name, qemu_whpx_cpu_thread_fn,
                       cpu, QEMU_THREAD_JOINABLE);
#ifdef _WIN32
    cpu->hThread = qemu_thread_get_handle(cpu->thread);
#endif
}

static void qemu_dummy_start_vcpu(CPUState *cpu)
{
    char thread_name[VCPU_THREAD_NAME_SIZE];

    cpu->thread = g_malloc0(sizeof(QemuThread));
    cpu->halt_cond = g_malloc0(sizeof(QemuCond));
    qemu_cond_init(cpu->halt_cond);
    snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/DUMMY",
             cpu->cpu_index);
    qemu_thread_create(cpu->thread, thread_name, qemu_dummy_cpu_thread_fn, cpu,
                       QEMU_THREAD_JOINABLE);
}

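/* Create the execution thread for @cpu with the configured
 * accelerator, then block on qemu_cpu_cond until the new thread
 * signals that the vCPU has been created. */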
void qemu_init_vcpu(CPUState *cpu)
{
    cpu->nr_cores = smp_cores;
    cpu->nr_threads = smp_threads;
    cpu->stopped = true;
    cpu->random_seed = qemu_guest_random_seed_thread_part1();

    if (!cpu->as) {
        /* If the target cpu hasn't set up any address spaces itself,
         * give it the default one.
         */
        cpu->num_ases = 1;
        cpu_address_space_init(cpu, 0, "cpu-memory", cpu->memory);
    }

    if (kvm_enabled()) {
        qemu_kvm_start_vcpu(cpu);
    } else if (hax_enabled()) {
        qemu_hax_start_vcpu(cpu);
    } else if (hvf_enabled()) {
        qemu_hvf_start_vcpu(cpu);
    } else if (tcg_enabled()) {
        qemu_tcg_init_vcpu(cpu);
    } else if (whpx_enabled()) {
        qemu_whpx_start_vcpu(cpu);
    } else {
        qemu_dummy_start_vcpu(cpu);
    }

    while (!cpu->created) {
        qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
    }
}

void cpu_stop_current(void)
{
    if (current_cpu) {
        current_cpu->stop = true;
        cpu_exit(current_cpu);
    }
}

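/* Stop the VM.  When called from a vCPU thread this only posts a stop
 * request and halts the calling vCPU; the main loop completes the
 * transition afterwards. */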
int vm_stop(RunState state)
{
    if (qemu_in_vcpu_thread()) {
        qemu_system_vmstop_request_prepare();
        qemu_system_vmstop_request(state);
        /*
         * FIXME: should not return to device code in case
         * vm_stop() has been requested.
         */
        cpu_stop_current();
        return 0;
    }

    return do_vm_stop(state, true);
}

/**
 * Prepare for (re)starting the VM.
 * Returns -1 if the vCPUs are not to be restarted (e.g. if they are already
 * running or in case of an error condition), 0 otherwise.
 */
int vm_prepare_start(void)
{
    RunState requested;

    qemu_vmstop_requested(&requested);
    if (runstate_is_running() && requested == RUN_STATE__MAX) {
        return -1;
    }

    /* Ensure that a STOP/RESUME pair of events is emitted if a
     * vmstop request was pending.  The BLOCK_IO_ERROR event, for
     * example, is documented as always being followed by the STOP
     * event.
     */
    if (runstate_is_running()) {
        qapi_event_send_stop();
        qapi_event_send_resume();
        return -1;
    }

    /* We are sending this now, but the CPUs will be resumed shortly afterwards */
    qapi_event_send_resume();

    replay_enable_events();
    cpu_enable_ticks();
    runstate_set(RUN_STATE_RUNNING);
    vm_state_notify(1, RUN_STATE_RUNNING);
    return 0;
}

void vm_start(void)
{
    if (!vm_prepare_start()) {
        resume_all_vcpus();
    }
}

/* Does a state transition even if the VM is already stopped; the
 * current state is forgotten forever. */
int vm_stop_force_state(RunState state)
{
    if (runstate_is_running()) {
        return vm_stop(state);
    } else {
        runstate_set(state);

        bdrv_drain_all();
        /* Make sure to return an error if the flush in a previous vm_stop()
         * failed. */
        return bdrv_flush_all();
    }
}

void list_cpus(const char *optarg)
{
    /* XXX: implement xxx_cpu_list for targets that still lack it */
#if defined(cpu_list)
    cpu_list();
#endif
}

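/* QMP query-cpus: unlike the "fast" variant further down, this may
 * interrupt each vCPU thread so that its register state can be
 * synchronized from the accelerator before being reported. */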
CpuInfoList *qmp_query_cpus(Error **errp)
{
    MachineState *ms = MACHINE(qdev_get_machine());
    MachineClass *mc = MACHINE_GET_CLASS(ms);
    CpuInfoList *head = NULL, *cur_item = NULL;
    CPUState *cpu;

    CPU_FOREACH(cpu) {
        CpuInfoList *info;
#if defined(TARGET_I386)
        X86CPU *x86_cpu = X86_CPU(cpu);
        CPUX86State *env = &x86_cpu->env;
#elif defined(TARGET_PPC)
        PowerPCCPU *ppc_cpu = POWERPC_CPU(cpu);
        CPUPPCState *env = &ppc_cpu->env;
#elif defined(TARGET_SPARC)
        SPARCCPU *sparc_cpu = SPARC_CPU(cpu);
        CPUSPARCState *env = &sparc_cpu->env;
#elif defined(TARGET_RISCV)
        RISCVCPU *riscv_cpu = RISCV_CPU(cpu);
        CPURISCVState *env = &riscv_cpu->env;
#elif defined(TARGET_MIPS)
        MIPSCPU *mips_cpu = MIPS_CPU(cpu);
        CPUMIPSState *env = &mips_cpu->env;
#elif defined(TARGET_TRICORE)
        TriCoreCPU *tricore_cpu = TRICORE_CPU(cpu);
        CPUTriCoreState *env = &tricore_cpu->env;
#elif defined(TARGET_S390X)
        S390CPU *s390_cpu = S390_CPU(cpu);
        CPUS390XState *env = &s390_cpu->env;
#endif

        cpu_synchronize_state(cpu);

        info = g_malloc0(sizeof(*info));
        info->value = g_malloc0(sizeof(*info->value));
        info->value->CPU = cpu->cpu_index;
        info->value->current = (cpu == first_cpu);
        info->value->halted = cpu->halted;
        info->value->qom_path = object_get_canonical_path(OBJECT(cpu));
        info->value->thread_id = cpu->thread_id;
#if defined(TARGET_I386)
        info->value->arch = CPU_INFO_ARCH_X86;
        info->value->u.x86.pc = env->eip + env->segs[R_CS].base;
#elif defined(TARGET_PPC)
        info->value->arch = CPU_INFO_ARCH_PPC;
        info->value->u.ppc.nip = env->nip;
#elif defined(TARGET_SPARC)
        info->value->arch = CPU_INFO_ARCH_SPARC;
        info->value->u.q_sparc.pc = env->pc;
        info->value->u.q_sparc.npc = env->npc;
#elif defined(TARGET_MIPS)
        info->value->arch = CPU_INFO_ARCH_MIPS;
        info->value->u.q_mips.PC = env->active_tc.PC;
#elif defined(TARGET_TRICORE)
        info->value->arch = CPU_INFO_ARCH_TRICORE;
        info->value->u.tricore.PC = env->PC;
#elif defined(TARGET_S390X)
        info->value->arch = CPU_INFO_ARCH_S390;
        info->value->u.s390.cpu_state = env->cpu_state;
#elif defined(TARGET_RISCV)
        info->value->arch = CPU_INFO_ARCH_RISCV;
        info->value->u.riscv.pc = env->pc;
#else
        info->value->arch = CPU_INFO_ARCH_OTHER;
#endif
        info->value->has_props = !!mc->cpu_index_to_instance_props;
        if (info->value->has_props) {
            CpuInstanceProperties *props;
            props = g_malloc0(sizeof(*props));
            *props = mc->cpu_index_to_instance_props(ms, cpu->cpu_index);
            info->value->props = props;
        }

        /* XXX: waiting for the qapi to support GSList */
        if (!cur_item) {
            head = cur_item = info;
        } else {
            cur_item->next = info;
            cur_item = info;
        }
    }

    return head;
}

static CpuInfoArch sysemu_target_to_cpuinfo_arch(SysEmuTarget target)
{
    /*
     * The @SysEmuTarget -> @CpuInfoArch mapping below is based on the
     * TARGET_ARCH -> TARGET_BASE_ARCH mapping in the "configure" script.
     */
    switch (target) {
    case SYS_EMU_TARGET_I386:
    case SYS_EMU_TARGET_X86_64:
        return CPU_INFO_ARCH_X86;

    case SYS_EMU_TARGET_PPC:
    case SYS_EMU_TARGET_PPC64:
        return CPU_INFO_ARCH_PPC;

    case SYS_EMU_TARGET_SPARC:
    case SYS_EMU_TARGET_SPARC64:
        return CPU_INFO_ARCH_SPARC;

    case SYS_EMU_TARGET_MIPS:
    case SYS_EMU_TARGET_MIPSEL:
    case SYS_EMU_TARGET_MIPS64:
    case SYS_EMU_TARGET_MIPS64EL:
        return CPU_INFO_ARCH_MIPS;

    case SYS_EMU_TARGET_TRICORE:
        return CPU_INFO_ARCH_TRICORE;

    case SYS_EMU_TARGET_S390X:
        return CPU_INFO_ARCH_S390;

    case SYS_EMU_TARGET_RISCV32:
    case SYS_EMU_TARGET_RISCV64:
        return CPU_INFO_ARCH_RISCV;

    default:
        return CPU_INFO_ARCH_OTHER;
    }
}

static void cpustate_to_cpuinfo_s390(CpuInfoS390 *info, const CPUState *cpu)
{
#ifdef TARGET_S390X
    S390CPU *s390_cpu = S390_CPU(cpu);
    CPUS390XState *env = &s390_cpu->env;

    info->cpu_state = env->cpu_state;
#else
    abort();
#endif
}

/*
 * "Fast" means we NEVER interrupt vCPU threads to retrieve
 * information from KVM.
 */
CpuInfoFastList *qmp_query_cpus_fast(Error **errp)
{
    MachineState *ms = MACHINE(qdev_get_machine());
    MachineClass *mc = MACHINE_GET_CLASS(ms);
    CpuInfoFastList *head = NULL, *cur_item = NULL;
    SysEmuTarget target = qapi_enum_parse(&SysEmuTarget_lookup, TARGET_NAME,
                                          -1, &error_abort);
    CPUState *cpu;

    CPU_FOREACH(cpu) {
        CpuInfoFastList *info = g_malloc0(sizeof(*info));
        info->value = g_malloc0(sizeof(*info->value));

        info->value->cpu_index = cpu->cpu_index;
        info->value->qom_path = object_get_canonical_path(OBJECT(cpu));
        info->value->thread_id = cpu->thread_id;

        info->value->has_props = !!mc->cpu_index_to_instance_props;
        if (info->value->has_props) {
            CpuInstanceProperties *props;
            props = g_malloc0(sizeof(*props));
            *props = mc->cpu_index_to_instance_props(ms, cpu->cpu_index);
            info->value->props = props;
        }

        info->value->arch = sysemu_target_to_cpuinfo_arch(target);
        info->value->target = target;
        if (target == SYS_EMU_TARGET_S390X) {
            cpustate_to_cpuinfo_s390(&info->value->u.s390x, cpu);
        }

        if (!cur_item) {
            head = cur_item = info;
        } else {
            cur_item->next = info;
            cur_item = info;
        }
    }

    return head;
}

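/* QMP memsave: write @size bytes of guest virtual memory, as seen by
 * the CPU selected via @cpu_index, to @filename. */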
void qmp_memsave(int64_t addr, int64_t size, const char *filename,
                 bool has_cpu, int64_t cpu_index, Error **errp)
{
    FILE *f;
    uint32_t l;
    CPUState *cpu;
    uint8_t buf[1024];
    int64_t orig_addr = addr, orig_size = size;

    if (!has_cpu) {
        cpu_index = 0;
    }

    cpu = qemu_get_cpu(cpu_index);
    if (cpu == NULL) {
        error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "cpu-index",
                   "a CPU number");
        return;
    }

    f = fopen(filename, "wb");
    if (!f) {
        error_setg_file_open(errp, errno, filename);
        return;
    }

    while (size != 0) {
        l = sizeof(buf);
        if (l > size) {
            l = size;
        }
        if (cpu_memory_rw_debug(cpu, addr, buf, l, 0) != 0) {
            error_setg(errp, "Invalid addr 0x%016" PRIx64 "/size %" PRId64
                       " specified", orig_addr, orig_size);
            goto exit;
        }
        if (fwrite(buf, 1, l, f) != l) {
            error_setg(errp, QERR_IO_ERROR);
            goto exit;
        }
        addr += l;
        size -= l;
    }

exit:
    fclose(f);
}

void qmp_pmemsave(int64_t addr, int64_t size, const char *filename,
                  Error **errp)
{
    FILE *f;
    uint32_t l;
    uint8_t buf[1024];

    f = fopen(filename, "wb");
    if (!f) {
        error_setg_file_open(errp, errno, filename);
        return;
    }

    while (size != 0) {
        l = sizeof(buf);
        if (l > size) {
            l = size;
        }
        cpu_physical_memory_read(addr, buf, l);
        if (fwrite(buf, 1, l, f) != l) {
            error_setg(errp, QERR_IO_ERROR);
            goto exit;
        }
        addr += l;
        size -= l;
    }

exit:
    fclose(f);
}

void qmp_inject_nmi(Error **errp)
{
    nmi_monitor_handle(monitor_get_cpu_index(), errp);
}

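/* Print host/guest clock drift statistics; a no-op unless icount
 * mode (-icount) is in use. */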
void dump_drift_info(void)
{
    if (!use_icount) {
        return;
    }

    qemu_printf("Host - Guest clock %"PRIi64" ms\n",
                (cpu_get_clock() - cpu_get_icount()) / SCALE_MS);
    if (icount_align_option) {
        qemu_printf("Max guest delay %"PRIi64" ms\n",
                    -max_delay / SCALE_MS);
        qemu_printf("Max guest advance %"PRIi64" ms\n",
                    max_advance / SCALE_MS);
    } else {
        qemu_printf("Max guest delay NA\n");
        qemu_printf("Max guest advance NA\n");
    }
}