blob: 2a0e133d39aef03ba8bab325bde5430e443995f3 [file] [log] [blame]
Blue Swirl296af7c2010-03-29 19:23:50 +00001/*
2 * QEMU System Emulator
3 *
4 * Copyright (c) 2003-2008 Fabrice Bellard
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24
25/* Needed early for CONFIG_BSD etc. */
26#include "config-host.h"
27
Paolo Bonzini83c90892012-12-17 18:19:49 +010028#include "monitor/monitor.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020029#include "qapi/qmp/qerror.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010030#include "sysemu/sysemu.h"
Paolo Bonzini022c62c2012-12-17 18:19:49 +010031#include "exec/gdbstub.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010032#include "sysemu/dma.h"
33#include "sysemu/kvm.h"
Luiz Capitulinode0b36b2011-09-21 16:38:35 -030034#include "qmp-commands.h"
Blue Swirl296af7c2010-03-29 19:23:50 +000035
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010036#include "qemu/thread.h"
Paolo Bonzini9c17d612012-12-17 18:20:04 +010037#include "sysemu/cpus.h"
38#include "sysemu/qtest.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010039#include "qemu/main-loop.h"
40#include "qemu/bitmap.h"
Liu Ping Fancb365642013-09-25 14:20:58 +080041#include "qemu/seqlock.h"
Wenchao Xiaa4e15de2014-06-18 08:43:36 +020042#include "qapi-event.h"
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +100043#include "hw/nmi.h"
Jan Kiszka0ff0fc12011-06-23 10:15:55 +020044
45#ifndef _WIN32
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010046#include "qemu/compatfd.h"
Jan Kiszka0ff0fc12011-06-23 10:15:55 +020047#endif
Blue Swirl296af7c2010-03-29 19:23:50 +000048
#if defined(CONFIG_LINUX)

#include <sys/prctl.h>

/*
 * Fallback values for the PR_MCE_* prctl() constants, defined only when
 * <sys/prctl.h> on the build host does not already provide them.
 */
#if !defined(PR_MCE_KILL)
#define PR_MCE_KILL 33
#endif

#if !defined(PR_MCE_KILL_SET)
#define PR_MCE_KILL_SET 1
#endif

#if !defined(PR_MCE_KILL_EARLY)
#define PR_MCE_KILL_EARLY 1
#endif

#endif /* CONFIG_LINUX */
66
Andreas Färber182735e2013-05-29 22:29:20 +020067static CPUState *next_cpu;
Sebastian Tanase27498be2014-07-25 11:56:33 +020068int64_t max_delay;
69int64_t max_advance;
Blue Swirl296af7c2010-03-29 19:23:50 +000070
Tiejun Chen321bc0b2013-08-02 09:43:09 +080071bool cpu_is_stopped(CPUState *cpu)
72{
73 return cpu->stopped || !runstate_is_running();
74}
75
Andreas Färbera98ae1d2013-05-26 23:21:08 +020076static bool cpu_thread_is_idle(CPUState *cpu)
Peter Maydellac873f12012-07-19 16:52:27 +010077{
Andreas Färberc64ca812012-05-03 02:11:45 +020078 if (cpu->stop || cpu->queued_work_first) {
Peter Maydellac873f12012-07-19 16:52:27 +010079 return false;
80 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +080081 if (cpu_is_stopped(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +010082 return true;
83 }
Andreas Färber8c2e1b02013-08-25 18:53:55 +020084 if (!cpu->halted || cpu_has_work(cpu) ||
Alexander Graf215e79c2013-04-24 22:24:12 +020085 kvm_halt_in_kernel()) {
Peter Maydellac873f12012-07-19 16:52:27 +010086 return false;
87 }
88 return true;
89}
90
91static bool all_cpu_threads_idle(void)
92{
Andreas Färber182735e2013-05-29 22:29:20 +020093 CPUState *cpu;
Peter Maydellac873f12012-07-19 16:52:27 +010094
Andreas Färberbdc44642013-06-24 23:50:24 +020095 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +020096 if (!cpu_thread_is_idle(cpu)) {
Peter Maydellac873f12012-07-19 16:52:27 +010097 return false;
98 }
99 }
100 return true;
101}
102
Blue Swirl296af7c2010-03-29 19:23:50 +0000103/***********************************************************/
Paolo Bonzini946fb272011-09-12 13:57:37 +0200104/* guest cycle counter */
105
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200106/* Protected by TimersState seqlock */
107
Sebastian Tanase71468392014-07-23 11:47:50 +0200108static int64_t vm_clock_warp_start = -1;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200109/* Conversion factor from emulated instructions to virtual clock ticks. */
110static int icount_time_shift;
111/* Arbitrarily pick 1MIPS as the minimum allowable speed. */
112#define MAX_ICOUNT_SHIFT 10
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200113
Paolo Bonzini946fb272011-09-12 13:57:37 +0200114static QEMUTimer *icount_rt_timer;
115static QEMUTimer *icount_vm_timer;
116static QEMUTimer *icount_warp_timer;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200117
118typedef struct TimersState {
Liu Ping Fancb365642013-09-25 14:20:58 +0800119 /* Protected by BQL. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200120 int64_t cpu_ticks_prev;
121 int64_t cpu_ticks_offset;
Liu Ping Fancb365642013-09-25 14:20:58 +0800122
123 /* cpu_clock_offset can be read out of BQL, so protect it with
124 * this lock.
125 */
126 QemuSeqLock vm_clock_seqlock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200127 int64_t cpu_clock_offset;
128 int32_t cpu_ticks_enabled;
129 int64_t dummy;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200130
131 /* Compensate for varying guest execution speed. */
132 int64_t qemu_icount_bias;
133 /* Only written by TCG thread */
134 int64_t qemu_icount;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200135} TimersState;
136
Liu Ping Fand9cd4002013-07-21 08:43:00 +0000137static TimersState timers_state;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200138
139/* Return the virtual CPU time, based on the instruction counter. */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200140static int64_t cpu_get_icount_locked(void)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200141{
142 int64_t icount;
Andreas Färber4917cf42013-05-27 05:17:50 +0200143 CPUState *cpu = current_cpu;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200144
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200145 icount = timers_state.qemu_icount;
Andreas Färber4917cf42013-05-27 05:17:50 +0200146 if (cpu) {
Andreas Färber99df7dc2013-08-26 05:15:23 +0200147 if (!cpu_can_do_io(cpu)) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200148 fprintf(stderr, "Bad clock read\n");
149 }
Andreas Färber28ecfd72013-08-26 05:51:49 +0200150 icount -= (cpu->icount_decr.u16.low + cpu->icount_extra);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200151 }
KONRAD Frederic3f031312014-08-01 01:37:15 +0200152 return timers_state.qemu_icount_bias + cpu_icount_to_ns(icount);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200153}
154
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200155int64_t cpu_get_icount(void)
156{
157 int64_t icount;
158 unsigned start;
159
160 do {
161 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
162 icount = cpu_get_icount_locked();
163 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
164
165 return icount;
166}
167
KONRAD Frederic3f031312014-08-01 01:37:15 +0200168int64_t cpu_icount_to_ns(int64_t icount)
169{
170 return icount << icount_time_shift;
171}
172
Paolo Bonzini946fb272011-09-12 13:57:37 +0200173/* return the host CPU cycle counter and handle stop/restart */
Liu Ping Fancb365642013-09-25 14:20:58 +0800174/* Caller must hold the BQL */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200175int64_t cpu_get_ticks(void)
176{
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100177 int64_t ticks;
178
Paolo Bonzini946fb272011-09-12 13:57:37 +0200179 if (use_icount) {
180 return cpu_get_icount();
181 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100182
183 ticks = timers_state.cpu_ticks_offset;
184 if (timers_state.cpu_ticks_enabled) {
185 ticks += cpu_get_real_ticks();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200186 }
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100187
188 if (timers_state.cpu_ticks_prev > ticks) {
189 /* Note: non increasing ticks may happen if the host uses
190 software suspend */
191 timers_state.cpu_ticks_offset += timers_state.cpu_ticks_prev - ticks;
192 ticks = timers_state.cpu_ticks_prev;
193 }
194
195 timers_state.cpu_ticks_prev = ticks;
196 return ticks;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200197}
198
Liu Ping Fancb365642013-09-25 14:20:58 +0800199static int64_t cpu_get_clock_locked(void)
200{
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100201 int64_t ticks;
Liu Ping Fancb365642013-09-25 14:20:58 +0800202
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100203 ticks = timers_state.cpu_clock_offset;
204 if (timers_state.cpu_ticks_enabled) {
205 ticks += get_clock();
Liu Ping Fancb365642013-09-25 14:20:58 +0800206 }
207
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100208 return ticks;
Liu Ping Fancb365642013-09-25 14:20:58 +0800209}
210
Paolo Bonzini946fb272011-09-12 13:57:37 +0200211/* return the host CPU monotonic timer and handle stop/restart */
212int64_t cpu_get_clock(void)
213{
214 int64_t ti;
Liu Ping Fancb365642013-09-25 14:20:58 +0800215 unsigned start;
216
217 do {
218 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
219 ti = cpu_get_clock_locked();
220 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
221
222 return ti;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200223}
224
Sebastian Tanasec2aa5f82014-07-25 11:56:31 +0200225/* return the offset between the host clock and virtual CPU clock */
226int64_t cpu_get_clock_offset(void)
227{
228 int64_t ti;
229 unsigned start;
230
231 do {
232 start = seqlock_read_begin(&timers_state.vm_clock_seqlock);
233 ti = timers_state.cpu_clock_offset;
234 if (!timers_state.cpu_ticks_enabled) {
235 ti -= get_clock();
236 }
237 } while (seqlock_read_retry(&timers_state.vm_clock_seqlock, start));
238
239 return -ti;
240}
241
Liu Ping Fancb365642013-09-25 14:20:58 +0800242/* enable cpu_get_ticks()
243 * Caller must hold BQL which server as mutex for vm_clock_seqlock.
244 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200245void cpu_enable_ticks(void)
246{
Liu Ping Fancb365642013-09-25 14:20:58 +0800247 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
248 seqlock_write_lock(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200249 if (!timers_state.cpu_ticks_enabled) {
250 timers_state.cpu_ticks_offset -= cpu_get_real_ticks();
251 timers_state.cpu_clock_offset -= get_clock();
252 timers_state.cpu_ticks_enabled = 1;
253 }
Liu Ping Fancb365642013-09-25 14:20:58 +0800254 seqlock_write_unlock(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200255}
256
257/* disable cpu_get_ticks() : the clock is stopped. You must not call
Liu Ping Fancb365642013-09-25 14:20:58 +0800258 * cpu_get_ticks() after that.
259 * Caller must hold BQL which server as mutex for vm_clock_seqlock.
260 */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200261void cpu_disable_ticks(void)
262{
Liu Ping Fancb365642013-09-25 14:20:58 +0800263 /* Here, the really thing protected by seqlock is cpu_clock_offset. */
264 seqlock_write_lock(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200265 if (timers_state.cpu_ticks_enabled) {
Paolo Bonzini5f3e3102013-10-28 17:32:18 +0100266 timers_state.cpu_ticks_offset += cpu_get_real_ticks();
Liu Ping Fancb365642013-09-25 14:20:58 +0800267 timers_state.cpu_clock_offset = cpu_get_clock_locked();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200268 timers_state.cpu_ticks_enabled = 0;
269 }
Liu Ping Fancb365642013-09-25 14:20:58 +0800270 seqlock_write_unlock(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200271}
272
/*
 * The correlation between real and virtual time is always going to be
 * fairly approximate, so small variations (a tenth of the tick rate) are
 * ignored.  When the guest is idle, real and virtual time will be aligned
 * in the IO wait loop.
 */
#define ICOUNT_WOBBLE (get_ticks_per_sec() / 10)
278
279static void icount_adjust(void)
280{
281 int64_t cur_time;
282 int64_t cur_icount;
283 int64_t delta;
Paolo Bonzinia3270e12013-10-07 17:18:15 +0200284
285 /* Protected by TimersState mutex. */
Paolo Bonzini946fb272011-09-12 13:57:37 +0200286 static int64_t last_delta;
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200287
Paolo Bonzini946fb272011-09-12 13:57:37 +0200288 /* If the VM is not running, then do nothing. */
289 if (!runstate_is_running()) {
290 return;
291 }
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200292
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200293 seqlock_write_lock(&timers_state.vm_clock_seqlock);
294 cur_time = cpu_get_clock_locked();
295 cur_icount = cpu_get_icount_locked();
Paolo Bonzini468cc7c2013-10-07 17:21:51 +0200296
Paolo Bonzini946fb272011-09-12 13:57:37 +0200297 delta = cur_icount - cur_time;
298 /* FIXME: This is a very crude algorithm, somewhat prone to oscillation. */
299 if (delta > 0
300 && last_delta + ICOUNT_WOBBLE < delta * 2
301 && icount_time_shift > 0) {
302 /* The guest is getting too far ahead. Slow time down. */
303 icount_time_shift--;
304 }
305 if (delta < 0
306 && last_delta - ICOUNT_WOBBLE > delta * 2
307 && icount_time_shift < MAX_ICOUNT_SHIFT) {
308 /* The guest is getting too far behind. Speed time up. */
309 icount_time_shift++;
310 }
311 last_delta = delta;
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200312 timers_state.qemu_icount_bias = cur_icount
313 - (timers_state.qemu_icount << icount_time_shift);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200314 seqlock_write_unlock(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200315}
316
317static void icount_adjust_rt(void *opaque)
318{
Alex Bligh40daca52013-08-21 16:03:02 +0100319 timer_mod(icount_rt_timer,
320 qemu_clock_get_ms(QEMU_CLOCK_REALTIME) + 1000);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200321 icount_adjust();
322}
323
324static void icount_adjust_vm(void *opaque)
325{
Alex Bligh40daca52013-08-21 16:03:02 +0100326 timer_mod(icount_vm_timer,
327 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
328 get_ticks_per_sec() / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200329 icount_adjust();
330}
331
332static int64_t qemu_icount_round(int64_t count)
333{
334 return (count + (1 << icount_time_shift) - 1) >> icount_time_shift;
335}
336
337static void icount_warp_rt(void *opaque)
338{
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200339 /* The icount_warp_timer is rescheduled soon after vm_clock_warp_start
340 * changes from -1 to another value, so the race here is okay.
341 */
342 if (atomic_read(&vm_clock_warp_start) == -1) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200343 return;
344 }
345
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200346 seqlock_write_lock(&timers_state.vm_clock_seqlock);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200347 if (runstate_is_running()) {
Alex Bligh40daca52013-08-21 16:03:02 +0100348 int64_t clock = qemu_clock_get_ns(QEMU_CLOCK_REALTIME);
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200349 int64_t warp_delta;
350
351 warp_delta = clock - vm_clock_warp_start;
352 if (use_icount == 2) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200353 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100354 * In adaptive mode, do not let QEMU_CLOCK_VIRTUAL run too
Paolo Bonzini946fb272011-09-12 13:57:37 +0200355 * far ahead of real time.
356 */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200357 int64_t cur_time = cpu_get_clock_locked();
358 int64_t cur_icount = cpu_get_icount_locked();
Paolo Bonzini946fb272011-09-12 13:57:37 +0200359 int64_t delta = cur_time - cur_icount;
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200360 warp_delta = MIN(warp_delta, delta);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200361 }
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200362 timers_state.qemu_icount_bias += warp_delta;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200363 }
364 vm_clock_warp_start = -1;
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200365 seqlock_write_unlock(&timers_state.vm_clock_seqlock);
Paolo Bonzini8ed961d2013-10-07 17:26:07 +0200366
367 if (qemu_clock_expired(QEMU_CLOCK_VIRTUAL)) {
368 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
369 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200370}
371
Paolo Bonzini8156be52012-03-28 15:42:04 +0200372void qtest_clock_warp(int64_t dest)
373{
Alex Bligh40daca52013-08-21 16:03:02 +0100374 int64_t clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200375 assert(qtest_enabled());
376 while (clock < dest) {
Alex Bligh40daca52013-08-21 16:03:02 +0100377 int64_t deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Sergey Fedorovc9299e22014-06-10 13:10:28 +0400378 int64_t warp = qemu_soonest_timeout(dest - clock, deadline);
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200379 seqlock_write_lock(&timers_state.vm_clock_seqlock);
KONRAD Fredericc96778b2014-08-01 01:37:09 +0200380 timers_state.qemu_icount_bias += warp;
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200381 seqlock_write_unlock(&timers_state.vm_clock_seqlock);
382
Alex Bligh40daca52013-08-21 16:03:02 +0100383 qemu_clock_run_timers(QEMU_CLOCK_VIRTUAL);
384 clock = qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200385 }
Alex Bligh40daca52013-08-21 16:03:02 +0100386 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini8156be52012-03-28 15:42:04 +0200387}
388
Alex Bligh40daca52013-08-21 16:03:02 +0100389void qemu_clock_warp(QEMUClockType type)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200390{
Paolo Bonzinice78d182013-10-07 17:30:02 +0200391 int64_t clock;
Paolo Bonzini946fb272011-09-12 13:57:37 +0200392 int64_t deadline;
393
394 /*
395 * There are too many global variables to make the "warp" behavior
396 * applicable to other clocks. But a clock argument removes the
397 * need for if statements all over the place.
398 */
Alex Bligh40daca52013-08-21 16:03:02 +0100399 if (type != QEMU_CLOCK_VIRTUAL || !use_icount) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200400 return;
401 }
402
403 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100404 * If the CPUs have been sleeping, advance QEMU_CLOCK_VIRTUAL timer now.
405 * This ensures that the deadline for the timer is computed correctly below.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200406 * This also makes sure that the insn counter is synchronized before the
407 * CPU starts running, in case the CPU is woken by an event other than
Alex Bligh40daca52013-08-21 16:03:02 +0100408 * the earliest QEMU_CLOCK_VIRTUAL timer.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200409 */
410 icount_warp_rt(NULL);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200411 timer_del(icount_warp_timer);
412 if (!all_cpu_threads_idle()) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200413 return;
414 }
415
Paolo Bonzini8156be52012-03-28 15:42:04 +0200416 if (qtest_enabled()) {
417 /* When testing, qtest commands advance icount. */
418 return;
419 }
420
Alex Blighac70aaf2013-08-21 16:02:57 +0100421 /* We want to use the earliest deadline from ALL vm_clocks */
Paolo Bonzinice78d182013-10-07 17:30:02 +0200422 clock = qemu_clock_get_ns(QEMU_CLOCK_REALTIME);
Alex Bligh40daca52013-08-21 16:03:02 +0100423 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200424 if (deadline < 0) {
425 return;
Alex Blighac70aaf2013-08-21 16:02:57 +0100426 }
427
Paolo Bonzini946fb272011-09-12 13:57:37 +0200428 if (deadline > 0) {
429 /*
Alex Bligh40daca52013-08-21 16:03:02 +0100430 * Ensure QEMU_CLOCK_VIRTUAL proceeds even when the virtual CPU goes to
Paolo Bonzini946fb272011-09-12 13:57:37 +0200431 * sleep. Otherwise, the CPU might be waiting for a future timer
432 * interrupt to wake it up, but the interrupt never comes because
433 * the vCPU isn't running any insns and thus doesn't advance the
Alex Bligh40daca52013-08-21 16:03:02 +0100434 * QEMU_CLOCK_VIRTUAL.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200435 *
436 * An extreme solution for this problem would be to never let VCPUs
Alex Bligh40daca52013-08-21 16:03:02 +0100437 * sleep in icount mode if there is a pending QEMU_CLOCK_VIRTUAL
438 * timer; rather time could just advance to the next QEMU_CLOCK_VIRTUAL
439 * event. Instead, we do stop VCPUs and only advance QEMU_CLOCK_VIRTUAL
440 * after some e"real" time, (related to the time left until the next
441 * event) has passed. The QEMU_CLOCK_REALTIME timer will do this.
442 * This avoids that the warps are visible externally; for example,
443 * you will not be sending network packets continuously instead of
444 * every 100ms.
Paolo Bonzini946fb272011-09-12 13:57:37 +0200445 */
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200446 seqlock_write_lock(&timers_state.vm_clock_seqlock);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200447 if (vm_clock_warp_start == -1 || vm_clock_warp_start > clock) {
448 vm_clock_warp_start = clock;
449 }
Paolo Bonzini17a15f12013-10-03 15:17:25 +0200450 seqlock_write_unlock(&timers_state.vm_clock_seqlock);
Paolo Bonzinice78d182013-10-07 17:30:02 +0200451 timer_mod_anticipate(icount_warp_timer, clock + deadline);
Alex Blighac70aaf2013-08-21 16:02:57 +0100452 } else if (deadline == 0) {
Alex Bligh40daca52013-08-21 16:03:02 +0100453 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200454 }
455}
456
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200457static bool icount_state_needed(void *opaque)
458{
459 return use_icount;
460}
461
462/*
463 * This is a subsection for icount migration.
464 */
465static const VMStateDescription icount_vmstate_timers = {
466 .name = "timer/icount",
467 .version_id = 1,
468 .minimum_version_id = 1,
469 .fields = (VMStateField[]) {
470 VMSTATE_INT64(qemu_icount_bias, TimersState),
471 VMSTATE_INT64(qemu_icount, TimersState),
472 VMSTATE_END_OF_LIST()
473 }
474};
475
Paolo Bonzini946fb272011-09-12 13:57:37 +0200476static const VMStateDescription vmstate_timers = {
477 .name = "timer",
478 .version_id = 2,
479 .minimum_version_id = 1,
Juan Quintela35d08452014-04-16 16:01:33 +0200480 .fields = (VMStateField[]) {
Paolo Bonzini946fb272011-09-12 13:57:37 +0200481 VMSTATE_INT64(cpu_ticks_offset, TimersState),
482 VMSTATE_INT64(dummy, TimersState),
483 VMSTATE_INT64_V(cpu_clock_offset, TimersState, 2),
484 VMSTATE_END_OF_LIST()
KONRAD Fredericd09eae32014-08-01 01:37:10 +0200485 },
486 .subsections = (VMStateSubsection[]) {
487 {
488 .vmsd = &icount_vmstate_timers,
489 .needed = icount_state_needed,
490 }, {
491 /* empty */
492 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200493 }
494};
495
Pavel Dovgalyuk4603ea02014-09-01 09:34:49 +0400496void cpu_ticks_init(void)
497{
498 seqlock_init(&timers_state.vm_clock_seqlock, NULL);
499 vmstate_register(NULL, 0, &vmstate_timers, &timers_state);
500}
501
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200502void configure_icount(QemuOpts *opts, Error **errp)
Paolo Bonzini946fb272011-09-12 13:57:37 +0200503{
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200504 const char *option;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200505 char *rem_str = NULL;
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200506
Sebastian Tanase1ad95802014-07-25 11:56:28 +0200507 option = qemu_opt_get(opts, "shift");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200508 if (!option) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200509 if (qemu_opt_get(opts, "align") != NULL) {
510 error_setg(errp, "Please specify shift option when using align");
511 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200512 return;
513 }
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200514 icount_align_option = qemu_opt_get_bool(opts, "align", false);
Alex Bligh40daca52013-08-21 16:03:02 +0100515 icount_warp_timer = timer_new_ns(QEMU_CLOCK_REALTIME,
516 icount_warp_rt, NULL);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200517 if (strcmp(option, "auto") != 0) {
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200518 errno = 0;
519 icount_time_shift = strtol(option, &rem_str, 0);
520 if (errno != 0 || *rem_str != '\0' || !strlen(option)) {
521 error_setg(errp, "icount: Invalid shift value");
522 }
Paolo Bonzini946fb272011-09-12 13:57:37 +0200523 use_icount = 1;
524 return;
Sebastian Tanasea8bfac32014-07-25 11:56:29 +0200525 } else if (icount_align_option) {
526 error_setg(errp, "shift=auto and align=on are incompatible");
Paolo Bonzini946fb272011-09-12 13:57:37 +0200527 }
528
529 use_icount = 2;
530
531 /* 125MIPS seems a reasonable initial guess at the guest speed.
532 It will be corrected fairly quickly anyway. */
533 icount_time_shift = 3;
534
535 /* Have both realtime and virtual time triggers for speed adjustment.
536 The realtime trigger catches emulated time passing too slowly,
537 the virtual time trigger catches emulated time passing too fast.
538 Realtime triggers occur even when idle, so use them less frequently
539 than VM triggers. */
Alex Bligh40daca52013-08-21 16:03:02 +0100540 icount_rt_timer = timer_new_ms(QEMU_CLOCK_REALTIME,
541 icount_adjust_rt, NULL);
542 timer_mod(icount_rt_timer,
543 qemu_clock_get_ms(QEMU_CLOCK_REALTIME) + 1000);
544 icount_vm_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
545 icount_adjust_vm, NULL);
546 timer_mod(icount_vm_timer,
547 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) +
548 get_ticks_per_sec() / 10);
Paolo Bonzini946fb272011-09-12 13:57:37 +0200549}
550
551/***********************************************************/
Blue Swirl296af7c2010-03-29 19:23:50 +0000552void hw_error(const char *fmt, ...)
553{
554 va_list ap;
Andreas Färber55e5c282012-12-17 06:18:02 +0100555 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000556
557 va_start(ap, fmt);
558 fprintf(stderr, "qemu: hardware error: ");
559 vfprintf(stderr, fmt, ap);
560 fprintf(stderr, "\n");
Andreas Färberbdc44642013-06-24 23:50:24 +0200561 CPU_FOREACH(cpu) {
Andreas Färber55e5c282012-12-17 06:18:02 +0100562 fprintf(stderr, "CPU #%d:\n", cpu->cpu_index);
Andreas Färber878096e2013-05-27 01:33:50 +0200563 cpu_dump_state(cpu, stderr, fprintf, CPU_DUMP_FPU);
Blue Swirl296af7c2010-03-29 19:23:50 +0000564 }
565 va_end(ap);
566 abort();
567}
568
569void cpu_synchronize_all_states(void)
570{
Andreas Färber182735e2013-05-29 22:29:20 +0200571 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000572
Andreas Färberbdc44642013-06-24 23:50:24 +0200573 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200574 cpu_synchronize_state(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000575 }
576}
577
578void cpu_synchronize_all_post_reset(void)
579{
Andreas Färber182735e2013-05-29 22:29:20 +0200580 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000581
Andreas Färberbdc44642013-06-24 23:50:24 +0200582 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200583 cpu_synchronize_post_reset(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000584 }
585}
586
587void cpu_synchronize_all_post_init(void)
588{
Andreas Färber182735e2013-05-29 22:29:20 +0200589 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000590
Andreas Färberbdc44642013-06-24 23:50:24 +0200591 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200592 cpu_synchronize_post_init(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000593 }
594}
595
Kevin Wolf56983462013-07-05 13:49:54 +0200596static int do_vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +0000597{
Kevin Wolf56983462013-07-05 13:49:54 +0200598 int ret = 0;
599
Luiz Capitulino13548692011-07-29 15:36:43 -0300600 if (runstate_is_running()) {
Blue Swirl296af7c2010-03-29 19:23:50 +0000601 cpu_disable_ticks();
Blue Swirl296af7c2010-03-29 19:23:50 +0000602 pause_all_vcpus();
Luiz Capitulinof5bbfba2011-07-29 15:04:45 -0300603 runstate_set(state);
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -0300604 vm_state_notify(0, state);
Wenchao Xiaa4e15de2014-06-18 08:43:36 +0200605 qapi_event_send_stop(&error_abort);
Blue Swirl296af7c2010-03-29 19:23:50 +0000606 }
Kevin Wolf56983462013-07-05 13:49:54 +0200607
Kevin Wolf594a45c2013-07-18 14:52:19 +0200608 bdrv_drain_all();
609 ret = bdrv_flush_all();
610
Kevin Wolf56983462013-07-05 13:49:54 +0200611 return ret;
Blue Swirl296af7c2010-03-29 19:23:50 +0000612}
613
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200614static bool cpu_can_run(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +0000615{
Andreas Färber4fdeee72012-05-02 23:10:09 +0200616 if (cpu->stop) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200617 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100618 }
Tiejun Chen321bc0b2013-08-02 09:43:09 +0800619 if (cpu_is_stopped(cpu)) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200620 return false;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100621 }
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200622 return true;
Blue Swirl296af7c2010-03-29 19:23:50 +0000623}
624
Andreas Färber91325042013-05-27 02:07:49 +0200625static void cpu_handle_guest_debug(CPUState *cpu)
Jan Kiszka3c638d02010-06-25 16:56:56 +0200626{
Andreas Färber64f6b342013-05-27 02:06:09 +0200627 gdb_set_stop_cpu(cpu);
Jan Kiszka8cf71712011-02-07 12:19:16 +0100628 qemu_system_debug_request();
Andreas Färberf324e762012-05-02 23:26:21 +0200629 cpu->stopped = true;
Jan Kiszka3c638d02010-06-25 16:56:56 +0200630}
631
Paolo Bonzini714bd042011-03-12 17:44:06 +0100632static void cpu_signal(int sig)
633{
Andreas Färber4917cf42013-05-27 05:17:50 +0200634 if (current_cpu) {
635 cpu_exit(current_cpu);
Paolo Bonzini714bd042011-03-12 17:44:06 +0100636 }
637 exit_request = 1;
638}
Paolo Bonzini714bd042011-03-12 17:44:06 +0100639
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100640#ifdef CONFIG_LINUX
641static void sigbus_reraise(void)
642{
643 sigset_t set;
644 struct sigaction action;
645
646 memset(&action, 0, sizeof(action));
647 action.sa_handler = SIG_DFL;
648 if (!sigaction(SIGBUS, &action, NULL)) {
649 raise(SIGBUS);
650 sigemptyset(&set);
651 sigaddset(&set, SIGBUS);
652 sigprocmask(SIG_UNBLOCK, &set, NULL);
653 }
654 perror("Failed to re-raise SIGBUS!\n");
655 abort();
656}
657
658static void sigbus_handler(int n, struct qemu_signalfd_siginfo *siginfo,
659 void *ctx)
660{
661 if (kvm_on_sigbus(siginfo->ssi_code,
662 (void *)(intptr_t)siginfo->ssi_addr)) {
663 sigbus_reraise();
664 }
665}
666
667static void qemu_init_sigbus(void)
668{
669 struct sigaction action;
670
671 memset(&action, 0, sizeof(action));
672 action.sa_flags = SA_SIGINFO;
673 action.sa_sigaction = (void (*)(int, siginfo_t*, void*))sigbus_handler;
674 sigaction(SIGBUS, &action, NULL);
675
676 prctl(PR_MCE_KILL, PR_MCE_KILL_SET, PR_MCE_KILL_EARLY, 0, 0);
677}
678
Andreas Färber290adf32013-01-17 09:30:27 +0100679static void qemu_kvm_eat_signals(CPUState *cpu)
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100680{
681 struct timespec ts = { 0, 0 };
682 siginfo_t siginfo;
683 sigset_t waitset;
684 sigset_t chkset;
685 int r;
686
687 sigemptyset(&waitset);
688 sigaddset(&waitset, SIG_IPI);
689 sigaddset(&waitset, SIGBUS);
690
691 do {
692 r = sigtimedwait(&waitset, &siginfo, &ts);
693 if (r == -1 && !(errno == EAGAIN || errno == EINTR)) {
694 perror("sigtimedwait");
695 exit(1);
696 }
697
698 switch (r) {
699 case SIGBUS:
Andreas Färber290adf32013-01-17 09:30:27 +0100700 if (kvm_on_sigbus_vcpu(cpu, siginfo.si_code, siginfo.si_addr)) {
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100701 sigbus_reraise();
702 }
703 break;
704 default:
705 break;
706 }
707
708 r = sigpending(&chkset);
709 if (r == -1) {
710 perror("sigpending");
711 exit(1);
712 }
713 } while (sigismember(&chkset, SIG_IPI) || sigismember(&chkset, SIGBUS));
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100714}
715
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100716#else /* !CONFIG_LINUX */
717
/* Non-Linux build: there is no SIGBUS setup to perform. */
static void qemu_init_sigbus(void)
{
    /* intentionally empty */
}
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100721
Andreas Färber290adf32013-01-17 09:30:27 +0100722static void qemu_kvm_eat_signals(CPUState *cpu)
Jan Kiszka1ab3c6c2011-03-15 12:26:12 +0100723{
724}
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100725#endif /* !CONFIG_LINUX */
726
Blue Swirl296af7c2010-03-29 19:23:50 +0000727#ifndef _WIN32
/*
 * Do-nothing signal handler; qemu_kvm_init_cpu_signals() installs it for
 * SIG_IPI.
 */
static void dummy_signal(int sig)
{
    (void)sig;
}
731
Andreas Färber13618e02013-05-26 23:41:00 +0200732static void qemu_kvm_init_cpu_signals(CPUState *cpu)
Paolo Bonzini714bd042011-03-12 17:44:06 +0100733{
734 int r;
735 sigset_t set;
736 struct sigaction sigact;
737
738 memset(&sigact, 0, sizeof(sigact));
739 sigact.sa_handler = dummy_signal;
740 sigaction(SIG_IPI, &sigact, NULL);
741
Paolo Bonzini714bd042011-03-12 17:44:06 +0100742 pthread_sigmask(SIG_BLOCK, NULL, &set);
743 sigdelset(&set, SIG_IPI);
744 sigdelset(&set, SIGBUS);
Andreas Färber491d6e82013-05-26 23:38:10 +0200745 r = kvm_set_signal_mask(cpu, &set);
Paolo Bonzini714bd042011-03-12 17:44:06 +0100746 if (r) {
747 fprintf(stderr, "kvm_set_signal_mask: %s\n", strerror(-r));
748 exit(1);
749 }
Paolo Bonzini714bd042011-03-12 17:44:06 +0100750}
751
752static void qemu_tcg_init_cpu_signals(void)
753{
Paolo Bonzini714bd042011-03-12 17:44:06 +0100754 sigset_t set;
755 struct sigaction sigact;
756
757 memset(&sigact, 0, sizeof(sigact));
758 sigact.sa_handler = cpu_signal;
759 sigaction(SIG_IPI, &sigact, NULL);
760
761 sigemptyset(&set);
762 sigaddset(&set, SIG_IPI);
763 pthread_sigmask(SIG_UNBLOCK, &set, NULL);
Paolo Bonzini714bd042011-03-12 17:44:06 +0100764}
765
Jan Kiszka55f8d6a2011-02-01 22:15:52 +0100766#else /* _WIN32 */
Andreas Färber13618e02013-05-26 23:41:00 +0200767static void qemu_kvm_init_cpu_signals(CPUState *cpu)
Paolo Bonzini714bd042011-03-12 17:44:06 +0100768{
769 abort();
770}
771
/* Win32 build: no signal setup is performed for the TCG thread. */
static void qemu_tcg_init_cpu_signals(void)
{
    /* intentionally empty */
}
Jan Kiszka55f8d6a2011-02-01 22:15:52 +0100775#endif /* _WIN32 */
Blue Swirl296af7c2010-03-29 19:23:50 +0000776
Stefan Weilb2532d82012-09-27 07:41:42 +0200777static QemuMutex qemu_global_mutex;
Paolo Bonzini46daff12011-06-09 13:10:24 +0200778static QemuCond qemu_io_proceeded_cond;
779static bool iothread_requesting_mutex;
Blue Swirl296af7c2010-03-29 19:23:50 +0000780
781static QemuThread io_thread;
782
783static QemuThread *tcg_cpu_thread;
784static QemuCond *tcg_halt_cond;
785
Blue Swirl296af7c2010-03-29 19:23:50 +0000786/* cpu creation */
787static QemuCond qemu_cpu_cond;
788/* system init */
Blue Swirl296af7c2010-03-29 19:23:50 +0000789static QemuCond qemu_pause_cond;
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300790static QemuCond qemu_work_cond;
Blue Swirl296af7c2010-03-29 19:23:50 +0000791
Paolo Bonzinid3b12f52011-09-13 10:30:52 +0200792void qemu_init_cpu_loop(void)
Blue Swirl296af7c2010-03-29 19:23:50 +0000793{
Jan Kiszka6d9cb732011-02-01 22:15:58 +0100794 qemu_init_sigbus();
Anthony Liguoried945922011-02-08 18:18:18 +0100795 qemu_cond_init(&qemu_cpu_cond);
Anthony Liguoried945922011-02-08 18:18:18 +0100796 qemu_cond_init(&qemu_pause_cond);
797 qemu_cond_init(&qemu_work_cond);
Paolo Bonzini46daff12011-06-09 13:10:24 +0200798 qemu_cond_init(&qemu_io_proceeded_cond);
Blue Swirl296af7c2010-03-29 19:23:50 +0000799 qemu_mutex_init(&qemu_global_mutex);
Blue Swirl296af7c2010-03-29 19:23:50 +0000800
Jan Kiszkab7680cb2011-03-12 17:43:51 +0100801 qemu_thread_get_self(&io_thread);
Blue Swirl296af7c2010-03-29 19:23:50 +0000802}
803
Andreas Färberf100f0b2012-05-03 14:58:47 +0200804void run_on_cpu(CPUState *cpu, void (*func)(void *data), void *data)
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300805{
806 struct qemu_work_item wi;
807
Andreas Färber60e82572012-05-02 22:23:49 +0200808 if (qemu_cpu_is_self(cpu)) {
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300809 func(data);
810 return;
811 }
812
813 wi.func = func;
814 wi.data = data;
Chegu Vinod3c022702013-06-24 03:49:41 -0600815 wi.free = false;
Andreas Färberc64ca812012-05-03 02:11:45 +0200816 if (cpu->queued_work_first == NULL) {
817 cpu->queued_work_first = &wi;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100818 } else {
Andreas Färberc64ca812012-05-03 02:11:45 +0200819 cpu->queued_work_last->next = &wi;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100820 }
Andreas Färberc64ca812012-05-03 02:11:45 +0200821 cpu->queued_work_last = &wi;
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300822 wi.next = NULL;
823 wi.done = false;
824
Andreas Färberc08d7422012-05-03 04:34:15 +0200825 qemu_cpu_kick(cpu);
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300826 while (!wi.done) {
Andreas Färber4917cf42013-05-27 05:17:50 +0200827 CPUState *self_cpu = current_cpu;
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300828
829 qemu_cond_wait(&qemu_work_cond, &qemu_global_mutex);
Andreas Färber4917cf42013-05-27 05:17:50 +0200830 current_cpu = self_cpu;
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300831 }
832}
833
Chegu Vinod3c022702013-06-24 03:49:41 -0600834void async_run_on_cpu(CPUState *cpu, void (*func)(void *data), void *data)
835{
836 struct qemu_work_item *wi;
837
838 if (qemu_cpu_is_self(cpu)) {
839 func(data);
840 return;
841 }
842
843 wi = g_malloc0(sizeof(struct qemu_work_item));
844 wi->func = func;
845 wi->data = data;
846 wi->free = true;
847 if (cpu->queued_work_first == NULL) {
848 cpu->queued_work_first = wi;
849 } else {
850 cpu->queued_work_last->next = wi;
851 }
852 cpu->queued_work_last = wi;
853 wi->next = NULL;
854 wi->done = false;
855
856 qemu_cpu_kick(cpu);
857}
858
Andreas Färber6d45b102012-05-03 02:13:22 +0200859static void flush_queued_work(CPUState *cpu)
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300860{
861 struct qemu_work_item *wi;
862
Andreas Färberc64ca812012-05-03 02:11:45 +0200863 if (cpu->queued_work_first == NULL) {
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300864 return;
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100865 }
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300866
Andreas Färberc64ca812012-05-03 02:11:45 +0200867 while ((wi = cpu->queued_work_first)) {
868 cpu->queued_work_first = wi->next;
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300869 wi->func(wi->data);
870 wi->done = true;
Chegu Vinod3c022702013-06-24 03:49:41 -0600871 if (wi->free) {
872 g_free(wi);
873 }
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300874 }
Andreas Färberc64ca812012-05-03 02:11:45 +0200875 cpu->queued_work_last = NULL;
Marcelo Tosattie82bcec2010-05-04 09:45:22 -0300876 qemu_cond_broadcast(&qemu_work_cond);
877}
878
Andreas Färber509a0d72012-05-03 02:18:09 +0200879static void qemu_wait_io_event_common(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +0000880{
Andreas Färber4fdeee72012-05-02 23:10:09 +0200881 if (cpu->stop) {
882 cpu->stop = false;
Andreas Färberf324e762012-05-02 23:26:21 +0200883 cpu->stopped = true;
Blue Swirl296af7c2010-03-29 19:23:50 +0000884 qemu_cond_signal(&qemu_pause_cond);
885 }
Andreas Färber6d45b102012-05-03 02:13:22 +0200886 flush_queued_work(cpu);
Andreas Färber216fc9a2012-05-02 17:49:49 +0200887 cpu->thread_kicked = false;
Blue Swirl296af7c2010-03-29 19:23:50 +0000888}
889
Jan Kiszka6cabe1f2010-06-25 16:56:53 +0200890static void qemu_tcg_wait_io_event(void)
Blue Swirl296af7c2010-03-29 19:23:50 +0000891{
Andreas Färber182735e2013-05-29 22:29:20 +0200892 CPUState *cpu;
Jan Kiszka6cabe1f2010-06-25 16:56:53 +0200893
Jan Kiszka16400322011-02-09 16:29:37 +0100894 while (all_cpu_threads_idle()) {
Paolo Bonziniab33fcd2011-04-13 10:03:44 +0200895 /* Start accounting real time to the virtual clock if the CPUs
896 are idle. */
Alex Bligh40daca52013-08-21 16:03:02 +0100897 qemu_clock_warp(QEMU_CLOCK_VIRTUAL);
Paolo Bonzini9705fbb2011-03-12 17:44:00 +0100898 qemu_cond_wait(tcg_halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +0100899 }
Blue Swirl296af7c2010-03-29 19:23:50 +0000900
Paolo Bonzini46daff12011-06-09 13:10:24 +0200901 while (iothread_requesting_mutex) {
902 qemu_cond_wait(&qemu_io_proceeded_cond, &qemu_global_mutex);
903 }
Jan Kiszka6cabe1f2010-06-25 16:56:53 +0200904
Andreas Färberbdc44642013-06-24 23:50:24 +0200905 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +0200906 qemu_wait_io_event_common(cpu);
Jan Kiszka6cabe1f2010-06-25 16:56:53 +0200907 }
Blue Swirl296af7c2010-03-29 19:23:50 +0000908}
909
Andreas Färberfd529e82013-05-26 23:24:55 +0200910static void qemu_kvm_wait_io_event(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +0000911{
Andreas Färbera98ae1d2013-05-26 23:21:08 +0200912 while (cpu_thread_is_idle(cpu)) {
Andreas Färberf5c121b2012-05-03 01:22:49 +0200913 qemu_cond_wait(cpu->halt_cond, &qemu_global_mutex);
Jan Kiszka16400322011-02-09 16:29:37 +0100914 }
Blue Swirl296af7c2010-03-29 19:23:50 +0000915
Andreas Färber290adf32013-01-17 09:30:27 +0100916 qemu_kvm_eat_signals(cpu);
Andreas Färber509a0d72012-05-03 02:18:09 +0200917 qemu_wait_io_event_common(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000918}
919
Jan Kiszka7e97cd82011-02-07 12:19:12 +0100920static void *qemu_kvm_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +0000921{
Andreas Färber48a106b2013-05-27 02:20:39 +0200922 CPUState *cpu = arg;
Jan Kiszka84b49152011-02-01 22:15:50 +0100923 int r;
Blue Swirl296af7c2010-03-29 19:23:50 +0000924
Marcelo Tosatti6164e6d2010-03-23 13:37:13 -0300925 qemu_mutex_lock(&qemu_global_mutex);
Andreas Färber814e6122012-05-02 17:00:37 +0200926 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +0200927 cpu->thread_id = qemu_get_thread_id();
Andreas Färber4917cf42013-05-27 05:17:50 +0200928 current_cpu = cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +0000929
Andreas Färber504134d2012-12-17 06:38:45 +0100930 r = kvm_init_vcpu(cpu);
Jan Kiszka84b49152011-02-01 22:15:50 +0100931 if (r < 0) {
932 fprintf(stderr, "kvm_init_vcpu failed: %s\n", strerror(-r));
933 exit(1);
934 }
Blue Swirl296af7c2010-03-29 19:23:50 +0000935
Andreas Färber13618e02013-05-26 23:41:00 +0200936 qemu_kvm_init_cpu_signals(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000937
938 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +0200939 cpu->created = true;
Blue Swirl296af7c2010-03-29 19:23:50 +0000940 qemu_cond_signal(&qemu_cpu_cond);
941
Blue Swirl296af7c2010-03-29 19:23:50 +0000942 while (1) {
Andreas Färbera1fcaa72012-05-02 23:42:26 +0200943 if (cpu_can_run(cpu)) {
Andreas Färber1458c362013-05-26 23:46:55 +0200944 r = kvm_cpu_exec(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +0100945 if (r == EXCP_DEBUG) {
Andreas Färber91325042013-05-27 02:07:49 +0200946 cpu_handle_guest_debug(cpu);
Jan Kiszka83f338f2011-02-07 12:19:17 +0100947 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +0100948 }
Andreas Färberfd529e82013-05-26 23:24:55 +0200949 qemu_kvm_wait_io_event(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +0000950 }
951
952 return NULL;
953}
954
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +0200955static void *qemu_dummy_cpu_thread_fn(void *arg)
956{
957#ifdef _WIN32
958 fprintf(stderr, "qtest is not supported under Windows\n");
959 exit(1);
960#else
Andreas Färber10a90212013-05-27 02:24:35 +0200961 CPUState *cpu = arg;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +0200962 sigset_t waitset;
963 int r;
964
965 qemu_mutex_lock_iothread();
Andreas Färber814e6122012-05-02 17:00:37 +0200966 qemu_thread_get_self(cpu->thread);
Andreas Färber9f09e182012-05-03 06:59:07 +0200967 cpu->thread_id = qemu_get_thread_id();
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +0200968
969 sigemptyset(&waitset);
970 sigaddset(&waitset, SIG_IPI);
971
972 /* signal CPU creation */
Andreas Färber61a46212012-05-02 22:49:36 +0200973 cpu->created = true;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +0200974 qemu_cond_signal(&qemu_cpu_cond);
975
Andreas Färber4917cf42013-05-27 05:17:50 +0200976 current_cpu = cpu;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +0200977 while (1) {
Andreas Färber4917cf42013-05-27 05:17:50 +0200978 current_cpu = NULL;
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +0200979 qemu_mutex_unlock_iothread();
980 do {
981 int sig;
982 r = sigwait(&waitset, &sig);
983 } while (r == -1 && (errno == EAGAIN || errno == EINTR));
984 if (r == -1) {
985 perror("sigwait");
986 exit(1);
987 }
988 qemu_mutex_lock_iothread();
Andreas Färber4917cf42013-05-27 05:17:50 +0200989 current_cpu = cpu;
Andreas Färber509a0d72012-05-03 02:18:09 +0200990 qemu_wait_io_event_common(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +0200991 }
992
993 return NULL;
994#endif
995}
996
Jan Kiszkabdb7ca62011-09-26 09:40:39 +0200997static void tcg_exec_all(void);
998
Jan Kiszka7e97cd82011-02-07 12:19:12 +0100999static void *qemu_tcg_cpu_thread_fn(void *arg)
Blue Swirl296af7c2010-03-29 19:23:50 +00001000{
Andreas Färberc3586ba2012-05-03 01:41:24 +02001001 CPUState *cpu = arg;
Blue Swirl296af7c2010-03-29 19:23:50 +00001002
Jan Kiszka55f8d6a2011-02-01 22:15:52 +01001003 qemu_tcg_init_cpu_signals();
Andreas Färber814e6122012-05-02 17:00:37 +02001004 qemu_thread_get_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001005
Blue Swirl296af7c2010-03-29 19:23:50 +00001006 qemu_mutex_lock(&qemu_global_mutex);
Andreas Färber38fcbd32013-07-07 19:50:23 +02001007 CPU_FOREACH(cpu) {
1008 cpu->thread_id = qemu_get_thread_id();
1009 cpu->created = true;
1010 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001011 qemu_cond_signal(&qemu_cpu_cond);
1012
Jan Kiszkafa7d1862011-08-22 18:35:25 +02001013 /* wait for initial kick-off after machine start */
Andreas Färberbdc44642013-06-24 23:50:24 +02001014 while (QTAILQ_FIRST(&cpus)->stopped) {
Jan Kiszkafa7d1862011-08-22 18:35:25 +02001015 qemu_cond_wait(tcg_halt_cond, &qemu_global_mutex);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001016
1017 /* process any pending work */
Andreas Färberbdc44642013-06-24 23:50:24 +02001018 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001019 qemu_wait_io_event_common(cpu);
Jan Kiszka8e564b42012-02-17 18:31:15 +01001020 }
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001021 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001022
1023 while (1) {
Jan Kiszkabdb7ca62011-09-26 09:40:39 +02001024 tcg_exec_all();
Alex Blighac70aaf2013-08-21 16:02:57 +01001025
1026 if (use_icount) {
Alex Bligh40daca52013-08-21 16:03:02 +01001027 int64_t deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Alex Blighac70aaf2013-08-21 16:02:57 +01001028
1029 if (deadline == 0) {
Alex Bligh40daca52013-08-21 16:03:02 +01001030 qemu_clock_notify(QEMU_CLOCK_VIRTUAL);
Alex Blighac70aaf2013-08-21 16:02:57 +01001031 }
Paolo Bonzini3b2319a2011-04-13 10:03:43 +02001032 }
Jan Kiszka6cabe1f2010-06-25 16:56:53 +02001033 qemu_tcg_wait_io_event();
Blue Swirl296af7c2010-03-29 19:23:50 +00001034 }
1035
1036 return NULL;
1037}
1038
Andreas Färber2ff09a42012-05-03 00:23:30 +02001039static void qemu_cpu_kick_thread(CPUState *cpu)
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001040{
1041#ifndef _WIN32
1042 int err;
1043
Andreas Färber814e6122012-05-02 17:00:37 +02001044 err = pthread_kill(cpu->thread->thread, SIG_IPI);
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001045 if (err) {
1046 fprintf(stderr, "qemu:%s: %s", __func__, strerror(err));
1047 exit(1);
1048 }
1049#else /* _WIN32 */
Andreas Färber60e82572012-05-02 22:23:49 +02001050 if (!qemu_cpu_is_self(cpu)) {
Olivier Hainqueed9164a2013-04-09 18:06:53 +02001051 CONTEXT tcgContext;
1052
1053 if (SuspendThread(cpu->hThread) == (DWORD)-1) {
Stefan Weil7f1721d2013-04-13 22:45:50 +02001054 fprintf(stderr, "qemu:%s: GetLastError:%lu\n", __func__,
Olivier Hainqueed9164a2013-04-09 18:06:53 +02001055 GetLastError());
1056 exit(1);
1057 }
1058
1059 /* On multi-core systems, we are not sure that the thread is actually
1060 * suspended until we can get the context.
1061 */
1062 tcgContext.ContextFlags = CONTEXT_CONTROL;
1063 while (GetThreadContext(cpu->hThread, &tcgContext) != 0) {
1064 continue;
1065 }
1066
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001067 cpu_signal(0);
Olivier Hainqueed9164a2013-04-09 18:06:53 +02001068
1069 if (ResumeThread(cpu->hThread) == (DWORD)-1) {
Stefan Weil7f1721d2013-04-13 22:45:50 +02001070 fprintf(stderr, "qemu:%s: GetLastError:%lu\n", __func__,
Olivier Hainqueed9164a2013-04-09 18:06:53 +02001071 GetLastError());
1072 exit(1);
1073 }
Paolo Bonzinicc015e92011-03-12 17:44:08 +01001074 }
1075#endif
1076}
1077
Andreas Färberc08d7422012-05-03 04:34:15 +02001078void qemu_cpu_kick(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001079{
Andreas Färberf5c121b2012-05-03 01:22:49 +02001080 qemu_cond_broadcast(cpu->halt_cond);
Andreas Färber216fc9a2012-05-02 17:49:49 +02001081 if (!tcg_enabled() && !cpu->thread_kicked) {
Andreas Färber2ff09a42012-05-03 00:23:30 +02001082 qemu_cpu_kick_thread(cpu);
Andreas Färber216fc9a2012-05-02 17:49:49 +02001083 cpu->thread_kicked = true;
Jan Kiszkaaa2c3642011-02-01 22:15:42 +01001084 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001085}
1086
Jan Kiszka46d62fa2011-02-01 22:15:59 +01001087void qemu_cpu_kick_self(void)
1088{
Paolo Bonzinib55c22c2011-03-12 17:44:07 +01001089#ifndef _WIN32
Andreas Färber4917cf42013-05-27 05:17:50 +02001090 assert(current_cpu);
Jan Kiszka46d62fa2011-02-01 22:15:59 +01001091
Andreas Färber4917cf42013-05-27 05:17:50 +02001092 if (!current_cpu->thread_kicked) {
1093 qemu_cpu_kick_thread(current_cpu);
1094 current_cpu->thread_kicked = true;
Jan Kiszka46d62fa2011-02-01 22:15:59 +01001095 }
Paolo Bonzinib55c22c2011-03-12 17:44:07 +01001096#else
1097 abort();
1098#endif
Blue Swirl296af7c2010-03-29 19:23:50 +00001099}
1100
Andreas Färber60e82572012-05-02 22:23:49 +02001101bool qemu_cpu_is_self(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001102{
Andreas Färber814e6122012-05-02 17:00:37 +02001103 return qemu_thread_is_self(cpu->thread);
Blue Swirl296af7c2010-03-29 19:23:50 +00001104}
1105
Juan Quintelaaa723c22012-09-18 16:30:11 +02001106static bool qemu_in_vcpu_thread(void)
1107{
Andreas Färber4917cf42013-05-27 05:17:50 +02001108 return current_cpu && qemu_cpu_is_self(current_cpu);
Juan Quintelaaa723c22012-09-18 16:30:11 +02001109}
1110
Blue Swirl296af7c2010-03-29 19:23:50 +00001111void qemu_mutex_lock_iothread(void)
1112{
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001113 if (!tcg_enabled()) {
Blue Swirl296af7c2010-03-29 19:23:50 +00001114 qemu_mutex_lock(&qemu_global_mutex);
Marcelo Tosatti1a28cac2010-05-04 09:45:20 -03001115 } else {
Paolo Bonzini46daff12011-06-09 13:10:24 +02001116 iothread_requesting_mutex = true;
Marcelo Tosatti1a28cac2010-05-04 09:45:20 -03001117 if (qemu_mutex_trylock(&qemu_global_mutex)) {
Andreas Färber182735e2013-05-29 22:29:20 +02001118 qemu_cpu_kick_thread(first_cpu);
Marcelo Tosatti1a28cac2010-05-04 09:45:20 -03001119 qemu_mutex_lock(&qemu_global_mutex);
1120 }
Paolo Bonzini46daff12011-06-09 13:10:24 +02001121 iothread_requesting_mutex = false;
1122 qemu_cond_broadcast(&qemu_io_proceeded_cond);
Marcelo Tosatti1a28cac2010-05-04 09:45:20 -03001123 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001124}
1125
1126void qemu_mutex_unlock_iothread(void)
1127{
1128 qemu_mutex_unlock(&qemu_global_mutex);
1129}
1130
1131static int all_vcpus_paused(void)
1132{
Andreas Färberbdc44642013-06-24 23:50:24 +02001133 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001134
Andreas Färberbdc44642013-06-24 23:50:24 +02001135 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001136 if (!cpu->stopped) {
Blue Swirl296af7c2010-03-29 19:23:50 +00001137 return 0;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001138 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001139 }
1140
1141 return 1;
1142}
1143
1144void pause_all_vcpus(void)
1145{
Andreas Färberbdc44642013-06-24 23:50:24 +02001146 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001147
Alex Bligh40daca52013-08-21 16:03:02 +01001148 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, false);
Andreas Färberbdc44642013-06-24 23:50:24 +02001149 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001150 cpu->stop = true;
1151 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001152 }
1153
Juan Quintelaaa723c22012-09-18 16:30:11 +02001154 if (qemu_in_vcpu_thread()) {
Jan Kiszkad798e972012-02-17 18:31:16 +01001155 cpu_stop_current();
1156 if (!kvm_enabled()) {
Andreas Färberbdc44642013-06-24 23:50:24 +02001157 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001158 cpu->stop = false;
1159 cpu->stopped = true;
Jan Kiszkad798e972012-02-17 18:31:16 +01001160 }
1161 return;
1162 }
1163 }
1164
Blue Swirl296af7c2010-03-29 19:23:50 +00001165 while (!all_vcpus_paused()) {
Paolo Bonzinibe7d6c52011-03-12 17:44:02 +01001166 qemu_cond_wait(&qemu_pause_cond, &qemu_global_mutex);
Andreas Färberbdc44642013-06-24 23:50:24 +02001167 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001168 qemu_cpu_kick(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001169 }
1170 }
1171}
1172
Igor Mammedov29936832013-04-23 10:29:37 +02001173void cpu_resume(CPUState *cpu)
1174{
1175 cpu->stop = false;
1176 cpu->stopped = false;
1177 qemu_cpu_kick(cpu);
1178}
1179
Blue Swirl296af7c2010-03-29 19:23:50 +00001180void resume_all_vcpus(void)
1181{
Andreas Färberbdc44642013-06-24 23:50:24 +02001182 CPUState *cpu;
Blue Swirl296af7c2010-03-29 19:23:50 +00001183
Alex Bligh40daca52013-08-21 16:03:02 +01001184 qemu_clock_enable(QEMU_CLOCK_VIRTUAL, true);
Andreas Färberbdc44642013-06-24 23:50:24 +02001185 CPU_FOREACH(cpu) {
Andreas Färber182735e2013-05-29 22:29:20 +02001186 cpu_resume(cpu);
Blue Swirl296af7c2010-03-29 19:23:50 +00001187 }
1188}
1189
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001190/* For temporary buffers for forming a name */
1191#define VCPU_THREAD_NAME_SIZE 16
1192
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001193static void qemu_tcg_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001194{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001195 char thread_name[VCPU_THREAD_NAME_SIZE];
1196
Edgar E. Iglesias09daed82013-12-17 13:06:51 +10001197 tcg_cpu_address_space_init(cpu, cpu->as);
1198
Blue Swirl296af7c2010-03-29 19:23:50 +00001199 /* share a single thread for all cpus with TCG */
1200 if (!tcg_cpu_thread) {
Andreas Färber814e6122012-05-02 17:00:37 +02001201 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001202 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1203 qemu_cond_init(cpu->halt_cond);
1204 tcg_halt_cond = cpu->halt_cond;
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001205 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/TCG",
1206 cpu->cpu_index);
1207 qemu_thread_create(cpu->thread, thread_name, qemu_tcg_cpu_thread_fn,
1208 cpu, QEMU_THREAD_JOINABLE);
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001209#ifdef _WIN32
Andreas Färber814e6122012-05-02 17:00:37 +02001210 cpu->hThread = qemu_thread_get_handle(cpu->thread);
Paolo Bonzini1ecf47b2011-12-13 13:43:52 +01001211#endif
Andreas Färber61a46212012-05-02 22:49:36 +02001212 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001213 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001214 }
Andreas Färber814e6122012-05-02 17:00:37 +02001215 tcg_cpu_thread = cpu->thread;
Blue Swirl296af7c2010-03-29 19:23:50 +00001216 } else {
Andreas Färber814e6122012-05-02 17:00:37 +02001217 cpu->thread = tcg_cpu_thread;
Andreas Färberf5c121b2012-05-03 01:22:49 +02001218 cpu->halt_cond = tcg_halt_cond;
Blue Swirl296af7c2010-03-29 19:23:50 +00001219 }
1220}
1221
Andreas Färber48a106b2013-05-27 02:20:39 +02001222static void qemu_kvm_start_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001223{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001224 char thread_name[VCPU_THREAD_NAME_SIZE];
1225
Andreas Färber814e6122012-05-02 17:00:37 +02001226 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001227 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1228 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001229 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/KVM",
1230 cpu->cpu_index);
1231 qemu_thread_create(cpu->thread, thread_name, qemu_kvm_cpu_thread_fn,
1232 cpu, QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001233 while (!cpu->created) {
Paolo Bonzini18a85722011-03-12 17:44:03 +01001234 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001235 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001236}
1237
Andreas Färber10a90212013-05-27 02:24:35 +02001238static void qemu_dummy_start_vcpu(CPUState *cpu)
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001239{
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001240 char thread_name[VCPU_THREAD_NAME_SIZE];
1241
Andreas Färber814e6122012-05-02 17:00:37 +02001242 cpu->thread = g_malloc0(sizeof(QemuThread));
Andreas Färberf5c121b2012-05-03 01:22:49 +02001243 cpu->halt_cond = g_malloc0(sizeof(QemuCond));
1244 qemu_cond_init(cpu->halt_cond);
Dr. David Alan Gilbert49001162014-01-30 10:20:32 +00001245 snprintf(thread_name, VCPU_THREAD_NAME_SIZE, "CPU %d/DUMMY",
1246 cpu->cpu_index);
1247 qemu_thread_create(cpu->thread, thread_name, qemu_dummy_cpu_thread_fn, cpu,
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001248 QEMU_THREAD_JOINABLE);
Andreas Färber61a46212012-05-02 22:49:36 +02001249 while (!cpu->created) {
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001250 qemu_cond_wait(&qemu_cpu_cond, &qemu_global_mutex);
1251 }
1252}
1253
Andreas Färberc643bed2013-05-27 03:23:24 +02001254void qemu_init_vcpu(CPUState *cpu)
Blue Swirl296af7c2010-03-29 19:23:50 +00001255{
Andreas Färberce3960e2012-12-17 03:27:07 +01001256 cpu->nr_cores = smp_cores;
1257 cpu->nr_threads = smp_threads;
Andreas Färberf324e762012-05-02 23:26:21 +02001258 cpu->stopped = true;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001259 if (kvm_enabled()) {
Andreas Färber48a106b2013-05-27 02:20:39 +02001260 qemu_kvm_start_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001261 } else if (tcg_enabled()) {
Andreas Färbere5ab30a2012-05-03 01:50:44 +02001262 qemu_tcg_init_vcpu(cpu);
Anthony Liguoric7f0f3b2012-03-28 15:42:02 +02001263 } else {
Andreas Färber10a90212013-05-27 02:24:35 +02001264 qemu_dummy_start_vcpu(cpu);
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001265 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001266}
1267
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001268void cpu_stop_current(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001269{
Andreas Färber4917cf42013-05-27 05:17:50 +02001270 if (current_cpu) {
1271 current_cpu->stop = false;
1272 current_cpu->stopped = true;
1273 cpu_exit(current_cpu);
Paolo Bonzini67bb1722011-03-12 17:43:59 +01001274 qemu_cond_signal(&qemu_pause_cond);
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001275 }
Blue Swirl296af7c2010-03-29 19:23:50 +00001276}
1277
Kevin Wolf56983462013-07-05 13:49:54 +02001278int vm_stop(RunState state)
Blue Swirl296af7c2010-03-29 19:23:50 +00001279{
Juan Quintelaaa723c22012-09-18 16:30:11 +02001280 if (qemu_in_vcpu_thread()) {
Paolo Bonzini74892d22014-06-05 14:53:58 +02001281 qemu_system_vmstop_request_prepare();
Luiz Capitulino1dfb4dd2011-07-29 14:26:33 -03001282 qemu_system_vmstop_request(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001283 /*
1284 * FIXME: should not return to device code in case
1285 * vm_stop() has been requested.
1286 */
Jan Kiszkab4a3d962011-02-01 22:15:43 +01001287 cpu_stop_current();
Kevin Wolf56983462013-07-05 13:49:54 +02001288 return 0;
Blue Swirl296af7c2010-03-29 19:23:50 +00001289 }
Kevin Wolf56983462013-07-05 13:49:54 +02001290
1291 return do_vm_stop(state);
Blue Swirl296af7c2010-03-29 19:23:50 +00001292}
1293
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001294/* does a state transition even if the VM is already stopped,
1295 current state is forgotten forever */
Kevin Wolf56983462013-07-05 13:49:54 +02001296int vm_stop_force_state(RunState state)
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001297{
1298 if (runstate_is_running()) {
Kevin Wolf56983462013-07-05 13:49:54 +02001299 return vm_stop(state);
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001300 } else {
1301 runstate_set(state);
Kevin Wolf594a45c2013-07-18 14:52:19 +02001302 /* Make sure to return an error if the flush in a previous vm_stop()
1303 * failed. */
1304 return bdrv_flush_all();
Luiz Capitulino8a9236f2011-10-14 11:18:09 -03001305 }
1306}
1307
Andreas Färber9349b4f2012-03-14 01:38:32 +01001308static int tcg_cpu_exec(CPUArchState *env)
Blue Swirl296af7c2010-03-29 19:23:50 +00001309{
Andreas Färberefee7342013-08-26 05:39:29 +02001310 CPUState *cpu = ENV_GET_CPU(env);
Blue Swirl296af7c2010-03-29 19:23:50 +00001311 int ret;
1312#ifdef CONFIG_PROFILER
1313 int64_t ti;
1314#endif
1315
1316#ifdef CONFIG_PROFILER
1317 ti = profile_getclock();
1318#endif
1319 if (use_icount) {
1320 int64_t count;
Alex Blighac70aaf2013-08-21 16:02:57 +01001321 int64_t deadline;
Blue Swirl296af7c2010-03-29 19:23:50 +00001322 int decr;
KONRAD Fredericc96778b2014-08-01 01:37:09 +02001323 timers_state.qemu_icount -= (cpu->icount_decr.u16.low
1324 + cpu->icount_extra);
Andreas Färber28ecfd72013-08-26 05:51:49 +02001325 cpu->icount_decr.u16.low = 0;
Andreas Färberefee7342013-08-26 05:39:29 +02001326 cpu->icount_extra = 0;
Alex Bligh40daca52013-08-21 16:03:02 +01001327 deadline = qemu_clock_deadline_ns_all(QEMU_CLOCK_VIRTUAL);
Alex Blighac70aaf2013-08-21 16:02:57 +01001328
1329 /* Maintain prior (possibly buggy) behaviour where if no deadline
Alex Bligh40daca52013-08-21 16:03:02 +01001330 * was set (as there is no QEMU_CLOCK_VIRTUAL timer) or it is more than
Alex Blighac70aaf2013-08-21 16:02:57 +01001331 * INT32_MAX nanoseconds ahead, we still use INT32_MAX
1332 * nanoseconds.
1333 */
1334 if ((deadline < 0) || (deadline > INT32_MAX)) {
1335 deadline = INT32_MAX;
1336 }
1337
1338 count = qemu_icount_round(deadline);
KONRAD Fredericc96778b2014-08-01 01:37:09 +02001339 timers_state.qemu_icount += count;
Blue Swirl296af7c2010-03-29 19:23:50 +00001340 decr = (count > 0xffff) ? 0xffff : count;
1341 count -= decr;
Andreas Färber28ecfd72013-08-26 05:51:49 +02001342 cpu->icount_decr.u16.low = decr;
Andreas Färberefee7342013-08-26 05:39:29 +02001343 cpu->icount_extra = count;
Blue Swirl296af7c2010-03-29 19:23:50 +00001344 }
1345 ret = cpu_exec(env);
1346#ifdef CONFIG_PROFILER
1347 qemu_time += profile_getclock() - ti;
1348#endif
1349 if (use_icount) {
1350 /* Fold pending instructions back into the
1351 instruction counter, and clear the interrupt flag. */
KONRAD Fredericc96778b2014-08-01 01:37:09 +02001352 timers_state.qemu_icount -= (cpu->icount_decr.u16.low
1353 + cpu->icount_extra);
Andreas Färber28ecfd72013-08-26 05:51:49 +02001354 cpu->icount_decr.u32 = 0;
Andreas Färberefee7342013-08-26 05:39:29 +02001355 cpu->icount_extra = 0;
Blue Swirl296af7c2010-03-29 19:23:50 +00001356 }
1357 return ret;
1358}
1359
Jan Kiszkabdb7ca62011-09-26 09:40:39 +02001360static void tcg_exec_all(void)
Blue Swirl296af7c2010-03-29 19:23:50 +00001361{
Jan Kiszka9a360852011-02-01 22:15:55 +01001362 int r;
1363
Alex Bligh40daca52013-08-21 16:03:02 +01001364 /* Account partial waits to QEMU_CLOCK_VIRTUAL. */
1365 qemu_clock_warp(QEMU_CLOCK_VIRTUAL);
Paolo Bonziniab33fcd2011-04-13 10:03:44 +02001366
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001367 if (next_cpu == NULL) {
Blue Swirl296af7c2010-03-29 19:23:50 +00001368 next_cpu = first_cpu;
Jan Kiszka0ab07c62011-02-07 12:19:14 +01001369 }
Andreas Färberbdc44642013-06-24 23:50:24 +02001370 for (; next_cpu != NULL && !exit_request; next_cpu = CPU_NEXT(next_cpu)) {
Andreas Färber182735e2013-05-29 22:29:20 +02001371 CPUState *cpu = next_cpu;
1372 CPUArchState *env = cpu->env_ptr;
Blue Swirl296af7c2010-03-29 19:23:50 +00001373
Alex Bligh40daca52013-08-21 16:03:02 +01001374 qemu_clock_enable(QEMU_CLOCK_VIRTUAL,
Andreas Färbered2803d2013-06-21 20:20:45 +02001375 (cpu->singlestep_enabled & SSTEP_NOTIMER) == 0);
Blue Swirl296af7c2010-03-29 19:23:50 +00001376
Andreas Färbera1fcaa72012-05-02 23:42:26 +02001377 if (cpu_can_run(cpu)) {
Jan Kiszkabdb7ca62011-09-26 09:40:39 +02001378 r = tcg_cpu_exec(env);
Jan Kiszka9a360852011-02-01 22:15:55 +01001379 if (r == EXCP_DEBUG) {
Andreas Färber91325042013-05-27 02:07:49 +02001380 cpu_handle_guest_debug(cpu);
Jan Kiszka3c638d02010-06-25 16:56:56 +02001381 break;
1382 }
Andreas Färberf324e762012-05-02 23:26:21 +02001383 } else if (cpu->stop || cpu->stopped) {
Blue Swirl296af7c2010-03-29 19:23:50 +00001384 break;
1385 }
1386 }
Jan Kiszkac629a4b2010-06-25 16:56:52 +02001387 exit_request = 0;
Blue Swirl296af7c2010-03-29 19:23:50 +00001388}
1389
Stefan Weil9a78eea2010-10-22 23:03:33 +02001390void list_cpus(FILE *f, fprintf_function cpu_fprintf, const char *optarg)
Blue Swirl262353c2010-05-04 19:55:35 +00001391{
1392 /* XXX: implement xxx_cpu_list for targets that still miss it */
Peter Maydelle916cbf2012-09-05 17:41:08 -03001393#if defined(cpu_list)
1394 cpu_list(f, cpu_fprintf);
Blue Swirl262353c2010-05-04 19:55:35 +00001395#endif
1396}
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001397
1398CpuInfoList *qmp_query_cpus(Error **errp)
1399{
1400 CpuInfoList *head = NULL, *cur_item = NULL;
Andreas Färber182735e2013-05-29 22:29:20 +02001401 CPUState *cpu;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001402
Andreas Färberbdc44642013-06-24 23:50:24 +02001403 CPU_FOREACH(cpu) {
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001404 CpuInfoList *info;
Andreas Färber182735e2013-05-29 22:29:20 +02001405#if defined(TARGET_I386)
1406 X86CPU *x86_cpu = X86_CPU(cpu);
1407 CPUX86State *env = &x86_cpu->env;
1408#elif defined(TARGET_PPC)
1409 PowerPCCPU *ppc_cpu = POWERPC_CPU(cpu);
1410 CPUPPCState *env = &ppc_cpu->env;
1411#elif defined(TARGET_SPARC)
1412 SPARCCPU *sparc_cpu = SPARC_CPU(cpu);
1413 CPUSPARCState *env = &sparc_cpu->env;
1414#elif defined(TARGET_MIPS)
1415 MIPSCPU *mips_cpu = MIPS_CPU(cpu);
1416 CPUMIPSState *env = &mips_cpu->env;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001417#elif defined(TARGET_TRICORE)
1418 TriCoreCPU *tricore_cpu = TRICORE_CPU(cpu);
1419 CPUTriCoreState *env = &tricore_cpu->env;
Andreas Färber182735e2013-05-29 22:29:20 +02001420#endif
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001421
Andreas Färbercb446ec2013-05-01 14:24:52 +02001422 cpu_synchronize_state(cpu);
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001423
1424 info = g_malloc0(sizeof(*info));
1425 info->value = g_malloc0(sizeof(*info->value));
Andreas Färber55e5c282012-12-17 06:18:02 +01001426 info->value->CPU = cpu->cpu_index;
Andreas Färber182735e2013-05-29 22:29:20 +02001427 info->value->current = (cpu == first_cpu);
Andreas Färber259186a2013-01-17 18:51:17 +01001428 info->value->halted = cpu->halted;
Andreas Färber9f09e182012-05-03 06:59:07 +02001429 info->value->thread_id = cpu->thread_id;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001430#if defined(TARGET_I386)
1431 info->value->has_pc = true;
1432 info->value->pc = env->eip + env->segs[R_CS].base;
1433#elif defined(TARGET_PPC)
1434 info->value->has_nip = true;
1435 info->value->nip = env->nip;
1436#elif defined(TARGET_SPARC)
1437 info->value->has_pc = true;
1438 info->value->pc = env->pc;
1439 info->value->has_npc = true;
1440 info->value->npc = env->npc;
1441#elif defined(TARGET_MIPS)
1442 info->value->has_PC = true;
1443 info->value->PC = env->active_tc.PC;
Bastian Koppelmann48e06fe2014-09-01 12:59:46 +01001444#elif defined(TARGET_TRICORE)
1445 info->value->has_PC = true;
1446 info->value->PC = env->PC;
Luiz Capitulinode0b36b2011-09-21 16:38:35 -03001447#endif
1448
1449 /* XXX: waiting for the qapi to support GSList */
1450 if (!cur_item) {
1451 head = cur_item = info;
1452 } else {
1453 cur_item->next = info;
1454 cur_item = info;
1455 }
1456 }
1457
1458 return head;
1459}
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001460
1461void qmp_memsave(int64_t addr, int64_t size, const char *filename,
1462 bool has_cpu, int64_t cpu_index, Error **errp)
1463{
1464 FILE *f;
1465 uint32_t l;
Andreas Färber55e5c282012-12-17 06:18:02 +01001466 CPUState *cpu;
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001467 uint8_t buf[1024];
1468
1469 if (!has_cpu) {
1470 cpu_index = 0;
1471 }
1472
Andreas Färber151d1322013-02-15 15:41:49 +01001473 cpu = qemu_get_cpu(cpu_index);
1474 if (cpu == NULL) {
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001475 error_set(errp, QERR_INVALID_PARAMETER_VALUE, "cpu-index",
1476 "a CPU number");
1477 return;
1478 }
1479
1480 f = fopen(filename, "wb");
1481 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001482 error_setg_file_open(errp, errno, filename);
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001483 return;
1484 }
1485
1486 while (size != 0) {
1487 l = sizeof(buf);
1488 if (l > size)
1489 l = size;
Aneesh Kumar K.V2f4d0f52013-10-01 21:49:30 +05301490 if (cpu_memory_rw_debug(cpu, addr, buf, l, 0) != 0) {
1491 error_setg(errp, "Invalid addr 0x%016" PRIx64 "specified", addr);
1492 goto exit;
1493 }
Luiz Capitulino0cfd6a92011-11-22 16:32:37 -02001494 if (fwrite(buf, 1, l, f) != l) {
1495 error_set(errp, QERR_IO_ERROR);
1496 goto exit;
1497 }
1498 addr += l;
1499 size -= l;
1500 }
1501
1502exit:
1503 fclose(f);
1504}
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001505
1506void qmp_pmemsave(int64_t addr, int64_t size, const char *filename,
1507 Error **errp)
1508{
1509 FILE *f;
1510 uint32_t l;
1511 uint8_t buf[1024];
1512
1513 f = fopen(filename, "wb");
1514 if (!f) {
Luiz Capitulino618da852013-06-07 14:35:06 -04001515 error_setg_file_open(errp, errno, filename);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001516 return;
1517 }
1518
1519 while (size != 0) {
1520 l = sizeof(buf);
1521 if (l > size)
1522 l = size;
Stefan Weileb6282f2014-04-07 20:28:23 +02001523 cpu_physical_memory_read(addr, buf, l);
Luiz Capitulino6d3962b2011-11-22 17:26:46 -02001524 if (fwrite(buf, 1, l, f) != l) {
1525 error_set(errp, QERR_IO_ERROR);
1526 goto exit;
1527 }
1528 addr += l;
1529 size -= l;
1530 }
1531
1532exit:
1533 fclose(f);
1534}
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001535
1536void qmp_inject_nmi(Error **errp)
1537{
1538#if defined(TARGET_I386)
Andreas Färber182735e2013-05-29 22:29:20 +02001539 CPUState *cs;
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001540
Andreas Färberbdc44642013-06-24 23:50:24 +02001541 CPU_FOREACH(cs) {
Andreas Färber182735e2013-05-29 22:29:20 +02001542 X86CPU *cpu = X86_CPU(cs);
Andreas Färber182735e2013-05-29 22:29:20 +02001543
Chen Fan02e51482013-12-23 17:04:02 +08001544 if (!cpu->apic_state) {
Andreas Färber182735e2013-05-29 22:29:20 +02001545 cpu_interrupt(cs, CPU_INTERRUPT_NMI);
Jan Kiszka02c09192011-10-18 00:00:06 +08001546 } else {
Chen Fan02e51482013-12-23 17:04:02 +08001547 apic_deliver_nmi(cpu->apic_state);
Jan Kiszka02c09192011-10-18 00:00:06 +08001548 }
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001549 }
1550#else
Alexey Kardashevskiy9cb805f2014-08-20 22:16:33 +10001551 nmi_monitor_handle(monitor_get_cpu_index(), errp);
Luiz Capitulinoab49ab52011-11-23 12:55:53 -02001552#endif
1553}
Sebastian Tanase27498be2014-07-25 11:56:33 +02001554
1555void dump_drift_info(FILE *f, fprintf_function cpu_fprintf)
1556{
1557 if (!use_icount) {
1558 return;
1559 }
1560
1561 cpu_fprintf(f, "Host - Guest clock %"PRIi64" ms\n",
1562 (cpu_get_clock() - cpu_get_icount())/SCALE_MS);
1563 if (icount_align_option) {
1564 cpu_fprintf(f, "Max guest delay %"PRIi64" ms\n", -max_delay/SCALE_MS);
1565 cpu_fprintf(f, "Max guest advance %"PRIi64" ms\n", max_advance/SCALE_MS);
1566 } else {
1567 cpu_fprintf(f, "Max guest delay NA\n");
1568 cpu_fprintf(f, "Max guest advance NA\n");
1569 }
1570}