blob: 2320c5fdf41801d9f3b758302548fe2609b217d1 [file] [log] [blame]
aliguori5bb79102008-10-13 03:12:02 +00001/*
2 * QEMU live migration
3 *
4 * Copyright IBM, Corp. 2008
5 *
6 * Authors:
7 * Anthony Liguori <aliguori@us.ibm.com>
8 *
9 * This work is licensed under the terms of the GNU GPL, version 2. See
10 * the COPYING file in the top-level directory.
11 *
12 */
13
14#include "qemu-common.h"
15#include "migration.h"
aliguori376253e2009-03-05 23:01:23 +000016#include "monitor.h"
aliguori065e2812008-11-11 16:46:33 +000017#include "buffered_file.h"
18#include "sysemu.h"
19#include "block.h"
20#include "qemu_socket.h"
Jan Kiszka25f23642009-11-30 18:21:21 +010021#include "block-migration.h"
Luiz Capitulinoc86a6682009-12-10 17:16:05 -020022#include "qemu-objects.h"
aliguori065e2812008-11-11 16:46:33 +000023
/* Uncomment the next line to compile in the migration debug traces. */
//#define DEBUG_MIGRATION

/*
 * DPRINTF(): printf-style trace prefixed with "migration: ".
 *
 * With DEBUG_MIGRATION defined the message goes through printf(); without
 * it the macro expands to an empty statement and its arguments are not
 * evaluated.
 */
#ifdef DEBUG_MIGRATION
#define DPRINTF(fmt, ...) \
    do { printf("migration: " fmt, ## __VA_ARGS__); } while (0)
#else
#define DPRINTF(fmt, ...) \
    do { } while (0)
#endif
aliguori5bb79102008-10-13 03:12:02 +000033
34/* Migration speed throttling */
35static uint32_t max_throttle = (32 << 20);
36
37static MigrationState *current_migration;
38
/**
 * qemu_start_incoming_migration(): start an incoming migration for @uri
 *
 * The protocol prefix of @uri selects the transport; the string position
 * reported by strstart() is passed on to the transport-specific starter.
 * "tcp:" is always handled, while "exec:", "unix:" and "fd:" are only
 * compiled in when WIN32 is not defined.  A URI with no recognized prefix
 * is reported on stderr and otherwise ignored.
 */
void qemu_start_incoming_migration(const char *uri)
{
    const char *rest;

    if (strstart(uri, "tcp:", &rest)) {
        tcp_start_incoming_migration(rest);
        return;
    }
#if !defined(WIN32)
    if (strstart(uri, "exec:", &rest)) {
        exec_start_incoming_migration(rest);
        return;
    }
    if (strstart(uri, "unix:", &rest)) {
        unix_start_incoming_migration(rest);
        return;
    }
    if (strstart(uri, "fd:", &rest)) {
        fd_start_incoming_migration(rest);
        return;
    }
#endif
    fprintf(stderr, "unknown migration protocol: %s\n", uri);
}
56
Luiz Capitulino5f79da02009-10-16 12:23:45 -030057void do_migrate(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +000058{
aliguori34c9dd82008-10-13 03:14:31 +000059 MigrationState *s = NULL;
60 const char *p;
Luiz Capitulinof18c16d2009-08-28 15:27:14 -030061 int detach = qdict_get_int(qdict, "detach");
62 const char *uri = qdict_get_str(qdict, "uri");
Jan Kiszka13024252009-11-30 18:21:19 +010063
64 if (current_migration &&
65 current_migration->get_status(current_migration) == MIG_STATE_ACTIVE) {
66 monitor_printf(mon, "migration already in progress\n");
67 return;
68 }
69
aliguori34c9dd82008-10-13 03:14:31 +000070 if (strstart(uri, "tcp:", &p))
Jan Kiszkaf327aa02009-11-30 18:21:21 +010071 s = tcp_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020072 (int)qdict_get_int(qdict, "blk"),
73 (int)qdict_get_int(qdict, "inc"));
aliguori065e2812008-11-11 16:46:33 +000074#if !defined(WIN32)
75 else if (strstart(uri, "exec:", &p))
Jan Kiszkaf327aa02009-11-30 18:21:21 +010076 s = exec_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020077 (int)qdict_get_int(qdict, "blk"),
78 (int)qdict_get_int(qdict, "inc"));
Chris Lalancette4951f652009-08-05 17:24:29 +020079 else if (strstart(uri, "unix:", &p))
Jan Kiszkaf327aa02009-11-30 18:21:21 +010080 s = unix_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020081 (int)qdict_get_int(qdict, "blk"),
82 (int)qdict_get_int(qdict, "inc"));
Paolo Bonzini5ac1fad2009-08-18 15:56:25 +020083 else if (strstart(uri, "fd:", &p))
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020084 s = fd_start_outgoing_migration(mon, p, max_throttle, detach,
85 (int)qdict_get_int(qdict, "blk"),
86 (int)qdict_get_int(qdict, "inc"));
aliguori065e2812008-11-11 16:46:33 +000087#endif
aliguori34c9dd82008-10-13 03:14:31 +000088 else
aliguori376253e2009-03-05 23:01:23 +000089 monitor_printf(mon, "unknown migration protocol: %s\n", uri);
aliguori34c9dd82008-10-13 03:14:31 +000090
91 if (s == NULL)
aliguori376253e2009-03-05 23:01:23 +000092 monitor_printf(mon, "migration failed\n");
aliguori34c9dd82008-10-13 03:14:31 +000093 else {
aliguoriff8d81d2008-10-24 22:10:31 +000094 if (current_migration)
95 current_migration->release(current_migration);
aliguori34c9dd82008-10-13 03:14:31 +000096
aliguoriff8d81d2008-10-24 22:10:31 +000097 current_migration = s;
aliguori34c9dd82008-10-13 03:14:31 +000098 }
aliguori5bb79102008-10-13 03:12:02 +000099}
100
Luiz Capitulino911d2962009-10-16 12:23:47 -0300101void do_migrate_cancel(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000102{
103 MigrationState *s = current_migration;
104
105 if (s)
aliguoriff8d81d2008-10-24 22:10:31 +0000106 s->cancel(s);
aliguori5bb79102008-10-13 03:12:02 +0000107}
108
Markus Armbruster5fd90832010-01-25 14:23:05 +0100109void do_migrate_set_speed(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000110{
111 double d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400112 FdMigrationState *s;
aliguori5bb79102008-10-13 03:12:02 +0000113
Markus Armbruster5667c492010-01-25 14:23:04 +0100114 d = qdict_get_double(qdict, "value");
115 d = MAX(0, MIN(UINT32_MAX, d));
116 max_throttle = d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400117
Jan Kiszka5d39c792009-11-30 18:21:19 +0100118 s = migrate_to_fms(current_migration);
119 if (s && s->file) {
Glauber Costadaa91de2009-05-20 18:26:58 -0400120 qemu_file_set_rate_limit(s->file, max_throttle);
121 }
aliguori5bb79102008-10-13 03:12:02 +0000122}
123
/*
 * Maximum downtime, in nanoseconds, that we are willing to tolerate for a
 * migration.  Nanoseconds were chosen because that is the maximum
 * resolution get_clock() can achieve.  This is an internal measure: all
 * user-visible units must be in seconds.
 */
static uint64_t max_downtime = 30000000;

/* Return the currently configured maximum downtime, in nanoseconds. */
uint64_t migrate_max_downtime(void)
{
    uint64_t downtime_ns = max_downtime;

    return downtime_ns;
}
134
Markus Armbrusterc6027f52010-01-25 14:23:08 +0100135void do_migrate_set_downtime(Monitor *mon, const QDict *qdict,
136 QObject **ret_data)
Glauber Costa2ea42952009-05-28 15:22:58 -0400137{
Glauber Costa2ea42952009-05-28 15:22:58 -0400138 double d;
139
Markus Armbrusterb0fbf7d2010-01-25 14:23:07 +0100140 d = qdict_get_double(qdict, "value") * 1e9;
141 d = MAX(0, MIN(UINT64_MAX, d));
Glauber Costa2ea42952009-05-28 15:22:58 -0400142 max_downtime = (uint64_t)d;
143}
144
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200145static void migrate_print_status(Monitor *mon, const char *name,
146 const QDict *status_dict)
aliguori5bb79102008-10-13 03:12:02 +0000147{
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200148 QDict *qdict;
149
150 qdict = qobject_to_qdict(qdict_get(status_dict, name));
151
152 monitor_printf(mon, "transferred %s: %" PRIu64 " kbytes\n", name,
153 qdict_get_int(qdict, "transferred") >> 10);
154 monitor_printf(mon, "remaining %s: %" PRIu64 " kbytes\n", name,
155 qdict_get_int(qdict, "remaining") >> 10);
156 monitor_printf(mon, "total %s: %" PRIu64 " kbytes\n", name,
157 qdict_get_int(qdict, "total") >> 10);
158}
159
160void do_info_migrate_print(Monitor *mon, const QObject *data)
161{
162 QDict *qdict;
163
164 qdict = qobject_to_qdict(data);
165
166 monitor_printf(mon, "Migration status: %s\n",
167 qdict_get_str(qdict, "status"));
168
169 if (qdict_haskey(qdict, "ram")) {
170 migrate_print_status(mon, "ram", qdict);
171 }
172
173 if (qdict_haskey(qdict, "disk")) {
174 migrate_print_status(mon, "disk", qdict);
175 }
176}
177
178static void migrate_put_status(QDict *qdict, const char *name,
179 uint64_t trans, uint64_t rem, uint64_t total)
180{
181 QObject *obj;
182
183 obj = qobject_from_jsonf("{ 'transferred': %" PRId64 ", "
184 "'remaining': %" PRId64 ", "
185 "'total': %" PRId64 " }", trans, rem, total);
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200186 qdict_put_obj(qdict, name, obj);
187}
188
189/**
190 * do_info_migrate(): Migration status
191 *
192 * Return a QDict. If migration is active there will be another
193 * QDict with RAM migration status and if block migration is active
194 * another one with block migration status.
195 *
196 * The main QDict contains the following:
197 *
198 * - "status": migration status
199 * - "ram": only present if "status" is "active", it is a QDict with the
200 * following RAM information (in bytes):
201 * - "transferred": amount transferred
202 * - "remaining": amount remaining
203 * - "total": total
204 * - "disk": only present if "status" is "active" and it is a block migration,
205 * it is a QDict with the following disk information (in bytes):
206 * - "transferred": amount transferred
207 * - "remaining": amount remaining
208 * - "total": total
209 *
210 * Examples:
211 *
212 * 1. Migration is "completed":
213 *
214 * { "status": "completed" }
215 *
216 * 2. Migration is "active" and it is not a block migration:
217 *
218 * { "status": "active",
219 * "ram": { "transferred": 123, "remaining": 123, "total": 246 } }
220 *
221 * 3. Migration is "active" and it is a block migration:
222 *
223 * { "status": "active",
224 * "ram": { "total": 1057024, "remaining": 1053304, "transferred": 3720 },
225 * "disk": { "total": 20971520, "remaining": 20880384, "transferred": 91136 }}
226 */
227void do_info_migrate(Monitor *mon, QObject **ret_data)
228{
229 QDict *qdict;
aliguori5bb79102008-10-13 03:12:02 +0000230 MigrationState *s = current_migration;
aliguori376253e2009-03-05 23:01:23 +0000231
aliguori5bb79102008-10-13 03:12:02 +0000232 if (s) {
aliguoriff8d81d2008-10-24 22:10:31 +0000233 switch (s->get_status(s)) {
234 case MIG_STATE_ACTIVE:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200235 qdict = qdict_new();
236 qdict_put(qdict, "status", qstring_from_str("active"));
237
238 migrate_put_status(qdict, "ram", ram_bytes_transferred(),
239 ram_bytes_remaining(), ram_bytes_total());
240
Jan Kiszka25f23642009-11-30 18:21:21 +0100241 if (blk_mig_active()) {
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200242 migrate_put_status(qdict, "disk", blk_mig_bytes_transferred(),
243 blk_mig_bytes_remaining(),
244 blk_mig_bytes_total());
Jan Kiszka25f23642009-11-30 18:21:21 +0100245 }
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200246
247 *ret_data = QOBJECT(qdict);
aliguoriff8d81d2008-10-24 22:10:31 +0000248 break;
249 case MIG_STATE_COMPLETED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200250 *ret_data = qobject_from_jsonf("{ 'status': 'completed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000251 break;
252 case MIG_STATE_ERROR:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200253 *ret_data = qobject_from_jsonf("{ 'status': 'failed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000254 break;
255 case MIG_STATE_CANCELLED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200256 *ret_data = qobject_from_jsonf("{ 'status': 'cancelled' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000257 break;
258 }
aliguori5bb79102008-10-13 03:12:02 +0000259 }
260}
261
aliguori065e2812008-11-11 16:46:33 +0000262/* shared migration helpers */
263
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100264void migrate_fd_monitor_suspend(FdMigrationState *s, Monitor *mon)
aliguori731b0362009-03-05 23:01:42 +0000265{
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100266 s->mon = mon;
267 if (monitor_suspend(mon) == 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300268 DPRINTF("suspending monitor\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100269 } else {
270 monitor_printf(mon, "terminal does not allow synchronous "
aliguoricde76ee2009-03-05 23:01:51 +0000271 "migration, continuing detached\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100272 }
aliguori731b0362009-03-05 23:01:42 +0000273}
274
aliguori065e2812008-11-11 16:46:33 +0000275void migrate_fd_error(FdMigrationState *s)
276{
malcd0f2c4c2010-02-07 02:03:50 +0300277 DPRINTF("setting error state\n");
aliguori065e2812008-11-11 16:46:33 +0000278 s->state = MIG_STATE_ERROR;
279 migrate_fd_cleanup(s);
280}
281
282void migrate_fd_cleanup(FdMigrationState *s)
283{
284 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
285
286 if (s->file) {
malcd0f2c4c2010-02-07 02:03:50 +0300287 DPRINTF("closing file\n");
aliguori065e2812008-11-11 16:46:33 +0000288 qemu_fclose(s->file);
Jan Kiszka5d39c792009-11-30 18:21:19 +0100289 s->file = NULL;
aliguori065e2812008-11-11 16:46:33 +0000290 }
291
292 if (s->fd != -1)
293 close(s->fd);
294
295 /* Don't resume monitor until we've flushed all of the buffers */
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100296 if (s->mon) {
297 monitor_resume(s->mon);
298 }
aliguori065e2812008-11-11 16:46:33 +0000299
300 s->fd = -1;
301}
302
303void migrate_fd_put_notify(void *opaque)
304{
305 FdMigrationState *s = opaque;
306
307 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
308 qemu_file_put_notify(s->file);
309}
310
311ssize_t migrate_fd_put_buffer(void *opaque, const void *data, size_t size)
312{
313 FdMigrationState *s = opaque;
314 ssize_t ret;
315
316 do {
317 ret = s->write(s, data, size);
Uri Lublin95b134e2009-05-19 14:08:53 +0300318 } while (ret == -1 && ((s->get_error(s)) == EINTR));
aliguori065e2812008-11-11 16:46:33 +0000319
320 if (ret == -1)
321 ret = -(s->get_error(s));
322
323 if (ret == -EAGAIN)
324 qemu_set_fd_handler2(s->fd, NULL, NULL, migrate_fd_put_notify, s);
325
326 return ret;
327}
328
329void migrate_fd_connect(FdMigrationState *s)
330{
331 int ret;
332
333 s->file = qemu_fopen_ops_buffered(s,
334 s->bandwidth_limit,
335 migrate_fd_put_buffer,
336 migrate_fd_put_ready,
337 migrate_fd_wait_for_unfreeze,
338 migrate_fd_close);
339
malcd0f2c4c2010-02-07 02:03:50 +0300340 DPRINTF("beginning savevm\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100341 ret = qemu_savevm_state_begin(s->mon, s->file, s->mig_state.blk,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200342 s->mig_state.shared);
aliguori065e2812008-11-11 16:46:33 +0000343 if (ret < 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300344 DPRINTF("failed, %d\n", ret);
aliguori065e2812008-11-11 16:46:33 +0000345 migrate_fd_error(s);
346 return;
347 }
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200348
aliguori065e2812008-11-11 16:46:33 +0000349 migrate_fd_put_ready(s);
350}
351
352void migrate_fd_put_ready(void *opaque)
353{
354 FdMigrationState *s = opaque;
355
356 if (s->state != MIG_STATE_ACTIVE) {
malcd0f2c4c2010-02-07 02:03:50 +0300357 DPRINTF("put_ready returning because of non-active state\n");
aliguori065e2812008-11-11 16:46:33 +0000358 return;
359 }
360
malcd0f2c4c2010-02-07 02:03:50 +0300361 DPRINTF("iterate\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100362 if (qemu_savevm_state_iterate(s->mon, s->file) == 1) {
aliguorib161d122009-04-05 19:30:33 +0000363 int state;
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500364 int old_vm_running = vm_running;
365
malcd0f2c4c2010-02-07 02:03:50 +0300366 DPRINTF("done iterating\n");
aliguori065e2812008-11-11 16:46:33 +0000367 vm_stop(0);
368
Glauber Costa08846572009-07-06 09:32:09 -0400369 qemu_aio_flush();
aliguori065e2812008-11-11 16:46:33 +0000370 bdrv_flush_all();
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100371 if ((qemu_savevm_state_complete(s->mon, s->file)) < 0) {
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500372 if (old_vm_running) {
373 vm_start();
374 }
aliguorib161d122009-04-05 19:30:33 +0000375 state = MIG_STATE_ERROR;
376 } else {
377 state = MIG_STATE_COMPLETED;
378 }
aliguori065e2812008-11-11 16:46:33 +0000379 migrate_fd_cleanup(s);
aliguorib161d122009-04-05 19:30:33 +0000380 s->state = state;
aliguori065e2812008-11-11 16:46:33 +0000381 }
382}
383
384int migrate_fd_get_status(MigrationState *mig_state)
385{
386 FdMigrationState *s = migrate_to_fms(mig_state);
387 return s->state;
388}
389
390void migrate_fd_cancel(MigrationState *mig_state)
391{
392 FdMigrationState *s = migrate_to_fms(mig_state);
393
394 if (s->state != MIG_STATE_ACTIVE)
395 return;
396
malcd0f2c4c2010-02-07 02:03:50 +0300397 DPRINTF("cancelling migration\n");
aliguori065e2812008-11-11 16:46:33 +0000398
399 s->state = MIG_STATE_CANCELLED;
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100400 qemu_savevm_state_cancel(s->mon, s->file);
aliguori065e2812008-11-11 16:46:33 +0000401
402 migrate_fd_cleanup(s);
403}
404
405void migrate_fd_release(MigrationState *mig_state)
406{
407 FdMigrationState *s = migrate_to_fms(mig_state);
408
malcd0f2c4c2010-02-07 02:03:50 +0300409 DPRINTF("releasing state\n");
aliguori065e2812008-11-11 16:46:33 +0000410
411 if (s->state == MIG_STATE_ACTIVE) {
412 s->state = MIG_STATE_CANCELLED;
413 migrate_fd_cleanup(s);
414 }
415 free(s);
416}
417
418void migrate_fd_wait_for_unfreeze(void *opaque)
419{
420 FdMigrationState *s = opaque;
421 int ret;
422
malcd0f2c4c2010-02-07 02:03:50 +0300423 DPRINTF("wait for unfreeze\n");
aliguori065e2812008-11-11 16:46:33 +0000424 if (s->state != MIG_STATE_ACTIVE)
425 return;
426
427 do {
428 fd_set wfds;
429
430 FD_ZERO(&wfds);
431 FD_SET(s->fd, &wfds);
432
433 ret = select(s->fd + 1, NULL, &wfds, NULL, NULL);
434 } while (ret == -1 && (s->get_error(s)) == EINTR);
435}
436
437int migrate_fd_close(void *opaque)
438{
439 FdMigrationState *s = opaque;
Uri Lubline19252d2009-06-08 14:28:01 +0300440
441 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
aliguori065e2812008-11-11 16:46:33 +0000442 return s->close(s);
443}