blob: 468d51749f4cc190662e2741ebfaf27b3aab4719 [file] [log] [blame]
aliguori5bb79102008-10-13 03:12:02 +00001/*
2 * QEMU live migration
3 *
4 * Copyright IBM, Corp. 2008
5 *
6 * Authors:
7 * Anthony Liguori <aliguori@us.ibm.com>
8 *
9 * This work is licensed under the terms of the GNU GPL, version 2. See
10 * the COPYING file in the top-level directory.
11 *
12 */
13
14#include "qemu-common.h"
15#include "migration.h"
aliguori376253e2009-03-05 23:01:23 +000016#include "monitor.h"
aliguori065e2812008-11-11 16:46:33 +000017#include "buffered_file.h"
18#include "sysemu.h"
19#include "block.h"
20#include "qemu_socket.h"
Jan Kiszka25f23642009-11-30 18:21:21 +010021#include "block-migration.h"
Luiz Capitulinoc86a6682009-12-10 17:16:05 -020022#include "qemu-objects.h"
aliguori065e2812008-11-11 16:46:33 +000023
/* Uncomment to compile the DPRINTF() traces in this file. */
//#define DEBUG_MIGRATION

/*
 * DPRINTF(fmt, ...): printf-style trace prefixed with "migration: ".
 * Expands to an empty statement unless DEBUG_MIGRATION is defined.
 */
#if defined(DEBUG_MIGRATION)
#define DPRINTF(fmt, ...) \
    do { printf("migration: " fmt, ## __VA_ARGS__); } while (0)
#else
#define DPRINTF(fmt, ...) \
    do { } while (0)
#endif
aliguori5bb79102008-10-13 03:12:02 +000033
34/* Migration speed throttling */
35static uint32_t max_throttle = (32 << 20);
36
37static MigrationState *current_migration;
38
/*
 * Start an incoming migration on the transport selected by the prefix
 * of @uri.
 *
 * "tcp:" is always recognised; "exec:", "unix:" and "fd:" are recognised
 * only when WIN32 is not defined.  The text following the prefix is handed
 * to the matching *_start_incoming_migration() helper.
 *
 * Returns the helper's return value, or -EPROTONOSUPPORT (after printing
 * a message on stderr) when no prefix matches.
 */
int qemu_start_incoming_migration(const char *uri)
{
    const char *rest;

    if (strstart(uri, "tcp:", &rest)) {
        return tcp_start_incoming_migration(rest);
    }
#if !defined(WIN32)
    if (strstart(uri, "exec:", &rest)) {
        return exec_start_incoming_migration(rest);
    }
    if (strstart(uri, "unix:", &rest)) {
        return unix_start_incoming_migration(rest);
    }
    if (strstart(uri, "fd:", &rest)) {
        return fd_start_incoming_migration(rest);
    }
#endif

    fprintf(stderr, "unknown migration protocol: %s\n", uri);
    return -EPROTONOSUPPORT;
}
60
Juan Quintela511c0232010-06-09 14:10:55 +020061void process_incoming_migration(QEMUFile *f)
62{
63 if (qemu_loadvm_state(f) < 0) {
64 fprintf(stderr, "load of migration failed\n");
65 exit(0);
66 }
67 qemu_announce_self();
68 DPRINTF("successfully loaded vm state\n");
69
Amit Shah8e848652010-07-27 15:49:19 +053070 incoming_expected = false;
71
Juan Quintela511c0232010-06-09 14:10:55 +020072 if (autostart)
73 vm_start();
74}
75
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020076int do_migrate(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +000077{
aliguori34c9dd82008-10-13 03:14:31 +000078 MigrationState *s = NULL;
79 const char *p;
Luiz Capitulinoeb159d12010-05-28 15:25:24 -030080 int detach = qdict_get_try_bool(qdict, "detach", 0);
81 int blk = qdict_get_try_bool(qdict, "blk", 0);
82 int inc = qdict_get_try_bool(qdict, "inc", 0);
Luiz Capitulinof18c16d2009-08-28 15:27:14 -030083 const char *uri = qdict_get_str(qdict, "uri");
Jan Kiszka13024252009-11-30 18:21:19 +010084
85 if (current_migration &&
86 current_migration->get_status(current_migration) == MIG_STATE_ACTIVE) {
87 monitor_printf(mon, "migration already in progress\n");
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020088 return -1;
Jan Kiszka13024252009-11-30 18:21:19 +010089 }
90
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020091 if (strstart(uri, "tcp:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010092 s = tcp_start_outgoing_migration(mon, p, max_throttle, detach,
Luiz Capitulinoeb159d12010-05-28 15:25:24 -030093 blk, inc);
aliguori065e2812008-11-11 16:46:33 +000094#if !defined(WIN32)
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020095 } else if (strstart(uri, "exec:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010096 s = exec_start_outgoing_migration(mon, p, max_throttle, detach,
Luiz Capitulinoeb159d12010-05-28 15:25:24 -030097 blk, inc);
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020098 } else if (strstart(uri, "unix:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010099 s = unix_start_outgoing_migration(mon, p, max_throttle, detach,
Luiz Capitulinoeb159d12010-05-28 15:25:24 -0300100 blk, inc);
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -0200101 } else if (strstart(uri, "fd:", &p)) {
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200102 s = fd_start_outgoing_migration(mon, p, max_throttle, detach,
Luiz Capitulinoeb159d12010-05-28 15:25:24 -0300103 blk, inc);
aliguori065e2812008-11-11 16:46:33 +0000104#endif
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -0200105 } else {
aliguori376253e2009-03-05 23:01:23 +0000106 monitor_printf(mon, "unknown migration protocol: %s\n", uri);
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -0200107 return -1;
aliguori34c9dd82008-10-13 03:14:31 +0000108 }
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -0200109
110 if (s == NULL) {
111 monitor_printf(mon, "migration failed\n");
112 return -1;
113 }
114
115 if (current_migration) {
116 current_migration->release(current_migration);
117 }
118
119 current_migration = s;
120 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000121}
122
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200123int do_migrate_cancel(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000124{
125 MigrationState *s = current_migration;
126
127 if (s)
aliguoriff8d81d2008-10-24 22:10:31 +0000128 s->cancel(s);
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200129
130 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000131}
132
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200133int do_migrate_set_speed(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000134{
135 double d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400136 FdMigrationState *s;
aliguori5bb79102008-10-13 03:12:02 +0000137
Markus Armbruster5667c492010-01-25 14:23:04 +0100138 d = qdict_get_double(qdict, "value");
139 d = MAX(0, MIN(UINT32_MAX, d));
140 max_throttle = d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400141
Jan Kiszka5d39c792009-11-30 18:21:19 +0100142 s = migrate_to_fms(current_migration);
143 if (s && s->file) {
Glauber Costadaa91de2009-05-20 18:26:58 -0400144 qemu_file_set_rate_limit(s->file, max_throttle);
145 }
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200146
147 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000148}
149
/*
 * Downtime, in nanoseconds, that we are willing to accept for a migration.
 * Nanoseconds are used because that is the maximum resolution get_clock()
 * can achieve.  This is an internal unit only: every user-visible value
 * must be expressed in seconds.  The default is 30000000 ns (30 ms).
 */
static uint64_t max_downtime = 30000000;

/* Return the currently configured maximum downtime, in nanoseconds. */
uint64_t migrate_max_downtime(void)
{
    return max_downtime;
}
160
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200161int do_migrate_set_downtime(Monitor *mon, const QDict *qdict,
162 QObject **ret_data)
Glauber Costa2ea42952009-05-28 15:22:58 -0400163{
Glauber Costa2ea42952009-05-28 15:22:58 -0400164 double d;
165
Markus Armbrusterb0fbf7d2010-01-25 14:23:07 +0100166 d = qdict_get_double(qdict, "value") * 1e9;
167 d = MAX(0, MIN(UINT64_MAX, d));
Glauber Costa2ea42952009-05-28 15:22:58 -0400168 max_downtime = (uint64_t)d;
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200169
170 return 0;
Glauber Costa2ea42952009-05-28 15:22:58 -0400171}
172
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200173static void migrate_print_status(Monitor *mon, const char *name,
174 const QDict *status_dict)
aliguori5bb79102008-10-13 03:12:02 +0000175{
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200176 QDict *qdict;
177
178 qdict = qobject_to_qdict(qdict_get(status_dict, name));
179
180 monitor_printf(mon, "transferred %s: %" PRIu64 " kbytes\n", name,
181 qdict_get_int(qdict, "transferred") >> 10);
182 monitor_printf(mon, "remaining %s: %" PRIu64 " kbytes\n", name,
183 qdict_get_int(qdict, "remaining") >> 10);
184 monitor_printf(mon, "total %s: %" PRIu64 " kbytes\n", name,
185 qdict_get_int(qdict, "total") >> 10);
186}
187
188void do_info_migrate_print(Monitor *mon, const QObject *data)
189{
190 QDict *qdict;
191
192 qdict = qobject_to_qdict(data);
193
194 monitor_printf(mon, "Migration status: %s\n",
195 qdict_get_str(qdict, "status"));
196
197 if (qdict_haskey(qdict, "ram")) {
198 migrate_print_status(mon, "ram", qdict);
199 }
200
201 if (qdict_haskey(qdict, "disk")) {
202 migrate_print_status(mon, "disk", qdict);
203 }
204}
205
206static void migrate_put_status(QDict *qdict, const char *name,
207 uint64_t trans, uint64_t rem, uint64_t total)
208{
209 QObject *obj;
210
211 obj = qobject_from_jsonf("{ 'transferred': %" PRId64 ", "
212 "'remaining': %" PRId64 ", "
213 "'total': %" PRId64 " }", trans, rem, total);
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200214 qdict_put_obj(qdict, name, obj);
215}
216
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200217void do_info_migrate(Monitor *mon, QObject **ret_data)
218{
219 QDict *qdict;
aliguori5bb79102008-10-13 03:12:02 +0000220 MigrationState *s = current_migration;
aliguori376253e2009-03-05 23:01:23 +0000221
aliguori5bb79102008-10-13 03:12:02 +0000222 if (s) {
aliguoriff8d81d2008-10-24 22:10:31 +0000223 switch (s->get_status(s)) {
224 case MIG_STATE_ACTIVE:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200225 qdict = qdict_new();
226 qdict_put(qdict, "status", qstring_from_str("active"));
227
228 migrate_put_status(qdict, "ram", ram_bytes_transferred(),
229 ram_bytes_remaining(), ram_bytes_total());
230
Jan Kiszka25f23642009-11-30 18:21:21 +0100231 if (blk_mig_active()) {
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200232 migrate_put_status(qdict, "disk", blk_mig_bytes_transferred(),
233 blk_mig_bytes_remaining(),
234 blk_mig_bytes_total());
Jan Kiszka25f23642009-11-30 18:21:21 +0100235 }
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200236
237 *ret_data = QOBJECT(qdict);
aliguoriff8d81d2008-10-24 22:10:31 +0000238 break;
239 case MIG_STATE_COMPLETED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200240 *ret_data = qobject_from_jsonf("{ 'status': 'completed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000241 break;
242 case MIG_STATE_ERROR:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200243 *ret_data = qobject_from_jsonf("{ 'status': 'failed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000244 break;
245 case MIG_STATE_CANCELLED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200246 *ret_data = qobject_from_jsonf("{ 'status': 'cancelled' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000247 break;
248 }
aliguori5bb79102008-10-13 03:12:02 +0000249 }
250}
251
aliguori065e2812008-11-11 16:46:33 +0000252/* shared migration helpers */
253
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100254void migrate_fd_monitor_suspend(FdMigrationState *s, Monitor *mon)
aliguori731b0362009-03-05 23:01:42 +0000255{
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100256 s->mon = mon;
257 if (monitor_suspend(mon) == 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300258 DPRINTF("suspending monitor\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100259 } else {
260 monitor_printf(mon, "terminal does not allow synchronous "
aliguoricde76ee2009-03-05 23:01:51 +0000261 "migration, continuing detached\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100262 }
aliguori731b0362009-03-05 23:01:42 +0000263}
264
aliguori065e2812008-11-11 16:46:33 +0000265void migrate_fd_error(FdMigrationState *s)
266{
malcd0f2c4c2010-02-07 02:03:50 +0300267 DPRINTF("setting error state\n");
aliguori065e2812008-11-11 16:46:33 +0000268 s->state = MIG_STATE_ERROR;
269 migrate_fd_cleanup(s);
270}
271
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500272int migrate_fd_cleanup(FdMigrationState *s)
aliguori065e2812008-11-11 16:46:33 +0000273{
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500274 int ret = 0;
275
aliguori065e2812008-11-11 16:46:33 +0000276 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
277
278 if (s->file) {
malcd0f2c4c2010-02-07 02:03:50 +0300279 DPRINTF("closing file\n");
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500280 if (qemu_fclose(s->file) != 0) {
281 ret = -1;
282 }
Jan Kiszka5d39c792009-11-30 18:21:19 +0100283 s->file = NULL;
aliguori065e2812008-11-11 16:46:33 +0000284 }
285
286 if (s->fd != -1)
287 close(s->fd);
288
289 /* Don't resume monitor until we've flushed all of the buffers */
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100290 if (s->mon) {
291 monitor_resume(s->mon);
292 }
aliguori065e2812008-11-11 16:46:33 +0000293
294 s->fd = -1;
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500295
296 return ret;
aliguori065e2812008-11-11 16:46:33 +0000297}
298
299void migrate_fd_put_notify(void *opaque)
300{
301 FdMigrationState *s = opaque;
302
303 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
304 qemu_file_put_notify(s->file);
305}
306
307ssize_t migrate_fd_put_buffer(void *opaque, const void *data, size_t size)
308{
309 FdMigrationState *s = opaque;
310 ssize_t ret;
311
312 do {
313 ret = s->write(s, data, size);
Uri Lublin95b134e2009-05-19 14:08:53 +0300314 } while (ret == -1 && ((s->get_error(s)) == EINTR));
aliguori065e2812008-11-11 16:46:33 +0000315
316 if (ret == -1)
317 ret = -(s->get_error(s));
318
Marcelo Tosattie447b1a2010-08-19 10:18:39 -0300319 if (ret == -EAGAIN) {
aliguori065e2812008-11-11 16:46:33 +0000320 qemu_set_fd_handler2(s->fd, NULL, NULL, migrate_fd_put_notify, s);
Marcelo Tosattie447b1a2010-08-19 10:18:39 -0300321 } else if (ret < 0) {
322 if (s->mon) {
323 monitor_resume(s->mon);
324 }
325 s->state = MIG_STATE_ERROR;
326 }
aliguori065e2812008-11-11 16:46:33 +0000327
328 return ret;
329}
330
331void migrate_fd_connect(FdMigrationState *s)
332{
333 int ret;
334
335 s->file = qemu_fopen_ops_buffered(s,
336 s->bandwidth_limit,
337 migrate_fd_put_buffer,
338 migrate_fd_put_ready,
339 migrate_fd_wait_for_unfreeze,
340 migrate_fd_close);
341
malcd0f2c4c2010-02-07 02:03:50 +0300342 DPRINTF("beginning savevm\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100343 ret = qemu_savevm_state_begin(s->mon, s->file, s->mig_state.blk,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200344 s->mig_state.shared);
aliguori065e2812008-11-11 16:46:33 +0000345 if (ret < 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300346 DPRINTF("failed, %d\n", ret);
aliguori065e2812008-11-11 16:46:33 +0000347 migrate_fd_error(s);
348 return;
349 }
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200350
aliguori065e2812008-11-11 16:46:33 +0000351 migrate_fd_put_ready(s);
352}
353
354void migrate_fd_put_ready(void *opaque)
355{
356 FdMigrationState *s = opaque;
357
358 if (s->state != MIG_STATE_ACTIVE) {
malcd0f2c4c2010-02-07 02:03:50 +0300359 DPRINTF("put_ready returning because of non-active state\n");
aliguori065e2812008-11-11 16:46:33 +0000360 return;
361 }
362
malcd0f2c4c2010-02-07 02:03:50 +0300363 DPRINTF("iterate\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100364 if (qemu_savevm_state_iterate(s->mon, s->file) == 1) {
aliguorib161d122009-04-05 19:30:33 +0000365 int state;
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500366 int old_vm_running = vm_running;
367
malcd0f2c4c2010-02-07 02:03:50 +0300368 DPRINTF("done iterating\n");
aliguori065e2812008-11-11 16:46:33 +0000369 vm_stop(0);
370
Glauber Costa08846572009-07-06 09:32:09 -0400371 qemu_aio_flush();
aliguori065e2812008-11-11 16:46:33 +0000372 bdrv_flush_all();
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100373 if ((qemu_savevm_state_complete(s->mon, s->file)) < 0) {
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500374 if (old_vm_running) {
375 vm_start();
376 }
aliguorib161d122009-04-05 19:30:33 +0000377 state = MIG_STATE_ERROR;
378 } else {
379 state = MIG_STATE_COMPLETED;
380 }
Anthony Liguori41ef56e2010-06-02 14:55:25 -0500381 if (migrate_fd_cleanup(s) < 0) {
382 if (old_vm_running) {
383 vm_start();
384 }
385 state = MIG_STATE_ERROR;
386 }
aliguorib161d122009-04-05 19:30:33 +0000387 s->state = state;
aliguori065e2812008-11-11 16:46:33 +0000388 }
389}
390
391int migrate_fd_get_status(MigrationState *mig_state)
392{
393 FdMigrationState *s = migrate_to_fms(mig_state);
394 return s->state;
395}
396
397void migrate_fd_cancel(MigrationState *mig_state)
398{
399 FdMigrationState *s = migrate_to_fms(mig_state);
400
401 if (s->state != MIG_STATE_ACTIVE)
402 return;
403
malcd0f2c4c2010-02-07 02:03:50 +0300404 DPRINTF("cancelling migration\n");
aliguori065e2812008-11-11 16:46:33 +0000405
406 s->state = MIG_STATE_CANCELLED;
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100407 qemu_savevm_state_cancel(s->mon, s->file);
aliguori065e2812008-11-11 16:46:33 +0000408
409 migrate_fd_cleanup(s);
410}
411
412void migrate_fd_release(MigrationState *mig_state)
413{
414 FdMigrationState *s = migrate_to_fms(mig_state);
415
malcd0f2c4c2010-02-07 02:03:50 +0300416 DPRINTF("releasing state\n");
aliguori065e2812008-11-11 16:46:33 +0000417
418 if (s->state == MIG_STATE_ACTIVE) {
419 s->state = MIG_STATE_CANCELLED;
420 migrate_fd_cleanup(s);
421 }
Yoshiaki Tamurafaa1f8d2010-06-09 14:44:31 +0900422 qemu_free(s);
aliguori065e2812008-11-11 16:46:33 +0000423}
424
425void migrate_fd_wait_for_unfreeze(void *opaque)
426{
427 FdMigrationState *s = opaque;
428 int ret;
429
malcd0f2c4c2010-02-07 02:03:50 +0300430 DPRINTF("wait for unfreeze\n");
aliguori065e2812008-11-11 16:46:33 +0000431 if (s->state != MIG_STATE_ACTIVE)
432 return;
433
434 do {
435 fd_set wfds;
436
437 FD_ZERO(&wfds);
438 FD_SET(s->fd, &wfds);
439
440 ret = select(s->fd + 1, NULL, &wfds, NULL, NULL);
441 } while (ret == -1 && (s->get_error(s)) == EINTR);
442}
443
444int migrate_fd_close(void *opaque)
445{
446 FdMigrationState *s = opaque;
Uri Lubline19252d2009-06-08 14:28:01 +0300447
448 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
aliguori065e2812008-11-11 16:46:33 +0000449 return s->close(s);
450}