blob: 05f6cc5a0f5004301ff0cd0f5fa9163301480ba2 [file] [log] [blame]
aliguori5bb79102008-10-13 03:12:02 +00001/*
2 * QEMU live migration
3 *
4 * Copyright IBM, Corp. 2008
5 *
6 * Authors:
7 * Anthony Liguori <aliguori@us.ibm.com>
8 *
9 * This work is licensed under the terms of the GNU GPL, version 2. See
10 * the COPYING file in the top-level directory.
11 *
12 */
13
14#include "qemu-common.h"
15#include "migration.h"
aliguori376253e2009-03-05 23:01:23 +000016#include "monitor.h"
aliguori065e2812008-11-11 16:46:33 +000017#include "buffered_file.h"
18#include "sysemu.h"
19#include "block.h"
20#include "qemu_socket.h"
Jan Kiszka25f23642009-11-30 18:21:21 +010021#include "block-migration.h"
Luiz Capitulinoc86a6682009-12-10 17:16:05 -020022#include "qemu-objects.h"
aliguori065e2812008-11-11 16:46:33 +000023
/* Define DEBUG_MIGRATION to have DPRINTF() emit trace lines via printf(). */
/* #define DEBUG_MIGRATION */

#if defined(DEBUG_MIGRATION)
/* Debug build: prefix every message with "migration: ". */
#define DPRINTF(fmt, ...) \
    do { printf("migration: " fmt, ## __VA_ARGS__); } while (0)
#else
/* Normal build: expands to an empty statement; arguments are not evaluated. */
#define DPRINTF(fmt, ...) \
    do { } while (0)
#endif
aliguori5bb79102008-10-13 03:12:02 +000033
/*
 * Migration speed throttling: limit handed to the outgoing-migration
 * starters and to qemu_file_set_rate_limit().  Starts out at 32 MiB.
 */
static uint32_t max_throttle = 32 * 1024 * 1024;
36
37static MigrationState *current_migration;
38
/*
 * Start accepting an incoming migration described by @uri.
 *
 * The transport is chosen from the URI prefix: "tcp:" everywhere, and
 * "exec:", "unix:" and "fd:" on non-Windows builds.  The pointer that
 * strstart() fills in is handed to the matching transport helper.  A URI
 * with no recognised prefix is only reported on stderr.
 */
void qemu_start_incoming_migration(const char *uri)
{
    const char *rest;

    if (strstart(uri, "tcp:", &rest)) {
        tcp_start_incoming_migration(rest);
        return;
    }

#if !defined(WIN32)
    if (strstart(uri, "exec:", &rest)) {
        exec_start_incoming_migration(rest);
        return;
    }

    if (strstart(uri, "unix:", &rest)) {
        unix_start_incoming_migration(rest);
        return;
    }

    if (strstart(uri, "fd:", &rest)) {
        fd_start_incoming_migration(rest);
        return;
    }
#endif

    fprintf(stderr, "unknown migration protocol: %s\n", uri);
}
56
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020057int do_migrate(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +000058{
aliguori34c9dd82008-10-13 03:14:31 +000059 MigrationState *s = NULL;
60 const char *p;
Luiz Capitulinof18c16d2009-08-28 15:27:14 -030061 int detach = qdict_get_int(qdict, "detach");
62 const char *uri = qdict_get_str(qdict, "uri");
Jan Kiszka13024252009-11-30 18:21:19 +010063
64 if (current_migration &&
65 current_migration->get_status(current_migration) == MIG_STATE_ACTIVE) {
66 monitor_printf(mon, "migration already in progress\n");
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020067 return -1;
Jan Kiszka13024252009-11-30 18:21:19 +010068 }
69
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020070 if (strstart(uri, "tcp:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010071 s = tcp_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020072 (int)qdict_get_int(qdict, "blk"),
73 (int)qdict_get_int(qdict, "inc"));
aliguori065e2812008-11-11 16:46:33 +000074#if !defined(WIN32)
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020075 } else if (strstart(uri, "exec:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010076 s = exec_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020077 (int)qdict_get_int(qdict, "blk"),
78 (int)qdict_get_int(qdict, "inc"));
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020079 } else if (strstart(uri, "unix:", &p)) {
Jan Kiszkaf327aa02009-11-30 18:21:21 +010080 s = unix_start_outgoing_migration(mon, p, max_throttle, detach,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020081 (int)qdict_get_int(qdict, "blk"),
82 (int)qdict_get_int(qdict, "inc"));
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020083 } else if (strstart(uri, "fd:", &p)) {
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +020084 s = fd_start_outgoing_migration(mon, p, max_throttle, detach,
85 (int)qdict_get_int(qdict, "blk"),
86 (int)qdict_get_int(qdict, "inc"));
aliguori065e2812008-11-11 16:46:33 +000087#endif
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020088 } else {
aliguori376253e2009-03-05 23:01:23 +000089 monitor_printf(mon, "unknown migration protocol: %s\n", uri);
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020090 return -1;
aliguori34c9dd82008-10-13 03:14:31 +000091 }
Luiz Capitulinob5d17ad2010-02-10 23:49:57 -020092
93 if (s == NULL) {
94 monitor_printf(mon, "migration failed\n");
95 return -1;
96 }
97
98 if (current_migration) {
99 current_migration->release(current_migration);
100 }
101
102 current_migration = s;
103 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000104}
105
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200106int do_migrate_cancel(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000107{
108 MigrationState *s = current_migration;
109
110 if (s)
aliguoriff8d81d2008-10-24 22:10:31 +0000111 s->cancel(s);
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200112
113 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000114}
115
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200116int do_migrate_set_speed(Monitor *mon, const QDict *qdict, QObject **ret_data)
aliguori5bb79102008-10-13 03:12:02 +0000117{
118 double d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400119 FdMigrationState *s;
aliguori5bb79102008-10-13 03:12:02 +0000120
Markus Armbruster5667c492010-01-25 14:23:04 +0100121 d = qdict_get_double(qdict, "value");
122 d = MAX(0, MIN(UINT32_MAX, d));
123 max_throttle = d;
Glauber Costadaa91de2009-05-20 18:26:58 -0400124
Jan Kiszka5d39c792009-11-30 18:21:19 +0100125 s = migrate_to_fms(current_migration);
126 if (s && s->file) {
Glauber Costadaa91de2009-05-20 18:26:58 -0400127 qemu_file_set_rate_limit(s->file, max_throttle);
128 }
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200129
130 return 0;
aliguori5bb79102008-10-13 03:12:02 +0000131}
132
/*
 * Longest downtime we are willing to accept for a migration, in
 * nanoseconds.  Nanoseconds are used because that is the finest resolution
 * get_clock() can deliver; this is an internal unit only, and everything
 * shown to the user must be expressed in seconds.
 *
 * Initial value: 30,000,000 ns.
 */
static uint64_t max_downtime = 30 * 1000 * 1000;

/* Return the currently configured maximum downtime, in nanoseconds. */
uint64_t migrate_max_downtime(void)
{
    return max_downtime;
}
143
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200144int do_migrate_set_downtime(Monitor *mon, const QDict *qdict,
145 QObject **ret_data)
Glauber Costa2ea42952009-05-28 15:22:58 -0400146{
Glauber Costa2ea42952009-05-28 15:22:58 -0400147 double d;
148
Markus Armbrusterb0fbf7d2010-01-25 14:23:07 +0100149 d = qdict_get_double(qdict, "value") * 1e9;
150 d = MAX(0, MIN(UINT64_MAX, d));
Glauber Costa2ea42952009-05-28 15:22:58 -0400151 max_downtime = (uint64_t)d;
Luiz Capitulinoef4b7ee2010-02-10 23:49:48 -0200152
153 return 0;
Glauber Costa2ea42952009-05-28 15:22:58 -0400154}
155
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200156static void migrate_print_status(Monitor *mon, const char *name,
157 const QDict *status_dict)
aliguori5bb79102008-10-13 03:12:02 +0000158{
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200159 QDict *qdict;
160
161 qdict = qobject_to_qdict(qdict_get(status_dict, name));
162
163 monitor_printf(mon, "transferred %s: %" PRIu64 " kbytes\n", name,
164 qdict_get_int(qdict, "transferred") >> 10);
165 monitor_printf(mon, "remaining %s: %" PRIu64 " kbytes\n", name,
166 qdict_get_int(qdict, "remaining") >> 10);
167 monitor_printf(mon, "total %s: %" PRIu64 " kbytes\n", name,
168 qdict_get_int(qdict, "total") >> 10);
169}
170
171void do_info_migrate_print(Monitor *mon, const QObject *data)
172{
173 QDict *qdict;
174
175 qdict = qobject_to_qdict(data);
176
177 monitor_printf(mon, "Migration status: %s\n",
178 qdict_get_str(qdict, "status"));
179
180 if (qdict_haskey(qdict, "ram")) {
181 migrate_print_status(mon, "ram", qdict);
182 }
183
184 if (qdict_haskey(qdict, "disk")) {
185 migrate_print_status(mon, "disk", qdict);
186 }
187}
188
189static void migrate_put_status(QDict *qdict, const char *name,
190 uint64_t trans, uint64_t rem, uint64_t total)
191{
192 QObject *obj;
193
194 obj = qobject_from_jsonf("{ 'transferred': %" PRId64 ", "
195 "'remaining': %" PRId64 ", "
196 "'total': %" PRId64 " }", trans, rem, total);
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200197 qdict_put_obj(qdict, name, obj);
198}
199
200/**
201 * do_info_migrate(): Migration status
202 *
203 * Return a QDict. If migration is active there will be another
204 * QDict with RAM migration status and if block migration is active
205 * another one with block migration status.
206 *
207 * The main QDict contains the following:
208 *
209 * - "status": migration status
210 * - "ram": only present if "status" is "active", it is a QDict with the
211 * following RAM information (in bytes):
212 * - "transferred": amount transferred
213 * - "remaining": amount remaining
214 * - "total": total
215 * - "disk": only present if "status" is "active" and it is a block migration,
216 * it is a QDict with the following disk information (in bytes):
217 * - "transferred": amount transferred
218 * - "remaining": amount remaining
219 * - "total": total
220 *
221 * Examples:
222 *
223 * 1. Migration is "completed":
224 *
225 * { "status": "completed" }
226 *
227 * 2. Migration is "active" and it is not a block migration:
228 *
229 * { "status": "active",
230 * "ram": { "transferred": 123, "remaining": 123, "total": 246 } }
231 *
232 * 3. Migration is "active" and it is a block migration:
233 *
234 * { "status": "active",
235 * "ram": { "total": 1057024, "remaining": 1053304, "transferred": 3720 },
236 * "disk": { "total": 20971520, "remaining": 20880384, "transferred": 91136 }}
237 */
238void do_info_migrate(Monitor *mon, QObject **ret_data)
239{
240 QDict *qdict;
aliguori5bb79102008-10-13 03:12:02 +0000241 MigrationState *s = current_migration;
aliguori376253e2009-03-05 23:01:23 +0000242
aliguori5bb79102008-10-13 03:12:02 +0000243 if (s) {
aliguoriff8d81d2008-10-24 22:10:31 +0000244 switch (s->get_status(s)) {
245 case MIG_STATE_ACTIVE:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200246 qdict = qdict_new();
247 qdict_put(qdict, "status", qstring_from_str("active"));
248
249 migrate_put_status(qdict, "ram", ram_bytes_transferred(),
250 ram_bytes_remaining(), ram_bytes_total());
251
Jan Kiszka25f23642009-11-30 18:21:21 +0100252 if (blk_mig_active()) {
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200253 migrate_put_status(qdict, "disk", blk_mig_bytes_transferred(),
254 blk_mig_bytes_remaining(),
255 blk_mig_bytes_total());
Jan Kiszka25f23642009-11-30 18:21:21 +0100256 }
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200257
258 *ret_data = QOBJECT(qdict);
aliguoriff8d81d2008-10-24 22:10:31 +0000259 break;
260 case MIG_STATE_COMPLETED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200261 *ret_data = qobject_from_jsonf("{ 'status': 'completed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000262 break;
263 case MIG_STATE_ERROR:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200264 *ret_data = qobject_from_jsonf("{ 'status': 'failed' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000265 break;
266 case MIG_STATE_CANCELLED:
Luiz Capitulinoc86a6682009-12-10 17:16:05 -0200267 *ret_data = qobject_from_jsonf("{ 'status': 'cancelled' }");
aliguoriff8d81d2008-10-24 22:10:31 +0000268 break;
269 }
aliguori5bb79102008-10-13 03:12:02 +0000270 }
271}
272
aliguori065e2812008-11-11 16:46:33 +0000273/* shared migration helpers */
274
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100275void migrate_fd_monitor_suspend(FdMigrationState *s, Monitor *mon)
aliguori731b0362009-03-05 23:01:42 +0000276{
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100277 s->mon = mon;
278 if (monitor_suspend(mon) == 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300279 DPRINTF("suspending monitor\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100280 } else {
281 monitor_printf(mon, "terminal does not allow synchronous "
aliguoricde76ee2009-03-05 23:01:51 +0000282 "migration, continuing detached\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100283 }
aliguori731b0362009-03-05 23:01:42 +0000284}
285
aliguori065e2812008-11-11 16:46:33 +0000286void migrate_fd_error(FdMigrationState *s)
287{
malcd0f2c4c2010-02-07 02:03:50 +0300288 DPRINTF("setting error state\n");
aliguori065e2812008-11-11 16:46:33 +0000289 s->state = MIG_STATE_ERROR;
290 migrate_fd_cleanup(s);
291}
292
293void migrate_fd_cleanup(FdMigrationState *s)
294{
295 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
296
297 if (s->file) {
malcd0f2c4c2010-02-07 02:03:50 +0300298 DPRINTF("closing file\n");
aliguori065e2812008-11-11 16:46:33 +0000299 qemu_fclose(s->file);
Jan Kiszka5d39c792009-11-30 18:21:19 +0100300 s->file = NULL;
aliguori065e2812008-11-11 16:46:33 +0000301 }
302
303 if (s->fd != -1)
304 close(s->fd);
305
306 /* Don't resume monitor until we've flushed all of the buffers */
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100307 if (s->mon) {
308 monitor_resume(s->mon);
309 }
aliguori065e2812008-11-11 16:46:33 +0000310
311 s->fd = -1;
312}
313
314void migrate_fd_put_notify(void *opaque)
315{
316 FdMigrationState *s = opaque;
317
318 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
319 qemu_file_put_notify(s->file);
320}
321
322ssize_t migrate_fd_put_buffer(void *opaque, const void *data, size_t size)
323{
324 FdMigrationState *s = opaque;
325 ssize_t ret;
326
327 do {
328 ret = s->write(s, data, size);
Uri Lublin95b134e2009-05-19 14:08:53 +0300329 } while (ret == -1 && ((s->get_error(s)) == EINTR));
aliguori065e2812008-11-11 16:46:33 +0000330
331 if (ret == -1)
332 ret = -(s->get_error(s));
333
334 if (ret == -EAGAIN)
335 qemu_set_fd_handler2(s->fd, NULL, NULL, migrate_fd_put_notify, s);
336
337 return ret;
338}
339
340void migrate_fd_connect(FdMigrationState *s)
341{
342 int ret;
343
344 s->file = qemu_fopen_ops_buffered(s,
345 s->bandwidth_limit,
346 migrate_fd_put_buffer,
347 migrate_fd_put_ready,
348 migrate_fd_wait_for_unfreeze,
349 migrate_fd_close);
350
malcd0f2c4c2010-02-07 02:03:50 +0300351 DPRINTF("beginning savevm\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100352 ret = qemu_savevm_state_begin(s->mon, s->file, s->mig_state.blk,
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200353 s->mig_state.shared);
aliguori065e2812008-11-11 16:46:33 +0000354 if (ret < 0) {
malcd0f2c4c2010-02-07 02:03:50 +0300355 DPRINTF("failed, %d\n", ret);
aliguori065e2812008-11-11 16:46:33 +0000356 migrate_fd_error(s);
357 return;
358 }
lirans@il.ibm.comc163b5c2009-11-02 15:40:58 +0200359
aliguori065e2812008-11-11 16:46:33 +0000360 migrate_fd_put_ready(s);
361}
362
363void migrate_fd_put_ready(void *opaque)
364{
365 FdMigrationState *s = opaque;
366
367 if (s->state != MIG_STATE_ACTIVE) {
malcd0f2c4c2010-02-07 02:03:50 +0300368 DPRINTF("put_ready returning because of non-active state\n");
aliguori065e2812008-11-11 16:46:33 +0000369 return;
370 }
371
malcd0f2c4c2010-02-07 02:03:50 +0300372 DPRINTF("iterate\n");
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100373 if (qemu_savevm_state_iterate(s->mon, s->file) == 1) {
aliguorib161d122009-04-05 19:30:33 +0000374 int state;
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500375 int old_vm_running = vm_running;
376
malcd0f2c4c2010-02-07 02:03:50 +0300377 DPRINTF("done iterating\n");
aliguori065e2812008-11-11 16:46:33 +0000378 vm_stop(0);
379
Glauber Costa08846572009-07-06 09:32:09 -0400380 qemu_aio_flush();
aliguori065e2812008-11-11 16:46:33 +0000381 bdrv_flush_all();
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100382 if ((qemu_savevm_state_complete(s->mon, s->file)) < 0) {
Anthony Liguorieeb34af2009-07-09 13:25:47 -0500383 if (old_vm_running) {
384 vm_start();
385 }
aliguorib161d122009-04-05 19:30:33 +0000386 state = MIG_STATE_ERROR;
387 } else {
388 state = MIG_STATE_COMPLETED;
389 }
aliguori065e2812008-11-11 16:46:33 +0000390 migrate_fd_cleanup(s);
aliguorib161d122009-04-05 19:30:33 +0000391 s->state = state;
aliguori065e2812008-11-11 16:46:33 +0000392 }
393}
394
395int migrate_fd_get_status(MigrationState *mig_state)
396{
397 FdMigrationState *s = migrate_to_fms(mig_state);
398 return s->state;
399}
400
401void migrate_fd_cancel(MigrationState *mig_state)
402{
403 FdMigrationState *s = migrate_to_fms(mig_state);
404
405 if (s->state != MIG_STATE_ACTIVE)
406 return;
407
malcd0f2c4c2010-02-07 02:03:50 +0300408 DPRINTF("cancelling migration\n");
aliguori065e2812008-11-11 16:46:33 +0000409
410 s->state = MIG_STATE_CANCELLED;
Jan Kiszkaf327aa02009-11-30 18:21:21 +0100411 qemu_savevm_state_cancel(s->mon, s->file);
aliguori065e2812008-11-11 16:46:33 +0000412
413 migrate_fd_cleanup(s);
414}
415
416void migrate_fd_release(MigrationState *mig_state)
417{
418 FdMigrationState *s = migrate_to_fms(mig_state);
419
malcd0f2c4c2010-02-07 02:03:50 +0300420 DPRINTF("releasing state\n");
aliguori065e2812008-11-11 16:46:33 +0000421
422 if (s->state == MIG_STATE_ACTIVE) {
423 s->state = MIG_STATE_CANCELLED;
424 migrate_fd_cleanup(s);
425 }
426 free(s);
427}
428
429void migrate_fd_wait_for_unfreeze(void *opaque)
430{
431 FdMigrationState *s = opaque;
432 int ret;
433
malcd0f2c4c2010-02-07 02:03:50 +0300434 DPRINTF("wait for unfreeze\n");
aliguori065e2812008-11-11 16:46:33 +0000435 if (s->state != MIG_STATE_ACTIVE)
436 return;
437
438 do {
439 fd_set wfds;
440
441 FD_ZERO(&wfds);
442 FD_SET(s->fd, &wfds);
443
444 ret = select(s->fd + 1, NULL, &wfds, NULL, NULL);
445 } while (ret == -1 && (s->get_error(s)) == EINTR);
446}
447
448int migrate_fd_close(void *opaque)
449{
450 FdMigrationState *s = opaque;
Uri Lubline19252d2009-06-08 14:28:01 +0300451
452 qemu_set_fd_handler2(s->fd, NULL, NULL, NULL, NULL);
aliguori065e2812008-11-11 16:46:33 +0000453 return s->close(s);
454}