Statistics
| Branch: | Revision:

root / migration.c @ e659586e

History | View | Annotate | Download (21 kB)

1
/*
2
 * QEMU live migration
3
 *
4
 * Copyright IBM, Corp. 2008
5
 *
6
 * Authors:
7
 *  Anthony Liguori   <aliguori@us.ibm.com>
8
 *
9
 * This work is licensed under the terms of the GNU GPL, version 2.  See
10
 * the COPYING file in the top-level directory.
11
 *
12
 * Contributions after 2012-01-13 are licensed under the terms of the
13
 * GNU GPL, version 2 or (at your option) any later version.
14
 */
15

    
16
#include "qemu-common.h"
17
#include "migration/migration.h"
18
#include "monitor/monitor.h"
19
#include "migration/qemu-file.h"
20
#include "sysemu/sysemu.h"
21
#include "block/block.h"
22
#include "qemu/sockets.h"
23
#include "migration/block.h"
24
#include "qemu/thread.h"
25
#include "qmp-commands.h"
26

    
27
//#define DEBUG_MIGRATION
28

    
29
#ifdef DEBUG_MIGRATION
30
#define DPRINTF(fmt, ...) \
31
    do { printf("migration: " fmt, ## __VA_ARGS__); } while (0)
32
#else
33
#define DPRINTF(fmt, ...) \
34
    do { } while (0)
35
#endif
36

    
37
enum {
38
    MIG_STATE_ERROR,
39
    MIG_STATE_SETUP,
40
    MIG_STATE_CANCELLED,
41
    MIG_STATE_ACTIVE,
42
    MIG_STATE_COMPLETED,
43
};
44

    
45
#define MAX_THROTTLE  (32 << 20)      /* Migration speed throttling */
46

    
47
/* Amount of time to allocate to each "chunk" of bandwidth-throttled
48
 * data. */
49
#define BUFFER_DELAY     100
50
#define XFER_LIMIT_RATIO (1000 / BUFFER_DELAY)
51

    
52
/* Migration XBZRLE default cache size */
53
#define DEFAULT_MIGRATE_CACHE_SIZE (64 * 1024 * 1024)
54

    
55
static NotifierList migration_state_notifiers =
56
    NOTIFIER_LIST_INITIALIZER(migration_state_notifiers);
57

    
58
/* When we add fault tolerance, we could have several
59
   migrations at once.  For now we don't need to add
60
   dynamic creation of migration */
61

    
62
MigrationState *migrate_get_current(void)
63
{
64
    static MigrationState current_migration = {
65
        .state = MIG_STATE_SETUP,
66
        .bandwidth_limit = MAX_THROTTLE,
67
        .xbzrle_cache_size = DEFAULT_MIGRATE_CACHE_SIZE,
68
    };
69

    
70
    return &current_migration;
71
}
72

    
73
void qemu_start_incoming_migration(const char *uri, Error **errp)
74
{
75
    const char *p;
76

    
77
    if (strstart(uri, "tcp:", &p))
78
        tcp_start_incoming_migration(p, errp);
79
#if !defined(WIN32)
80
    else if (strstart(uri, "exec:", &p))
81
        exec_start_incoming_migration(p, errp);
82
    else if (strstart(uri, "unix:", &p))
83
        unix_start_incoming_migration(p, errp);
84
    else if (strstart(uri, "fd:", &p))
85
        fd_start_incoming_migration(p, errp);
86
#endif
87
    else {
88
        error_setg(errp, "unknown migration protocol: %s\n", uri);
89
    }
90
}
91

    
92
static void process_incoming_migration_co(void *opaque)
93
{
94
    QEMUFile *f = opaque;
95
    int ret;
96

    
97
    ret = qemu_loadvm_state(f);
98
    qemu_set_fd_handler(qemu_get_fd(f), NULL, NULL, NULL);
99
    qemu_fclose(f);
100
    if (ret < 0) {
101
        fprintf(stderr, "load of migration failed\n");
102
        exit(0);
103
    }
104
    qemu_announce_self();
105
    DPRINTF("successfully loaded vm state\n");
106

    
107
    bdrv_clear_incoming_migration_all();
108
    /* Make sure all file formats flush their mutable metadata */
109
    bdrv_invalidate_cache_all();
110

    
111
    if (autostart) {
112
        vm_start();
113
    } else {
114
        runstate_set(RUN_STATE_PAUSED);
115
    }
116
}
117

    
118
static void enter_migration_coroutine(void *opaque)
119
{
120
    Coroutine *co = opaque;
121
    qemu_coroutine_enter(co, NULL);
122
}
123

    
124
void process_incoming_migration(QEMUFile *f)
125
{
126
    Coroutine *co = qemu_coroutine_create(process_incoming_migration_co);
127
    int fd = qemu_get_fd(f);
128

    
129
    assert(fd != -1);
130
    socket_set_nonblock(fd);
131
    qemu_set_fd_handler(fd, enter_migration_coroutine, NULL, co);
132
    qemu_coroutine_enter(co, f);
133
}
134

    
135
/* amount of nanoseconds we are willing to wait for migration to be down.
136
 * the choice of nanoseconds is because it is the maximum resolution that
137
 * get_clock() can achieve. It is an internal measure. All user-visible
138
 * units must be in seconds */
139
static uint64_t max_downtime = 30000000;
140

    
141
uint64_t migrate_max_downtime(void)
142
{
143
    return max_downtime;
144
}
145

    
146
MigrationCapabilityStatusList *qmp_query_migrate_capabilities(Error **errp)
147
{
148
    MigrationCapabilityStatusList *head = NULL;
149
    MigrationCapabilityStatusList *caps;
150
    MigrationState *s = migrate_get_current();
151
    int i;
152

    
153
    for (i = 0; i < MIGRATION_CAPABILITY_MAX; i++) {
154
        if (head == NULL) {
155
            head = g_malloc0(sizeof(*caps));
156
            caps = head;
157
        } else {
158
            caps->next = g_malloc0(sizeof(*caps));
159
            caps = caps->next;
160
        }
161
        caps->value =
162
            g_malloc(sizeof(*caps->value));
163
        caps->value->capability = i;
164
        caps->value->state = s->enabled_capabilities[i];
165
    }
166

    
167
    return head;
168
}
169

    
170
static void get_xbzrle_cache_stats(MigrationInfo *info)
171
{
172
    if (migrate_use_xbzrle()) {
173
        info->has_xbzrle_cache = true;
174
        info->xbzrle_cache = g_malloc0(sizeof(*info->xbzrle_cache));
175
        info->xbzrle_cache->cache_size = migrate_xbzrle_cache_size();
176
        info->xbzrle_cache->bytes = xbzrle_mig_bytes_transferred();
177
        info->xbzrle_cache->pages = xbzrle_mig_pages_transferred();
178
        info->xbzrle_cache->cache_miss = xbzrle_mig_pages_cache_miss();
179
        info->xbzrle_cache->overflow = xbzrle_mig_pages_overflow();
180
    }
181
}
182

    
183
MigrationInfo *qmp_query_migrate(Error **errp)
184
{
185
    MigrationInfo *info = g_malloc0(sizeof(*info));
186
    MigrationState *s = migrate_get_current();
187

    
188
    switch (s->state) {
189
    case MIG_STATE_SETUP:
190
        /* no migration has happened ever */
191
        break;
192
    case MIG_STATE_ACTIVE:
193
        info->has_status = true;
194
        info->status = g_strdup("active");
195
        info->has_total_time = true;
196
        info->total_time = qemu_get_clock_ms(rt_clock)
197
            - s->total_time;
198
        info->has_expected_downtime = true;
199
        info->expected_downtime = s->expected_downtime;
200

    
201
        info->has_ram = true;
202
        info->ram = g_malloc0(sizeof(*info->ram));
203
        info->ram->transferred = ram_bytes_transferred();
204
        info->ram->remaining = ram_bytes_remaining();
205
        info->ram->total = ram_bytes_total();
206
        info->ram->duplicate = dup_mig_pages_transferred();
207
        info->ram->normal = norm_mig_pages_transferred();
208
        info->ram->normal_bytes = norm_mig_bytes_transferred();
209
        info->ram->dirty_pages_rate = s->dirty_pages_rate;
210

    
211

    
212
        if (blk_mig_active()) {
213
            info->has_disk = true;
214
            info->disk = g_malloc0(sizeof(*info->disk));
215
            info->disk->transferred = blk_mig_bytes_transferred();
216
            info->disk->remaining = blk_mig_bytes_remaining();
217
            info->disk->total = blk_mig_bytes_total();
218
        }
219

    
220
        get_xbzrle_cache_stats(info);
221
        break;
222
    case MIG_STATE_COMPLETED:
223
        get_xbzrle_cache_stats(info);
224

    
225
        info->has_status = true;
226
        info->status = g_strdup("completed");
227
        info->total_time = s->total_time;
228
        info->has_downtime = true;
229
        info->downtime = s->downtime;
230

    
231
        info->has_ram = true;
232
        info->ram = g_malloc0(sizeof(*info->ram));
233
        info->ram->transferred = ram_bytes_transferred();
234
        info->ram->remaining = 0;
235
        info->ram->total = ram_bytes_total();
236
        info->ram->duplicate = dup_mig_pages_transferred();
237
        info->ram->normal = norm_mig_pages_transferred();
238
        info->ram->normal_bytes = norm_mig_bytes_transferred();
239
        break;
240
    case MIG_STATE_ERROR:
241
        info->has_status = true;
242
        info->status = g_strdup("failed");
243
        break;
244
    case MIG_STATE_CANCELLED:
245
        info->has_status = true;
246
        info->status = g_strdup("cancelled");
247
        break;
248
    }
249

    
250
    return info;
251
}
252

    
253
void qmp_migrate_set_capabilities(MigrationCapabilityStatusList *params,
254
                                  Error **errp)
255
{
256
    MigrationState *s = migrate_get_current();
257
    MigrationCapabilityStatusList *cap;
258

    
259
    if (s->state == MIG_STATE_ACTIVE) {
260
        error_set(errp, QERR_MIGRATION_ACTIVE);
261
        return;
262
    }
263

    
264
    for (cap = params; cap; cap = cap->next) {
265
        s->enabled_capabilities[cap->value->capability] = cap->value->state;
266
    }
267
}
268

    
269
/* shared migration helpers */
270

    
271
static int migrate_fd_cleanup(MigrationState *s)
272
{
273
    int ret = 0;
274

    
275
    if (s->file) {
276
        DPRINTF("closing file\n");
277
        ret = qemu_fclose(s->file);
278
        s->file = NULL;
279
    }
280

    
281
    assert(s->fd == -1);
282
    return ret;
283
}
284

    
285
void migrate_fd_error(MigrationState *s)
286
{
287
    DPRINTF("setting error state\n");
288
    s->state = MIG_STATE_ERROR;
289
    notifier_list_notify(&migration_state_notifiers, s);
290
    migrate_fd_cleanup(s);
291
}
292

    
293
static void migrate_fd_completed(MigrationState *s)
294
{
295
    DPRINTF("setting completed state\n");
296
    if (migrate_fd_cleanup(s) < 0) {
297
        s->state = MIG_STATE_ERROR;
298
    } else {
299
        s->state = MIG_STATE_COMPLETED;
300
        runstate_set(RUN_STATE_POSTMIGRATE);
301
    }
302
    notifier_list_notify(&migration_state_notifiers, s);
303
}
304

    
305
ssize_t migrate_fd_put_buffer(MigrationState *s, const void *data,
306
                              size_t size)
307
{
308
    ssize_t ret;
309

    
310
    if (s->state != MIG_STATE_ACTIVE) {
311
        return -EIO;
312
    }
313

    
314
    do {
315
        ret = s->write(s, data, size);
316
    } while (ret == -1 && ((s->get_error(s)) == EINTR));
317

    
318
    if (ret == -1)
319
        ret = -(s->get_error(s));
320

    
321
    return ret;
322
}
323

    
324
static void migrate_fd_cancel(MigrationState *s)
325
{
326
    if (s->state != MIG_STATE_ACTIVE)
327
        return;
328

    
329
    DPRINTF("cancelling migration\n");
330

    
331
    s->state = MIG_STATE_CANCELLED;
332
    notifier_list_notify(&migration_state_notifiers, s);
333
    qemu_savevm_state_cancel(s->file);
334

    
335
    migrate_fd_cleanup(s);
336
}
337

    
338
int migrate_fd_close(MigrationState *s)
339
{
340
    int rc = 0;
341
    if (s->fd != -1) {
342
        rc = s->close(s);
343
        s->fd = -1;
344
    }
345
    return rc;
346
}
347

    
348
void add_migration_state_change_notifier(Notifier *notify)
349
{
350
    notifier_list_add(&migration_state_notifiers, notify);
351
}
352

    
353
void remove_migration_state_change_notifier(Notifier *notify)
354
{
355
    notifier_remove(notify);
356
}
357

    
358
bool migration_is_active(MigrationState *s)
359
{
360
    return s->state == MIG_STATE_ACTIVE;
361
}
362

    
363
bool migration_has_finished(MigrationState *s)
364
{
365
    return s->state == MIG_STATE_COMPLETED;
366
}
367

    
368
bool migration_has_failed(MigrationState *s)
369
{
370
    return (s->state == MIG_STATE_CANCELLED ||
371
            s->state == MIG_STATE_ERROR);
372
}
373

    
374
static MigrationState *migrate_init(const MigrationParams *params)
375
{
376
    MigrationState *s = migrate_get_current();
377
    int64_t bandwidth_limit = s->bandwidth_limit;
378
    bool enabled_capabilities[MIGRATION_CAPABILITY_MAX];
379
    int64_t xbzrle_cache_size = s->xbzrle_cache_size;
380

    
381
    memcpy(enabled_capabilities, s->enabled_capabilities,
382
           sizeof(enabled_capabilities));
383

    
384
    memset(s, 0, sizeof(*s));
385
    s->bandwidth_limit = bandwidth_limit;
386
    s->params = *params;
387
    memcpy(s->enabled_capabilities, enabled_capabilities,
388
           sizeof(enabled_capabilities));
389
    s->xbzrle_cache_size = xbzrle_cache_size;
390

    
391
    s->bandwidth_limit = bandwidth_limit;
392
    s->state = MIG_STATE_SETUP;
393
    s->total_time = qemu_get_clock_ms(rt_clock);
394

    
395
    return s;
396
}
397

    
398
static GSList *migration_blockers;
399

    
400
void migrate_add_blocker(Error *reason)
401
{
402
    migration_blockers = g_slist_prepend(migration_blockers, reason);
403
}
404

    
405
void migrate_del_blocker(Error *reason)
406
{
407
    migration_blockers = g_slist_remove(migration_blockers, reason);
408
}
409

    
410
void qmp_migrate(const char *uri, bool has_blk, bool blk,
411
                 bool has_inc, bool inc, bool has_detach, bool detach,
412
                 Error **errp)
413
{
414
    Error *local_err = NULL;
415
    MigrationState *s = migrate_get_current();
416
    MigrationParams params;
417
    const char *p;
418

    
419
    params.blk = blk;
420
    params.shared = inc;
421

    
422
    if (s->state == MIG_STATE_ACTIVE) {
423
        error_set(errp, QERR_MIGRATION_ACTIVE);
424
        return;
425
    }
426

    
427
    if (qemu_savevm_state_blocked(errp)) {
428
        return;
429
    }
430

    
431
    if (migration_blockers) {
432
        *errp = error_copy(migration_blockers->data);
433
        return;
434
    }
435

    
436
    s = migrate_init(&params);
437

    
438
    if (strstart(uri, "tcp:", &p)) {
439
        tcp_start_outgoing_migration(s, p, &local_err);
440
#if !defined(WIN32)
441
    } else if (strstart(uri, "exec:", &p)) {
442
        exec_start_outgoing_migration(s, p, &local_err);
443
    } else if (strstart(uri, "unix:", &p)) {
444
        unix_start_outgoing_migration(s, p, &local_err);
445
    } else if (strstart(uri, "fd:", &p)) {
446
        fd_start_outgoing_migration(s, p, &local_err);
447
#endif
448
    } else {
449
        error_set(errp, QERR_INVALID_PARAMETER_VALUE, "uri", "a valid migration protocol");
450
        return;
451
    }
452

    
453
    if (local_err) {
454
        migrate_fd_error(s);
455
        error_propagate(errp, local_err);
456
        return;
457
    }
458
}
459

    
460
void qmp_migrate_cancel(Error **errp)
461
{
462
    migrate_fd_cancel(migrate_get_current());
463
}
464

    
465
void qmp_migrate_set_cache_size(int64_t value, Error **errp)
466
{
467
    MigrationState *s = migrate_get_current();
468

    
469
    /* Check for truncation */
470
    if (value != (size_t)value) {
471
        error_set(errp, QERR_INVALID_PARAMETER_VALUE, "cache size",
472
                  "exceeding address space");
473
        return;
474
    }
475

    
476
    s->xbzrle_cache_size = xbzrle_cache_resize(value);
477
}
478

    
479
int64_t qmp_query_migrate_cache_size(Error **errp)
480
{
481
    return migrate_xbzrle_cache_size();
482
}
483

    
484
void qmp_migrate_set_speed(int64_t value, Error **errp)
485
{
486
    MigrationState *s;
487

    
488
    if (value < 0) {
489
        value = 0;
490
    }
491

    
492
    s = migrate_get_current();
493
    s->bandwidth_limit = value;
494
    qemu_file_set_rate_limit(s->file, s->bandwidth_limit);
495
}
496

    
497
void qmp_migrate_set_downtime(double value, Error **errp)
498
{
499
    value *= 1e9;
500
    value = MAX(0, MIN(UINT64_MAX, value));
501
    max_downtime = (uint64_t)value;
502
}
503

    
504
int migrate_use_xbzrle(void)
505
{
506
    MigrationState *s;
507

    
508
    s = migrate_get_current();
509

    
510
    return s->enabled_capabilities[MIGRATION_CAPABILITY_XBZRLE];
511
}
512

    
513
int64_t migrate_xbzrle_cache_size(void)
514
{
515
    MigrationState *s;
516

    
517
    s = migrate_get_current();
518

    
519
    return s->xbzrle_cache_size;
520
}
521

    
522
/* migration thread support */
523

    
524
typedef struct QEMUFileBuffered {
525
    MigrationState *migration_state;
526
    QEMUFile *file;
527
    size_t bytes_xfer;
528
    size_t xfer_limit;
529
    uint8_t *buffer;
530
    size_t buffer_size;
531
    size_t buffer_capacity;
532
    QemuThread thread;
533
} QEMUFileBuffered;
534

    
535
static ssize_t buffered_flush(QEMUFileBuffered *s)
536
{
537
    size_t offset = 0;
538
    ssize_t ret = 0;
539

    
540
    DPRINTF("flushing %zu byte(s) of data\n", s->buffer_size);
541

    
542
    while (s->bytes_xfer < s->xfer_limit && offset < s->buffer_size) {
543
        size_t to_send = MIN(s->buffer_size - offset, s->xfer_limit - s->bytes_xfer);
544
        ret = migrate_fd_put_buffer(s->migration_state, s->buffer + offset,
545
                                    to_send);
546
        if (ret <= 0) {
547
            DPRINTF("error flushing data, %zd\n", ret);
548
            break;
549
        } else {
550
            DPRINTF("flushed %zd byte(s)\n", ret);
551
            offset += ret;
552
            s->bytes_xfer += ret;
553
        }
554
    }
555

    
556
    DPRINTF("flushed %zu of %zu byte(s)\n", offset, s->buffer_size);
557
    memmove(s->buffer, s->buffer + offset, s->buffer_size - offset);
558
    s->buffer_size -= offset;
559

    
560
    if (ret < 0) {
561
        return ret;
562
    }
563
    return offset;
564
}
565

    
566
static int buffered_put_buffer(void *opaque, const uint8_t *buf,
567
                               int64_t pos, int size)
568
{
569
    QEMUFileBuffered *s = opaque;
570
    ssize_t error;
571

    
572
    DPRINTF("putting %d bytes at %" PRId64 "\n", size, pos);
573

    
574
    error = qemu_file_get_error(s->file);
575
    if (error) {
576
        DPRINTF("flush when error, bailing: %s\n", strerror(-error));
577
        return error;
578
    }
579

    
580
    if (size <= 0) {
581
        return size;
582
    }
583

    
584
    if (size > (s->buffer_capacity - s->buffer_size)) {
585
        DPRINTF("increasing buffer capacity from %zu by %zu\n",
586
                s->buffer_capacity, size + 1024);
587

    
588
        s->buffer_capacity += size + 1024;
589

    
590
        s->buffer = g_realloc(s->buffer, s->buffer_capacity);
591
    }
592

    
593
    memcpy(s->buffer + s->buffer_size, buf, size);
594
    s->buffer_size += size;
595

    
596
    return size;
597
}
598

    
599
static int buffered_close(void *opaque)
600
{
601
    QEMUFileBuffered *s = opaque;
602
    ssize_t ret = 0;
603
    int ret2;
604

    
605
    DPRINTF("closing\n");
606

    
607
    s->xfer_limit = INT_MAX;
608
    while (!qemu_file_get_error(s->file) && s->buffer_size) {
609
        ret = buffered_flush(s);
610
        if (ret < 0) {
611
            break;
612
        }
613
    }
614

    
615
    ret2 = migrate_fd_close(s->migration_state);
616
    if (ret >= 0) {
617
        ret = ret2;
618
    }
619
    ret = migrate_fd_close(s->migration_state);
620
    s->migration_state->complete = true;
621
    return ret;
622
}
623

    
624
static int buffered_get_fd(void *opaque)
625
{
626
    QEMUFileBuffered *s = opaque;
627

    
628
    return s->migration_state->fd;
629
}
630

    
631
/*
632
 * The meaning of the return values is:
633
 *   0: We can continue sending
634
 *   1: Time to stop
635
 *   negative: There has been an error
636
 */
637
static int buffered_rate_limit(void *opaque)
638
{
639
    QEMUFileBuffered *s = opaque;
640
    int ret;
641

    
642
    ret = qemu_file_get_error(s->file);
643
    if (ret) {
644
        return ret;
645
    }
646

    
647
    if (s->bytes_xfer > s->xfer_limit) {
648
        return 1;
649
    }
650

    
651
    return 0;
652
}
653

    
654
static int64_t buffered_set_rate_limit(void *opaque, int64_t new_rate)
655
{
656
    QEMUFileBuffered *s = opaque;
657
    if (qemu_file_get_error(s->file)) {
658
        goto out;
659
    }
660
    if (new_rate > SIZE_MAX) {
661
        new_rate = SIZE_MAX;
662
    }
663

    
664
    s->xfer_limit = new_rate / 10;
665

    
666
out:
667
    return s->xfer_limit;
668
}
669

    
670
static int64_t buffered_get_rate_limit(void *opaque)
671
{
672
    QEMUFileBuffered *s = opaque;
673

    
674
    return s->xfer_limit;
675
}
676

    
677
static bool migrate_fd_put_ready(MigrationState *s, uint64_t max_size)
678
{
679
    int ret;
680
    uint64_t pending_size;
681
    bool last_round = false;
682

    
683
    qemu_mutex_lock_iothread();
684
    if (s->state != MIG_STATE_ACTIVE) {
685
        DPRINTF("put_ready returning because of non-active state\n");
686
        qemu_mutex_unlock_iothread();
687
        return false;
688
    }
689
    if (s->first_time) {
690
        s->first_time = false;
691
        DPRINTF("beginning savevm\n");
692
        ret = qemu_savevm_state_begin(s->file, &s->params);
693
        if (ret < 0) {
694
            DPRINTF("failed, %d\n", ret);
695
            migrate_fd_error(s);
696
            qemu_mutex_unlock_iothread();
697
            return false;
698
        }
699
    }
700

    
701
    DPRINTF("iterate\n");
702
    pending_size = qemu_savevm_state_pending(s->file, max_size);
703
    DPRINTF("pending size %lu max %lu\n", pending_size, max_size);
704
    if (pending_size >= max_size) {
705
        ret = qemu_savevm_state_iterate(s->file);
706
        if (ret < 0) {
707
            migrate_fd_error(s);
708
        }
709
    } else {
710
        int old_vm_running = runstate_is_running();
711
        int64_t start_time, end_time;
712

    
713
        DPRINTF("done iterating\n");
714
        start_time = qemu_get_clock_ms(rt_clock);
715
        qemu_system_wakeup_request(QEMU_WAKEUP_REASON_OTHER);
716
        if (old_vm_running) {
717
            vm_stop(RUN_STATE_FINISH_MIGRATE);
718
        } else {
719
            vm_stop_force_state(RUN_STATE_FINISH_MIGRATE);
720
        }
721

    
722
        if (qemu_savevm_state_complete(s->file) < 0) {
723
            migrate_fd_error(s);
724
        } else {
725
            migrate_fd_completed(s);
726
        }
727
        end_time = qemu_get_clock_ms(rt_clock);
728
        s->total_time = end_time - s->total_time;
729
        s->downtime = end_time - start_time;
730
        if (s->state != MIG_STATE_COMPLETED) {
731
            if (old_vm_running) {
732
                vm_start();
733
            }
734
        }
735
        last_round = true;
736
    }
737
    qemu_mutex_unlock_iothread();
738

    
739
    return last_round;
740
}
741

    
742
static void *buffered_file_thread(void *opaque)
743
{
744
    QEMUFileBuffered *s = opaque;
745
    int64_t initial_time = qemu_get_clock_ms(rt_clock);
746
    int64_t max_size = 0;
747
    bool last_round = false;
748

    
749
    while (true) {
750
        int64_t current_time = qemu_get_clock_ms(rt_clock);
751

    
752
        if (s->migration_state->complete) {
753
            break;
754
        }
755
        if (current_time >= initial_time + BUFFER_DELAY) {
756
            uint64_t transferred_bytes = s->bytes_xfer;
757
            uint64_t time_spent = current_time - initial_time;
758
            double bandwidth = transferred_bytes / time_spent;
759
            max_size = bandwidth * migrate_max_downtime() / 1000000;
760

    
761
            DPRINTF("transferred %" PRIu64 " time_spent %" PRIu64
762
                    " bandwidth %g max_size %" PRId64 "\n",
763
                    transferred_bytes, time_spent, bandwidth, max_size);
764

    
765
            s->bytes_xfer = 0;
766
            initial_time = current_time;
767
        }
768
        if (!last_round && (s->bytes_xfer >= s->xfer_limit)) {
769
            /* usleep expects microseconds */
770
            g_usleep((initial_time + BUFFER_DELAY - current_time)*1000);
771
        }
772
        if (buffered_flush(s) < 0) {
773
            break;
774
        }
775

    
776
        DPRINTF("file is ready\n");
777
        if (s->bytes_xfer < s->xfer_limit) {
778
            DPRINTF("notifying client\n");
779
            last_round = migrate_fd_put_ready(s->migration_state, max_size);
780
        }
781
    }
782

    
783
    g_free(s->buffer);
784
    g_free(s);
785
    return NULL;
786
}
787

    
788
static const QEMUFileOps buffered_file_ops = {
789
    .get_fd =         buffered_get_fd,
790
    .put_buffer =     buffered_put_buffer,
791
    .close =          buffered_close,
792
    .rate_limit =     buffered_rate_limit,
793
    .get_rate_limit = buffered_get_rate_limit,
794
    .set_rate_limit = buffered_set_rate_limit,
795
};
796

    
797
void migrate_fd_connect(MigrationState *migration_state)
798
{
799
    QEMUFileBuffered *s;
800

    
801
    migration_state->state = MIG_STATE_ACTIVE;
802
    migration_state->first_time = true;
803
    s = g_malloc0(sizeof(*s));
804

    
805
    s->migration_state = migration_state;
806
    s->xfer_limit = s->migration_state->bandwidth_limit / XFER_LIMIT_RATIO;
807
    s->migration_state->complete = false;
808

    
809
    s->file = qemu_fopen_ops(s, &buffered_file_ops);
810

    
811
    migration_state->file = s->file;
812

    
813
    qemu_thread_create(&s->thread, buffered_file_thread, s,
814
                       QEMU_THREAD_DETACHED);
815
    notifier_list_notify(&migration_state_notifiers, s);
816
}