/*
 * QEMU live migration
 *
 * Copyright IBM, Corp. 2008
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */

#ifndef QEMU_MIGRATION_H
#define QEMU_MIGRATION_H

#include "qapi/qmp/qdict.h"
#include "qemu-common.h"
#include "qemu/thread.h"
#include "qemu/notify.h"
#include "migration/vmstate.h"
#include "qapi-types.h"
#include "exec/cpu-common.h"
#include "qemu/coroutine_int.h"
#include "qom/object.h"

/*
 * Migration stream identification.  The magic value spells the ASCII
 * bytes 'Q' 'E' 'V' 'M' (0x51 0x45 0x56 0x4d).
 */
#define QEMU_VM_FILE_MAGIC           0x5145564d
#define QEMU_VM_FILE_VERSION_COMPAT  0x00000002
#define QEMU_VM_FILE_VERSION         0x00000003

/*
 * Tag values used in the migration stream; every value fits in one byte.
 * NOTE(review): presumably emitted/consumed as section markers by savevm.c
 * -- confirm there before relying on the exact framing.
 */
#define QEMU_VM_EOF                  0x00
#define QEMU_VM_SECTION_START        0x01
#define QEMU_VM_SECTION_PART         0x02
#define QEMU_VM_SECTION_END          0x03
#define QEMU_VM_SECTION_FULL         0x04
#define QEMU_VM_SUBSECTION           0x05
#define QEMU_VM_VMDESCRIPTION        0x06
#define QEMU_VM_CONFIGURATION        0x07
#define QEMU_VM_COMMAND              0x08
#define QEMU_VM_SECTION_FOOTER       0x7e

/*
 * Declared here for vl.c; this is only an extern declaration, the
 * definition lives in a .c file outside this header.
 */
extern int only_migratable;

/*
 * Old-style migration parameters; MigrationState.params holds one of these
 * for the 'migrate' command.
 */
struct MigrationParams {
    /* NOTE(review): presumably "block migration requested" -- confirm */
    bool blk;
    /* NOTE(review): presumably "shared/incremental block storage" -- confirm */
    bool shared;
};

/*
 * Messages sent on the return path from destination to source.
 * Enumerators are numbered consecutively from 0; MIG_RP_MSG_MAX is one past
 * the last real message type.
 */
enum mig_rp_message_type {
    MIG_RP_MSG_INVALID = 0,  /* Must be 0 */
    MIG_RP_MSG_SHUT,         /* sibling will not send any more RP messages */
    MIG_RP_MSG_PONG,         /* Response to a PING; data (seq: be32 ) */

    MIG_RP_MSG_REQ_PAGES_ID, /* data (start: be64, len: be32, id: string) */
    MIG_RP_MSG_REQ_PAGES,    /* data (start: be64, len: be32) */

    MIG_RP_MSG_MAX
};

62
typedef QLIST_HEAD(, LoadStateEntry) LoadStateEntry_Head;
63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85

/*
 * Incoming postcopy state.
 *
 * Access:
 *  - read and written through postcopy_state_get()/postcopy_state_set(),
 *    which update it atomically;
 *  - in general only one thread writes at any one time: first the main
 *    thread, later the listen thread.  The corner cases are either thread
 *    finishing early and/or hitting an error.
 *
 * Uses:
 *  - updated as postcopy messages arrive, and checked on each message to
 *    make sure the source sends them in the correct order;
 *  - consulted by the RAM reception code to decide whether pages must be
 *    placed atomically;
 *  - consulted by the cleanup code at the end of the main thread to decide
 *    whether cleanup has to be delayed until the end of postcopy.
 */
typedef enum {
    /* Initial state - no postcopy */
    POSTCOPY_INCOMING_NONE = 0,
    POSTCOPY_INCOMING_ADVISE,
    POSTCOPY_INCOMING_DISCARD,
    POSTCOPY_INCOMING_LISTENING,
    POSTCOPY_INCOMING_RUNNING,
    POSTCOPY_INCOMING_END,
} PostcopyState;

86 87
/* State for the incoming migration */
struct MigrationIncomingState {
88
    QEMUFile *from_src_file;
89

90 91 92 93 94 95
    /*
     * Free at the start of the main state load, set as the main thread finishes
     * loading state.
     */
    QemuEvent main_thread_load_event;

96
    size_t         largest_page_size;
97
    bool           have_fault_thread;
98 99 100
    QemuThread     fault_thread;
    QemuSemaphore  fault_thread_sem;

101 102 103 104
    bool           have_listen_thread;
    QemuThread     listen_thread;
    QemuSemaphore  listen_thread_sem;

105 106
    /* For the kernel to send us notifications */
    int       userfault_fd;
107 108
    /* To tell the fault_thread to quit */
    int       userfault_quit_fd;
109
    QEMUFile *to_src_file;
110
    QemuMutex rp_mutex;    /* We send replies from multiple threads */
111
    void     *postcopy_tmp_page;
112
    void     *postcopy_tmp_zero_page;
113

114 115
    QEMUBH *bh;

116
    int state;
117 118 119 120 121

    bool have_colo_incoming_thread;
    QemuThread colo_incoming_thread;
    /* The coroutine we should enter (back) after failover */
    Coroutine *migration_incoming_co;
122
    QemuSemaphore colo_incoming_sem;
123

124 125
    /* See savevm.c */
    LoadStateEntry_Head loadvm_handlers;
126 127 128 129 130
};

/*
 * Accessor and teardown for the incoming-migration state.
 * NOTE(review): neither takes an argument, so they presumably operate on a
 * single process-wide MigrationIncomingState -- confirm in migration.c.
 */
MigrationIncomingState *migration_incoming_get_current(void);
void migration_incoming_state_destroy(void);

131
struct MigrationState
132
{
133 134 135
    size_t bytes_xfer;
    size_t xfer_limit;
    QemuThread thread;
136
    QEMUBH *cleanup_bh;
137
    QEMUFile *to_dst_file;
138 139 140

    /* New style params from 'migrate-set-parameters' */
    MigrationParameters parameters;
141 142

    int state;
143
    /* Old style params from 'migrate' command */
I
Isaku Yamahata 已提交
144
    MigrationParams params;
145 146 147 148 149 150 151 152

    /* State related to return path */
    struct {
        QEMUFile     *from_dst_file;
        QemuThread    rp_thread;
        bool          error;
    } rp_state;

153
    double mbps;
J
Juan Quintela 已提交
154
    int64_t total_time;
155
    int64_t downtime;
156
    int64_t expected_downtime;
157
    bool enabled_capabilities[MIGRATION_CAPABILITY__MAX];
158
    int64_t xbzrle_cache_size;
159
    int64_t setup_time;
160 161 162

    /* Flag set once the migration has been asked to enter postcopy */
    bool start_postcopy;
163 164
    /* Flag set after postcopy has sent the device state */
    bool postcopy_after_devices;
165 166 167

    /* Flag set once the migration thread is running (and needs joining) */
    bool migration_thread_running;
168

169 170 171
    /* Flag set once the migration thread called bdrv_inactivate_all */
    bool block_inactive;

172 173
    /* The semaphore is used to notify COLO thread that failover is finished */
    QemuSemaphore colo_exit_sem;
174

175 176 177 178 179
    /* The semaphore is used to notify COLO thread to do checkpoint */
    QemuSemaphore colo_checkpoint_sem;
    int64_t colo_checkpoint_time;
    QEMUTimer *colo_delay_timer;

180 181
    /* The last error that occurred */
    Error *error;
182 183
};

184 185
void migrate_set_state(int *state, int old_state, int new_state);

186
void migration_fd_process_incoming(QEMUFile *f);
187

188
void qemu_start_incoming_migration(const char *uri, Error **errp);
A
aliguori 已提交
189

190 191
void migration_channel_process_incoming(MigrationState *s,
                                        QIOChannel *ioc);
192

193 194 195
void migration_tls_channel_process_incoming(MigrationState *s,
                                            QIOChannel *ioc,
                                            Error **errp);
196

197 198 199
void migration_channel_connect(MigrationState *s,
                               QIOChannel *ioc,
                               const char *hostname);
200

201 202 203 204
void migration_tls_channel_connect(MigrationState *s,
                                   QIOChannel *ioc,
                                   const char *hostname,
                                   Error **errp);
205

206 207
uint64_t migrate_max_downtime(void);

208
void exec_start_incoming_migration(const char *host_port, Error **errp);
209

210
void exec_start_outgoing_migration(MigrationState *s, const char *host_port, Error **errp);
211

212
void tcp_start_incoming_migration(const char *host_port, Error **errp);
A
aliguori 已提交
213

214
void tcp_start_outgoing_migration(MigrationState *s, const char *host_port, Error **errp);
A
aliguori 已提交
215

216
void unix_start_incoming_migration(const char *path, Error **errp);
C
Chris Lalancette 已提交
217

218
void unix_start_outgoing_migration(MigrationState *s, const char *path, Error **errp);
C
Chris Lalancette 已提交
219

220
void fd_start_incoming_migration(const char *path, Error **errp);
P
Paolo Bonzini 已提交
221

222
void fd_start_outgoing_migration(MigrationState *s, const char *fdname, Error **errp);
P
Paolo Bonzini 已提交
223

M
Michael R. Hines 已提交
224 225 226 227
void rdma_start_outgoing_migration(void *opaque, const char *host_port, Error **errp);

void rdma_start_incoming_migration(const char *host_port, Error **errp);

228
void migrate_fd_error(MigrationState *s, const Error *error);
229

230
void migrate_fd_connect(MigrationState *s);
231

232 233
void add_migration_state_change_notifier(Notifier *notify);
void remove_migration_state_change_notifier(Notifier *notify);
234
MigrationState *migrate_init(const MigrationParams *params);
235
bool migration_is_blocked(Error **errp);
S
Stefan Hajnoczi 已提交
236
bool migration_in_setup(MigrationState *);
237
bool migration_is_idle(MigrationState *s);
238
bool migration_has_finished(MigrationState *);
239
bool migration_has_failed(MigrationState *);
240
/* True if outgoing migration has entered postcopy phase */
241
bool migration_in_postcopy(void);
242 243
/* ...and after the device transmission */
bool migration_in_postcopy_after_devices(MigrationState *);
244
MigrationState *migrate_get_current(void);
245

/* Creation/join of the (de)compression worker threads */
void migrate_compress_threads_create(void);
void migrate_compress_threads_join(void);
void migrate_decompress_threads_create(void);
void migrate_decompress_threads_join(void);
/* RAM migration counters; all are argument-less and return uint64_t */
uint64_t ram_bytes_remaining(void);
uint64_t ram_bytes_transferred(void);
uint64_t ram_bytes_total(void);
uint64_t ram_dirty_sync_count(void);
uint64_t ram_dirty_pages_rate(void);
uint64_t ram_postcopy_requests(void);
void free_xbzrle_decoded_buf(void);

258 259
void acct_update_position(QEMUFile *f, size_t size, bool zero);

260 261
uint64_t dup_mig_pages_transferred(void);
uint64_t norm_mig_pages_transferred(void);
O
Orit Wasserman 已提交
262 263 264 265
uint64_t xbzrle_mig_bytes_transferred(void);
uint64_t xbzrle_mig_pages_transferred(void);
uint64_t xbzrle_mig_pages_overflow(void);
uint64_t xbzrle_mig_pages_cache_miss(void);
266
double xbzrle_mig_cache_miss_rate(void);
267

268
void ram_handle_compressed(void *host, uint8_t ch, uint64_t size);
269
void ram_debug_dump_bitmap(unsigned long *todump, bool expected);
270 271 272
/* For outgoing discard bitmap */
int ram_postcopy_send_discard_bitmap(MigrationState *ms);
/* For incoming postcopy discard */
273
int ram_discard_range(const char *block_name, uint64_t start, size_t length);
274
int ram_postcopy_incoming_init(MigrationIncomingState *mis);
275
void ram_postcopy_migrated_memory_release(MigrationState *ms);
276

A
Anthony Liguori 已提交
277 278 279 280
/**
 * @migrate_add_blocker - prevent migration from proceeding
 *
 * @reason - an error to be returned whenever migration is attempted
281 282 283
 *
 * @errp - [out] The reason (if any) we cannot block migration right now.
 *
284
 * @returns - 0 on success, -EBUSY/-EACCES on failure, with errp set.
A
Anthony Liguori 已提交
285
 */
286
int migrate_add_blocker(Error *reason, Error **errp);
A
Anthony Liguori 已提交
287 288 289 290 291 292 293 294

/**
 * @migrate_del_blocker - remove a blocking error from migration
 *
 * @reason - the error blocking migration
 */
void migrate_del_blocker(Error *reason);

295 296
int check_migratable(Object *obj, Error **err);

297
bool migrate_release_ram(void);
298
bool migrate_postcopy_ram(void);
299
bool migrate_zero_blocks(void);
300

301 302
bool migrate_auto_converge(void);

303 304 305 306
int xbzrle_encode_buffer(uint8_t *old_buf, uint8_t *new_buf, int slen,
                         uint8_t *dst, int dlen);
int xbzrle_decode_buffer(uint8_t *src, int slen, uint8_t *dst, int dlen);

/* NOTE(review): returns int although the sibling migrate_use_*() return bool */
int migrate_use_xbzrle(void);
int64_t migrate_xbzrle_cache_size(void);
bool migrate_colo_enabled(void);

int64_t xbzrle_cache_resize(int64_t new_size);

/* Compression settings */
bool migrate_use_compression(void);
int migrate_compress_level(void);
int migrate_compress_threads(void);
int migrate_decompress_threads(void);
bool migrate_use_events(void);

319 320 321 322 323 324 325 326
/* Sending on the return path - generic and then for each message type */
void migrate_send_rp_message(MigrationIncomingState *mis,
                             enum mig_rp_message_type message_type,
                             uint16_t len, void *data);
void migrate_send_rp_shut(MigrationIncomingState *mis,
                          uint32_t value);
void migrate_send_rp_pong(MigrationIncomingState *mis,
                          uint32_t value);
327 328
void migrate_send_rp_req_pages(MigrationIncomingState *mis, const char* rbname,
                              ram_addr_t start, size_t len);
329

/* Hooks around RAM iteration and on load; each receives the stream and flags */
void ram_control_before_iterate(QEMUFile *f, uint64_t flags);
void ram_control_after_iterate(QEMUFile *f, uint64_t flags);
void ram_control_load_hook(QEMUFile *f, uint64_t flags, void *data);

/*
 * Whenever this flag is found in the data stream, the flags are passed to
 * ram_control_load_hook() on the incoming-migration side.  This lets
 * before_ram_iterate/after_ram_iterate add transport-specific sections to
 * the RAM migration data.
 */
#define RAM_SAVE_FLAG_HOOK     0x80

/*
 * Negative sentinel values.  The replacement lists are parenthesized so the
 * leading minus cannot bind to neighbouring tokens at the expansion site.
 * NOTE(review): presumably result codes of ram_control_save_page() -- confirm.
 */
#define RAM_SAVE_CONTROL_NOT_SUPP (-1000)
#define RAM_SAVE_CONTROL_DELAYED  (-2000)

/*
 * Save one page through the transport's control path; *bytes_sent is an
 * output parameter.
 * NOTE(review): the return type is size_t while the RAM_SAVE_CONTROL_*
 * sentinels are negative, so callers presumably compare after conversion --
 * confirm before changing either side.
 */
size_t ram_control_save_page(QEMUFile *f, ram_addr_t block_offset,
                             ram_addr_t offset, size_t size,
                             uint64_t *bytes_sent);

348
void ram_mig_init(void);
349
void savevm_skip_section_footers(void);
350
void register_global_state(void);
351
void global_state_set_optional(void);
352
void savevm_skip_configuration(void);
353
int global_state_store(void);
354
void global_state_store_running(void);
355

356
void migration_page_queue_free(void);
357
int ram_save_queue_pages(const char *rbname, ram_addr_t start, ram_addr_t len);
358
uint64_t ram_pagesize_summary(void);
359

/* Read the current incoming postcopy state */
PostcopyState postcopy_state_get(void);
/* Set the state and return the old state */
PostcopyState postcopy_state_set(PostcopyState new_state);
#endif