/*
 * QEMU System Emulator
 *
 * Copyright (c) 2003-2008 Fabrice Bellard
 * Copyright (c) 2011-2015 Red Hat Inc
 *
 * Authors:
 *  Juan Quintela <quintela@redhat.com>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */

#include "qemu/osdep.h"
#include "cpu.h"
#include <zlib.h>
#include "qemu/cutils.h"
#include "qemu/bitops.h"
#include "qemu/bitmap.h"
#include "qemu/main-loop.h"
#include "qemu/pmem.h"
#include "xbzrle.h"
#include "ram.h"
#include "migration.h"
#include "socket.h"
#include "migration/register.h"
#include "migration/misc.h"
#include "qemu-file.h"
#include "postcopy-ram.h"
#include "page_cache.h"
#include "qemu/error-report.h"
#include "qapi/error.h"
#include "qapi/qapi-events-migration.h"
#include "qapi/qmp/qerror.h"
#include "trace.h"
#include "exec/ram_addr.h"
#include "exec/target_page.h"
#include "qemu/rcu_queue.h"
#include "migration/colo.h"
#include "block.h"
#include "sysemu/sysemu.h"
#include "qemu/uuid.h"
#include "savevm.h"
#include "qemu/iov.h"

/***********************************************************/
/* ram save/restore */

/* RAM_SAVE_FLAG_ZERO used to be named RAM_SAVE_FLAG_COMPRESS, it
 * worked for pages that were filled with the same char.  We switched
 * it to only search for the zero value.  And to avoid confusion with
 * RAM_SAVE_FLAG_COMPRESS_PAGE just rename it.
 */

#define RAM_SAVE_FLAG_FULL     0x01 /* Obsolete, not used anymore */
#define RAM_SAVE_FLAG_ZERO     0x02
#define RAM_SAVE_FLAG_MEM_SIZE 0x04
#define RAM_SAVE_FLAG_PAGE     0x08
#define RAM_SAVE_FLAG_EOS      0x10
#define RAM_SAVE_FLAG_CONTINUE 0x20
#define RAM_SAVE_FLAG_XBZRLE   0x40
/* 0x80 is reserved in migration.h start with 0x100 next */
#define RAM_SAVE_FLAG_COMPRESS_PAGE    0x100

static inline bool is_zero_range(uint8_t *p, uint64_t size)
{
    return buffer_is_zero(p, size);
}

XBZRLECacheStats xbzrle_counters;

/* struct contains XBZRLE cache and a static page
   used by the compression */
static struct {
    /* buffer used for XBZRLE encoding */
    uint8_t *encoded_buf;
    /* buffer for storing page content */
    uint8_t *current_buf;
    /* Cache for XBZRLE, Protected by lock. */
    PageCache *cache;
    QemuMutex lock;
    /* it will store a page full of zeros */
    uint8_t *zero_target_page;
    /* buffer used for XBZRLE decoding */
    uint8_t *decoded_buf;
} XBZRLE;

static void XBZRLE_cache_lock(void)
{
    if (migrate_use_xbzrle())
        qemu_mutex_lock(&XBZRLE.lock);
}

static void XBZRLE_cache_unlock(void)
{
    if (migrate_use_xbzrle())
        qemu_mutex_unlock(&XBZRLE.lock);
}

/**
 * xbzrle_cache_resize: resize the xbzrle cache
 *
 * This function is called from qmp_migrate_set_cache_size in main
 * thread, possibly while a migration is in progress. A running
 * migration may be using the cache and might finish during this call,
 * hence changes to the cache are protected by XBZRLE.lock().
 *
 * Returns 0 for success or -1 for error
 *
 * @new_size: new cache size
 * @errp: set *errp if the check failed, with reason
 */
int xbzrle_cache_resize(int64_t new_size, Error **errp)
{
    PageCache *new_cache;
    int64_t ret = 0;

    /* Check for truncation */
    if (new_size != (size_t)new_size) {
        error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "cache size",
                   "exceeding address space");
        return -1;
    }

    if (new_size == migrate_xbzrle_cache_size()) {
        /* nothing to do */
        return 0;
    }

    XBZRLE_cache_lock();

    if (XBZRLE.cache != NULL) {
        new_cache = cache_init(new_size, TARGET_PAGE_SIZE, errp);
        if (!new_cache) {
            ret = -1;
            goto out;
        }

        cache_fini(XBZRLE.cache);
        XBZRLE.cache = new_cache;
    }
out:
    XBZRLE_cache_unlock();
    return ret;
}

static bool ramblock_is_ignored(RAMBlock *block)
{
    return !qemu_ram_is_migratable(block) ||
           (migrate_ignore_shared() && qemu_ram_is_shared(block));
}

/* Should be holding either ram_list.mutex, or the RCU lock. */
#define RAMBLOCK_FOREACH_NOT_IGNORED(block)            \
    INTERNAL_RAMBLOCK_FOREACH(block)                   \
        if (ramblock_is_ignored(block)) {} else

#define RAMBLOCK_FOREACH_MIGRATABLE(block)             \
    INTERNAL_RAMBLOCK_FOREACH(block)                   \
        if (!qemu_ram_is_migratable(block)) {} else

#undef RAMBLOCK_FOREACH

int foreach_not_ignored_block(RAMBlockIterFunc func, void *opaque)
{
    RAMBlock *block;
    int ret = 0;

    rcu_read_lock();
    RAMBLOCK_FOREACH_NOT_IGNORED(block) {
        ret = func(block, opaque);
        if (ret) {
            break;
        }
    }
    rcu_read_unlock();
    return ret;
}

static void ramblock_recv_map_init(void)
{
    RAMBlock *rb;

    RAMBLOCK_FOREACH_NOT_IGNORED(rb) {
        assert(!rb->receivedmap);
        rb->receivedmap = bitmap_new(rb->max_length >> qemu_target_page_bits());
    }
}

int ramblock_recv_bitmap_test(RAMBlock *rb, void *host_addr)
{
    return test_bit(ramblock_recv_bitmap_offset(host_addr, rb),
                    rb->receivedmap);
}

bool ramblock_recv_bitmap_test_byte_offset(RAMBlock *rb, uint64_t byte_offset)
{
    return test_bit(byte_offset >> TARGET_PAGE_BITS, rb->receivedmap);
}

void ramblock_recv_bitmap_set(RAMBlock *rb, void *host_addr)
{
    set_bit_atomic(ramblock_recv_bitmap_offset(host_addr, rb), rb->receivedmap);
}

void ramblock_recv_bitmap_set_range(RAMBlock *rb, void *host_addr,
                                    size_t nr)
{
    bitmap_set_atomic(rb->receivedmap,
                      ramblock_recv_bitmap_offset(host_addr, rb),
                      nr);
}

#define  RAMBLOCK_RECV_BITMAP_ENDING  (0x0123456789abcdefULL)

/*
 * Format: bitmap_size (8 bytes) + whole_bitmap (N bytes).
 *
 * Returns >0 if success with sent bytes, or <0 if error.
 */
int64_t ramblock_recv_bitmap_send(QEMUFile *file,
                                  const char *block_name)
{
    RAMBlock *block = qemu_ram_block_by_name(block_name);
    unsigned long *le_bitmap, nbits;
    uint64_t size;

    if (!block) {
        error_report("%s: invalid block name: %s", __func__, block_name);
        return -1;
    }

    nbits = block->used_length >> TARGET_PAGE_BITS;

    /*
     * Make sure the tmp bitmap buffer is big enough, e.g., on 32bit
     * machines we may need 4 more bytes for padding (see below
     * comment). So extend it a bit beforehand.
     */
    le_bitmap = bitmap_new(nbits + BITS_PER_LONG);

    /*
     * Always use little endian when sending the bitmap. This is
     * required when the source and destination VMs are not using the
     * same endianness. (Note: big endian won't work.)
     */
262 bitmap_to_le(le_bitmap, block->receivedmap, nbits);
263
264 /* Size of the bitmap, in bytes */
Peter Xua725ef92018-07-10 17:18:55 +0800265 size = DIV_ROUND_UP(nbits, 8);
Peter Xua335deb2018-05-02 18:47:28 +0800266
267 /*
268 * size is always aligned to 8 bytes for 64bit machines, but it
269 * may not be true for 32bit machines. We need this padding to
270 * make sure the migration can survive even between 32bit and
271 * 64bit machines.
272 */
273 size = ROUND_UP(size, 8);
274
275 qemu_put_be64(file, size);
276 qemu_put_buffer(file, (const uint8_t *)le_bitmap, size);
    /*
     * Mark as an end, in case the middle part is screwed up due to
     * some "mysterious" reason.
     */
    qemu_put_be64(file, RAMBLOCK_RECV_BITMAP_ENDING);
    qemu_fflush(file);

    g_free(le_bitmap);

    if (qemu_file_get_error(file)) {
        return qemu_file_get_error(file);
    }

    return size + sizeof(size);
}

/*
 * An outstanding page request, on the source, having been received
 * and queued
 */
struct RAMSrcPageRequest {
    RAMBlock *rb;
    hwaddr    offset;
    hwaddr    len;

    QSIMPLEQ_ENTRY(RAMSrcPageRequest) next_req;
};

/* State of RAM for migration */
struct RAMState {
    /* QEMUFile used for this migration */
    QEMUFile *f;
    /* Last block that we have visited searching for dirty pages */
    RAMBlock *last_seen_block;
    /* Last block from where we have sent data */
    RAMBlock *last_sent_block;
    /* Last dirty target page we have sent */
    ram_addr_t last_page;
    /* last ram version we have seen */
    uint32_t last_version;
    /* We are in the first round */
    bool ram_bulk_stage;
    /* The free page optimization is enabled */
    bool fpo_enabled;
    /* How many times we have dirty too many pages */
    int dirty_rate_high_cnt;
    /* these variables are used for bitmap sync */
    /* last time we did a full bitmap_sync */
    int64_t time_last_bitmap_sync;
    /* bytes transferred at start_time */
    uint64_t bytes_xfer_prev;
    /* number of dirty pages since start_time */
    uint64_t num_dirty_pages_period;
    /* xbzrle misses since the beginning of the period */
    uint64_t xbzrle_cache_miss_prev;

    /* compression statistics since the beginning of the period */
    /* number of times there was no free thread to compress data */
    uint64_t compress_thread_busy_prev;
    /* amount of bytes after compression */
    uint64_t compressed_size_prev;
    /* number of compressed pages */
    uint64_t compress_pages_prev;

    /* total handled target pages at the beginning of period */
    uint64_t target_page_count_prev;
    /* total handled target pages since start */
    uint64_t target_page_count;
    /* number of dirty bits in the bitmap */
    uint64_t migration_dirty_pages;
    /* Protects modification of the bitmap and migration dirty pages */
    QemuMutex bitmap_mutex;
    /* The RAMBlock used in the last src_page_requests */
    RAMBlock *last_req_rb;
    /* Queue of outstanding page requests from the destination */
    QemuMutex src_page_req_mutex;
    QSIMPLEQ_HEAD(, RAMSrcPageRequest) src_page_requests;
};
typedef struct RAMState RAMState;

static RAMState *ram_state;

static NotifierWithReturnList precopy_notifier_list;

void precopy_infrastructure_init(void)
{
    notifier_with_return_list_init(&precopy_notifier_list);
}

void precopy_add_notifier(NotifierWithReturn *n)
{
    notifier_with_return_list_add(&precopy_notifier_list, n);
}

void precopy_remove_notifier(NotifierWithReturn *n)
{
    notifier_with_return_remove(n);
}

int precopy_notify(PrecopyNotifyReason reason, Error **errp)
{
    PrecopyNotifyData pnd;
    pnd.reason = reason;
    pnd.errp = errp;

    return notifier_with_return_list_notify(&precopy_notifier_list, &pnd);
}

void precopy_enable_free_page_optimization(void)
{
    if (!ram_state) {
        return;
    }

    ram_state->fpo_enabled = true;
}

uint64_t ram_bytes_remaining(void)
{
    return ram_state ? (ram_state->migration_dirty_pages * TARGET_PAGE_SIZE) :
                       0;
}

MigrationStats ram_counters;

/* used by the search for pages to send */
struct PageSearchStatus {
    /* Current block being searched */
    RAMBlock    *block;
    /* Current page to search from */
    unsigned long page;
    /* Set once we wrap around */
    bool         complete_round;
};
typedef struct PageSearchStatus PageSearchStatus;

CompressionStats compression_counters;

struct CompressParam {
    bool done;
    bool quit;
    bool zero_page;
    QEMUFile *file;
    QemuMutex mutex;
    QemuCond cond;
    RAMBlock *block;
    ram_addr_t offset;

    /* internally used fields */
    z_stream stream;
    uint8_t *originbuf;
};
typedef struct CompressParam CompressParam;

struct DecompressParam {
    bool done;
    bool quit;
    QemuMutex mutex;
    QemuCond cond;
    void *des;
    uint8_t *compbuf;
    int len;
    z_stream stream;
};
typedef struct DecompressParam DecompressParam;

static CompressParam *comp_param;
static QemuThread *compress_threads;
/* comp_done_cond is used to wake up the migration thread when
 * one of the compression threads has finished the compression.
 * comp_done_lock is used to co-work with comp_done_cond.
 */
static QemuMutex comp_done_lock;
static QemuCond comp_done_cond;
/* The empty QEMUFileOps will be used by file in CompressParam */
static const QEMUFileOps empty_ops = { };

static QEMUFile *decomp_file;
static DecompressParam *decomp_param;
static QemuThread *decompress_threads;
static QemuMutex decomp_done_lock;
static QemuCond decomp_done_cond;

static bool do_compress_ram_page(QEMUFile *f, z_stream *stream, RAMBlock *block,
                                 ram_addr_t offset, uint8_t *source_buf);

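/*
 * Worker body for each compression thread: wait until a (block, offset)
 * pair is handed over via its CompressParam, compress that page into
 * param->file, mark the job done and signal comp_done_cond, and loop
 * until param->quit is set.
 */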
static void *do_data_compress(void *opaque)
{
    CompressParam *param = opaque;
    RAMBlock *block;
    ram_addr_t offset;
    bool zero_page;

    qemu_mutex_lock(&param->mutex);
    while (!param->quit) {
        if (param->block) {
            block = param->block;
            offset = param->offset;
            param->block = NULL;
            qemu_mutex_unlock(&param->mutex);

            zero_page = do_compress_ram_page(param->file, &param->stream,
                                             block, offset, param->originbuf);

            qemu_mutex_lock(&comp_done_lock);
            param->done = true;
            param->zero_page = zero_page;
            qemu_cond_signal(&comp_done_cond);
            qemu_mutex_unlock(&comp_done_lock);

            qemu_mutex_lock(&param->mutex);
        } else {
            qemu_cond_wait(&param->cond, &param->mutex);
        }
    }
    qemu_mutex_unlock(&param->mutex);

    return NULL;
}

static void compress_threads_save_cleanup(void)
{
    int i, thread_count;

    if (!migrate_use_compression() || !comp_param) {
        return;
    }

    thread_count = migrate_compress_threads();
    for (i = 0; i < thread_count; i++) {
        /*
         * we use it as an indicator which shows if the thread is
         * properly init'd or not
         */
        if (!comp_param[i].file) {
            break;
        }

        qemu_mutex_lock(&comp_param[i].mutex);
        comp_param[i].quit = true;
        qemu_cond_signal(&comp_param[i].cond);
        qemu_mutex_unlock(&comp_param[i].mutex);

        qemu_thread_join(compress_threads + i);
        qemu_mutex_destroy(&comp_param[i].mutex);
        qemu_cond_destroy(&comp_param[i].cond);
        deflateEnd(&comp_param[i].stream);
        g_free(comp_param[i].originbuf);
        qemu_fclose(comp_param[i].file);
        comp_param[i].file = NULL;
    }
    qemu_mutex_destroy(&comp_done_lock);
    qemu_cond_destroy(&comp_done_cond);
    g_free(compress_threads);
    g_free(comp_param);
    compress_threads = NULL;
    comp_param = NULL;
}

static int compress_threads_save_setup(void)
{
    int i, thread_count;

    if (!migrate_use_compression()) {
        return 0;
    }
    thread_count = migrate_compress_threads();
    compress_threads = g_new0(QemuThread, thread_count);
    comp_param = g_new0(CompressParam, thread_count);
    qemu_cond_init(&comp_done_cond);
    qemu_mutex_init(&comp_done_lock);
    for (i = 0; i < thread_count; i++) {
        comp_param[i].originbuf = g_try_malloc(TARGET_PAGE_SIZE);
        if (!comp_param[i].originbuf) {
            goto exit;
        }

        if (deflateInit(&comp_param[i].stream,
                        migrate_compress_level()) != Z_OK) {
            g_free(comp_param[i].originbuf);
            goto exit;
        }

        /* comp_param[i].file is just used as a dummy buffer to save data,
         * set its ops to empty.
         */
        comp_param[i].file = qemu_fopen_ops(NULL, &empty_ops);
        comp_param[i].done = true;
        comp_param[i].quit = false;
        qemu_mutex_init(&comp_param[i].mutex);
        qemu_cond_init(&comp_param[i].cond);
        qemu_thread_create(compress_threads + i, "compress",
                           do_data_compress, comp_param + i,
                           QEMU_THREAD_JOINABLE);
    }
    return 0;

exit:
    compress_threads_save_cleanup();
    return -1;
}

/* Multiple fd's */

#define MULTIFD_MAGIC 0x11223344U
#define MULTIFD_VERSION 1

#define MULTIFD_FLAG_SYNC (1 << 0)

/* This value needs to be a multiple of qemu_target_page_size() */
#define MULTIFD_PACKET_SIZE (512 * 1024)

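/*
 * Initial handshake message, sent exactly once on every multifd channel
 * right after it connects; it lets the destination check magic, version,
 * source UUID and channel id before any data packets flow.
 */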
typedef struct {
    uint32_t magic;
    uint32_t version;
    unsigned char uuid[16]; /* QemuUUID */
    uint8_t id;
    uint8_t unused1[7];     /* Reserved for future use */
    uint64_t unused2[4];    /* Reserved for future use */
} __attribute__((packed)) MultiFDInit_t;

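/*
 * On-wire header of every multifd data packet.  Multi-byte fields are
 * stored in big endian (see multifd_send_fill_packet() and
 * multifd_recv_unfill_packet()); the page data itself follows in a
 * separate write of next_packet_size bytes.
 */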
typedef struct {
    uint32_t magic;
    uint32_t version;
    uint32_t flags;
    /* maximum number of allocated pages */
    uint32_t pages_alloc;
    uint32_t pages_used;
    /* size of the next packet that contains pages */
    uint32_t next_packet_size;
    uint64_t packet_num;
    uint64_t unused[4];    /* Reserved for future use */
    char ramblock[256];
    uint64_t offset[];
} __attribute__((packed)) MultiFDPacket_t;

typedef struct {
    /* number of used pages */
    uint32_t used;
    /* number of allocated pages */
    uint32_t allocated;
    /* global number of generated multifd packets */
    uint64_t packet_num;
    /* offset of each page */
    ram_addr_t *offset;
    /* pointer to each page */
    struct iovec *iov;
    RAMBlock *block;
} MultiFDPages_t;

typedef struct {
    /* these fields are not changed once the thread is created */
    /* channel number */
    uint8_t id;
    /* channel thread name */
    char *name;
    /* channel thread id */
    QemuThread thread;
    /* communication channel */
    QIOChannel *c;
    /* sem where to wait for more work */
    QemuSemaphore sem;
    /* this mutex protects the following parameters */
    QemuMutex mutex;
    /* is this channel thread running */
    bool running;
    /* should this thread finish */
    bool quit;
    /* thread has work to do */
    int pending_job;
    /* array of pages to be sent */
    MultiFDPages_t *pages;
    /* packet allocated len */
    uint32_t packet_len;
    /* pointer to the packet */
    MultiFDPacket_t *packet;
    /* multifd flags for each packet */
    uint32_t flags;
    /* size of the next packet that contains pages */
    uint32_t next_packet_size;
    /* global number of generated multifd packets */
    uint64_t packet_num;
    /* thread local variables */
    /* packets sent through this channel */
    uint64_t num_packets;
    /* pages sent through this channel */
    uint64_t num_pages;
} MultiFDSendParams;

typedef struct {
    /* these fields are not changed once the thread is created */
    /* channel number */
    uint8_t id;
    /* channel thread name */
    char *name;
    /* channel thread id */
    QemuThread thread;
    /* communication channel */
    QIOChannel *c;
    /* this mutex protects the following parameters */
    QemuMutex mutex;
    /* is this channel thread running */
    bool running;
    /* array of pages to receive */
    MultiFDPages_t *pages;
    /* packet allocated len */
    uint32_t packet_len;
    /* pointer to the packet */
    MultiFDPacket_t *packet;
    /* multifd flags for each packet */
    uint32_t flags;
    /* global number of generated multifd packets */
    uint64_t packet_num;
    /* thread local variables */
    /* size of the next packet that contains pages */
    uint32_t next_packet_size;
    /* packets sent through this channel */
    uint64_t num_packets;
    /* pages sent through this channel */
    uint64_t num_pages;
    /* syncs main thread and channels */
    QemuSemaphore sem_sync;
} MultiFDRecvParams;

static int multifd_send_initial_packet(MultiFDSendParams *p, Error **errp)
{
    MultiFDInit_t msg;
    int ret;

    msg.magic = cpu_to_be32(MULTIFD_MAGIC);
    msg.version = cpu_to_be32(MULTIFD_VERSION);
    msg.id = p->id;
    memcpy(msg.uuid, &qemu_uuid.data, sizeof(msg.uuid));

    ret = qio_channel_write_all(p->c, (char *)&msg, sizeof(msg), errp);
    if (ret != 0) {
        return -1;
    }
    return 0;
}

static int multifd_recv_initial_packet(QIOChannel *c, Error **errp)
{
    MultiFDInit_t msg;
    int ret;

    ret = qio_channel_read_all(c, (char *)&msg, sizeof(msg), errp);
    if (ret != 0) {
        return -1;
    }

    msg.magic = be32_to_cpu(msg.magic);
    msg.version = be32_to_cpu(msg.version);

    if (msg.magic != MULTIFD_MAGIC) {
        error_setg(errp, "multifd: received packet magic %x "
                   "expected %x", msg.magic, MULTIFD_MAGIC);
        return -1;
    }

    if (msg.version != MULTIFD_VERSION) {
        error_setg(errp, "multifd: received packet version %d "
                   "expected %d", msg.version, MULTIFD_VERSION);
        return -1;
    }

    if (memcmp(msg.uuid, &qemu_uuid, sizeof(qemu_uuid))) {
        char *uuid = qemu_uuid_unparse_strdup(&qemu_uuid);
        char *msg_uuid = qemu_uuid_unparse_strdup((const QemuUUID *)msg.uuid);

        error_setg(errp, "multifd: received uuid '%s' and expected "
                   "uuid '%s' for channel %hhd", msg_uuid, uuid, msg.id);
        g_free(uuid);
        g_free(msg_uuid);
        return -1;
    }

    if (msg.id > migrate_multifd_channels()) {
        error_setg(errp, "multifd: received channel id %d "
                   "expected a maximum of %d", msg.id,
                   migrate_multifd_channels());
        return -1;
    }

    return msg.id;
}

static MultiFDPages_t *multifd_pages_init(size_t size)
{
    MultiFDPages_t *pages = g_new0(MultiFDPages_t, 1);

    pages->allocated = size;
    pages->iov = g_new0(struct iovec, size);
    pages->offset = g_new0(ram_addr_t, size);

    return pages;
}

static void multifd_pages_clear(MultiFDPages_t *pages)
{
    pages->used = 0;
    pages->allocated = 0;
    pages->packet_num = 0;
    pages->block = NULL;
    g_free(pages->iov);
    pages->iov = NULL;
    g_free(pages->offset);
    pages->offset = NULL;
    g_free(pages);
}

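/*
 * Fill p->packet from p->pages, converting every header field to big
 * endian so the packet can be written to the channel as-is.
 */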
static void multifd_send_fill_packet(MultiFDSendParams *p)
{
    MultiFDPacket_t *packet = p->packet;
    uint32_t page_max = MULTIFD_PACKET_SIZE / qemu_target_page_size();
    int i;

    packet->magic = cpu_to_be32(MULTIFD_MAGIC);
    packet->version = cpu_to_be32(MULTIFD_VERSION);
    packet->flags = cpu_to_be32(p->flags);
    packet->pages_alloc = cpu_to_be32(page_max);
    packet->pages_used = cpu_to_be32(p->pages->used);
    packet->next_packet_size = cpu_to_be32(p->next_packet_size);
    packet->packet_num = cpu_to_be64(p->packet_num);

    if (p->pages->block) {
        strncpy(packet->ramblock, p->pages->block->idstr, 256);
    }

    for (i = 0; i < p->pages->used; i++) {
        packet->offset[i] = cpu_to_be64(p->pages->offset[i]);
    }
}

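/*
 * Validate a received packet header (magic, version, page counts) and
 * set up p->pages->iov so the page data that follows can be read
 * straight into guest RAM.  Returns 0 on success, or -1 and sets @errp
 * on any malformed field.
 */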
static int multifd_recv_unfill_packet(MultiFDRecvParams *p, Error **errp)
{
    MultiFDPacket_t *packet = p->packet;
    uint32_t pages_max = MULTIFD_PACKET_SIZE / qemu_target_page_size();
    RAMBlock *block;
    int i;

    packet->magic = be32_to_cpu(packet->magic);
    if (packet->magic != MULTIFD_MAGIC) {
        error_setg(errp, "multifd: received packet "
                   "magic %x and expected magic %x",
                   packet->magic, MULTIFD_MAGIC);
        return -1;
    }

    packet->version = be32_to_cpu(packet->version);
    if (packet->version != MULTIFD_VERSION) {
        error_setg(errp, "multifd: received packet "
                   "version %d and expected version %d",
                   packet->version, MULTIFD_VERSION);
        return -1;
    }

    p->flags = be32_to_cpu(packet->flags);

    packet->pages_alloc = be32_to_cpu(packet->pages_alloc);
    /*
     * If we received a packet that is 100 times bigger than expected
     * just stop migration.  It is a magic number.
     */
    if (packet->pages_alloc > pages_max * 100) {
        error_setg(errp, "multifd: received packet "
                   "with size %d and expected a maximum size of %d",
                   packet->pages_alloc, pages_max * 100);
        return -1;
    }
    /*
     * We received a packet that is bigger than expected but inside
     * reasonable limits (see previous comment).  Just reallocate.
     */
    if (packet->pages_alloc > p->pages->allocated) {
        multifd_pages_clear(p->pages);
        p->pages = multifd_pages_init(packet->pages_alloc);
    }

    p->pages->used = be32_to_cpu(packet->pages_used);
    if (p->pages->used > packet->pages_alloc) {
        error_setg(errp, "multifd: received packet "
                   "with %d pages and expected maximum pages are %d",
                   p->pages->used, packet->pages_alloc);
        return -1;
    }

    p->next_packet_size = be32_to_cpu(packet->next_packet_size);
    p->packet_num = be64_to_cpu(packet->packet_num);

    if (p->pages->used) {
        /* make sure that ramblock is 0 terminated */
        packet->ramblock[255] = 0;
        block = qemu_ram_block_by_name(packet->ramblock);
        if (!block) {
            error_setg(errp, "multifd: unknown ram block %s",
                       packet->ramblock);
            return -1;
        }
    }

    for (i = 0; i < p->pages->used; i++) {
        ram_addr_t offset = be64_to_cpu(packet->offset[i]);

        if (offset > (block->used_length - TARGET_PAGE_SIZE)) {
            error_setg(errp, "multifd: offset too long " RAM_ADDR_FMT
                       " (max " RAM_ADDR_FMT ")",
                       offset, block->max_length);
            return -1;
        }
        p->pages->iov[i].iov_base = block->host + offset;
        p->pages->iov[i].iov_len = TARGET_PAGE_SIZE;
    }

    return 0;
}

struct {
    MultiFDSendParams *params;
    /* array of pages to be sent */
    MultiFDPages_t *pages;
    /* syncs main thread and channels */
    QemuSemaphore sem_sync;
    /* global number of generated multifd packets */
    uint64_t packet_num;
    /* send channels ready */
    QemuSemaphore channels_ready;
} *multifd_send_state;

/*
 * How we use multifd_send_state->pages and channel->pages?
 *
 * We create a pages array for each channel, and a main one.  Each time
 * that we need to send a batch of pages we interchange the ones between
 * multifd_send_state and the channel that is sending it.  There are
 * two reasons for that:
 *    - to not have to do so many mallocs during migration
 *    - to make it easier to know what to free at the end of migration
 *
 * This way we always know who is the owner of each "pages" struct,
 * and we don't need any locking.  It belongs to the migration thread
 * or to the channel thread.  Switching is safe because the migration
 * thread is using the channel mutex when changing it, and the channel
 * has to have finished with its own, otherwise pending_job can't be
 * false.
 */

static void multifd_send_pages(void)
{
    int i;
    static int next_channel;
    MultiFDSendParams *p = NULL; /* make happy gcc */
    MultiFDPages_t *pages = multifd_send_state->pages;
    uint64_t transferred;

    qemu_sem_wait(&multifd_send_state->channels_ready);
    for (i = next_channel;; i = (i + 1) % migrate_multifd_channels()) {
        p = &multifd_send_state->params[i];

        qemu_mutex_lock(&p->mutex);
        if (!p->pending_job) {
            p->pending_job++;
            next_channel = (i + 1) % migrate_multifd_channels();
            break;
        }
        qemu_mutex_unlock(&p->mutex);
    }
    p->pages->used = 0;

    p->packet_num = multifd_send_state->packet_num++;
    p->pages->block = NULL;
    multifd_send_state->pages = p->pages;
    p->pages = pages;
    transferred = ((uint64_t) pages->used) * TARGET_PAGE_SIZE + p->packet_len;
    ram_counters.multifd_bytes += transferred;
    ram_counters.transferred += transferred;
    qemu_mutex_unlock(&p->mutex);
    qemu_sem_post(&p->sem);
}

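/*
 * Queue one page for multifd sending.  Pages are batched per RAMBlock;
 * the batch is flushed either when it is full or when a page from a
 * different block arrives (in which case the page is re-queued against
 * the new, empty batch).
 */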
static void multifd_queue_page(RAMBlock *block, ram_addr_t offset)
{
    MultiFDPages_t *pages = multifd_send_state->pages;

    if (!pages->block) {
        pages->block = block;
    }

    if (pages->block == block) {
        pages->offset[pages->used] = offset;
        pages->iov[pages->used].iov_base = block->host + offset;
        pages->iov[pages->used].iov_len = TARGET_PAGE_SIZE;
        pages->used++;

        if (pages->used < pages->allocated) {
            return;
        }
    }

    multifd_send_pages();

    if (pages->block != block) {
        multifd_queue_page(block, offset);
    }
}

static void multifd_send_terminate_threads(Error *err)
{
    int i;

    if (err) {
        MigrationState *s = migrate_get_current();
        migrate_set_error(s, err);
        if (s->state == MIGRATION_STATUS_SETUP ||
            s->state == MIGRATION_STATUS_PRE_SWITCHOVER ||
            s->state == MIGRATION_STATUS_DEVICE ||
            s->state == MIGRATION_STATUS_ACTIVE) {
            migrate_set_state(&s->state, s->state,
                              MIGRATION_STATUS_FAILED);
        }
    }

    for (i = 0; i < migrate_multifd_channels(); i++) {
        MultiFDSendParams *p = &multifd_send_state->params[i];

        qemu_mutex_lock(&p->mutex);
        p->quit = true;
        qemu_sem_post(&p->sem);
        qemu_mutex_unlock(&p->mutex);
    }
}

void multifd_save_cleanup(void)
{
    int i;

    if (!migrate_use_multifd()) {
        return;
    }
    multifd_send_terminate_threads(NULL);
    for (i = 0; i < migrate_multifd_channels(); i++) {
        MultiFDSendParams *p = &multifd_send_state->params[i];

        if (p->running) {
            qemu_thread_join(&p->thread);
        }
        socket_send_channel_destroy(p->c);
        p->c = NULL;
        qemu_mutex_destroy(&p->mutex);
        qemu_sem_destroy(&p->sem);
        g_free(p->name);
        p->name = NULL;
        multifd_pages_clear(p->pages);
        p->pages = NULL;
        p->packet_len = 0;
        g_free(p->packet);
        p->packet = NULL;
    }
    qemu_sem_destroy(&multifd_send_state->channels_ready);
    qemu_sem_destroy(&multifd_send_state->sem_sync);
    g_free(multifd_send_state->params);
    multifd_send_state->params = NULL;
    multifd_pages_clear(multifd_send_state->pages);
    multifd_send_state->pages = NULL;
    g_free(multifd_send_state);
    multifd_send_state = NULL;
}

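/*
 * Synchronization point between the migration thread and the send
 * channels: flush any partially filled batch, ask every channel to emit
 * a MULTIFD_FLAG_SYNC packet, then wait until each of them has done so.
 */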
static void multifd_send_sync_main(void)
{
    int i;

    if (!migrate_use_multifd()) {
        return;
    }
    if (multifd_send_state->pages->used) {
        multifd_send_pages();
    }
    for (i = 0; i < migrate_multifd_channels(); i++) {
        MultiFDSendParams *p = &multifd_send_state->params[i];

        trace_multifd_send_sync_main_signal(p->id);

        qemu_mutex_lock(&p->mutex);

        p->packet_num = multifd_send_state->packet_num++;
        p->flags |= MULTIFD_FLAG_SYNC;
        p->pending_job++;
        qemu_mutex_unlock(&p->mutex);
        qemu_sem_post(&p->sem);
    }
    for (i = 0; i < migrate_multifd_channels(); i++) {
        MultiFDSendParams *p = &multifd_send_state->params[i];

        trace_multifd_send_sync_main_wait(p->id);
        qemu_sem_wait(&multifd_send_state->sem_sync);
    }
    trace_multifd_send_sync_main(multifd_send_state->packet_num);
}

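/*
 * Per-channel send thread: after the initial handshake packet, loop
 * waiting on p->sem for work, write the packet header followed by the
 * page data, and post channels_ready (plus sem_sync for SYNC packets)
 * once each job completes.
 */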
static void *multifd_send_thread(void *opaque)
{
    MultiFDSendParams *p = opaque;
    Error *local_err = NULL;
    int ret;

    trace_multifd_send_thread_start(p->id);
    rcu_register_thread();

    if (multifd_send_initial_packet(p, &local_err) < 0) {
        goto out;
    }
    /* initial packet */
    p->num_packets = 1;

    while (true) {
        qemu_sem_wait(&p->sem);
        qemu_mutex_lock(&p->mutex);

        if (p->pending_job) {
            uint32_t used = p->pages->used;
            uint64_t packet_num = p->packet_num;
            uint32_t flags = p->flags;

            p->next_packet_size = used * qemu_target_page_size();
            multifd_send_fill_packet(p);
            p->flags = 0;
            p->num_packets++;
            p->num_pages += used;
            p->pages->used = 0;
            qemu_mutex_unlock(&p->mutex);

            trace_multifd_send(p->id, packet_num, used, flags,
                               p->next_packet_size);

            ret = qio_channel_write_all(p->c, (void *)p->packet,
                                        p->packet_len, &local_err);
            if (ret != 0) {
                break;
            }

            if (used) {
                ret = qio_channel_writev_all(p->c, p->pages->iov,
                                             used, &local_err);
                if (ret != 0) {
                    break;
                }
            }

            qemu_mutex_lock(&p->mutex);
            p->pending_job--;
            qemu_mutex_unlock(&p->mutex);

            if (flags & MULTIFD_FLAG_SYNC) {
                qemu_sem_post(&multifd_send_state->sem_sync);
            }
            qemu_sem_post(&multifd_send_state->channels_ready);
        } else if (p->quit) {
            qemu_mutex_unlock(&p->mutex);
            break;
        } else {
            qemu_mutex_unlock(&p->mutex);
            /* sometimes there are spurious wakeups */
        }
    }

out:
    if (local_err) {
        multifd_send_terminate_threads(local_err);
    }

    qemu_mutex_lock(&p->mutex);
    p->running = false;
    qemu_mutex_unlock(&p->mutex);

    rcu_unregister_thread();
    trace_multifd_send_thread_end(p->id, p->num_packets, p->num_pages);

    return NULL;
}

static void multifd_new_send_channel_async(QIOTask *task, gpointer opaque)
{
    MultiFDSendParams *p = opaque;
    QIOChannel *sioc = QIO_CHANNEL(qio_task_get_source(task));
    Error *local_err = NULL;

    if (qio_task_propagate_error(task, &local_err)) {
        migrate_set_error(migrate_get_current(), local_err);
        multifd_save_cleanup();
    } else {
        p->c = QIO_CHANNEL(sioc);
        qio_channel_set_delay(p->c, false);
        p->running = true;
        qemu_thread_create(&p->thread, p->name, multifd_send_thread, p,
                           QEMU_THREAD_JOINABLE);
    }
}

int multifd_save_setup(void)
{
    int thread_count;
    uint32_t page_count = MULTIFD_PACKET_SIZE / qemu_target_page_size();
    uint8_t i;

    if (!migrate_use_multifd()) {
        return 0;
    }
    thread_count = migrate_multifd_channels();
    multifd_send_state = g_malloc0(sizeof(*multifd_send_state));
    multifd_send_state->params = g_new0(MultiFDSendParams, thread_count);
    multifd_send_state->pages = multifd_pages_init(page_count);
    qemu_sem_init(&multifd_send_state->sem_sync, 0);
    qemu_sem_init(&multifd_send_state->channels_ready, 0);

    for (i = 0; i < thread_count; i++) {
        MultiFDSendParams *p = &multifd_send_state->params[i];

        qemu_mutex_init(&p->mutex);
        qemu_sem_init(&p->sem, 0);
        p->quit = false;
        p->pending_job = 0;
        p->id = i;
        p->pages = multifd_pages_init(page_count);
        p->packet_len = sizeof(MultiFDPacket_t)
                      + sizeof(ram_addr_t) * page_count;
        p->packet = g_malloc0(p->packet_len);
        p->name = g_strdup_printf("multifdsend_%d", i);
        socket_send_channel_create(multifd_new_send_channel_async, p);
    }
    return 0;
}

struct {
    MultiFDRecvParams *params;
    /* number of created threads */
    int count;
    /* syncs main thread and channels */
    QemuSemaphore sem_sync;
    /* global number of generated multifd packets */
    uint64_t packet_num;
} *multifd_recv_state;

static void multifd_recv_terminate_threads(Error *err)
{
    int i;

    if (err) {
        MigrationState *s = migrate_get_current();
        migrate_set_error(s, err);
        if (s->state == MIGRATION_STATUS_SETUP ||
            s->state == MIGRATION_STATUS_ACTIVE) {
            migrate_set_state(&s->state, s->state,
                              MIGRATION_STATUS_FAILED);
        }
    }

    for (i = 0; i < migrate_multifd_channels(); i++) {
        MultiFDRecvParams *p = &multifd_recv_state->params[i];

        qemu_mutex_lock(&p->mutex);
        /* We could arrive here for two reasons:
           - normal quit, i.e. everything went fine, just finished
           - error quit: We close the channels so the channel threads
             finish the qio_channel_read_all_eof() */
        qio_channel_shutdown(p->c, QIO_CHANNEL_SHUTDOWN_BOTH, NULL);
        qemu_mutex_unlock(&p->mutex);
    }
}

int multifd_load_cleanup(Error **errp)
{
    int i;
    int ret = 0;

    if (!migrate_use_multifd()) {
        return 0;
    }
    multifd_recv_terminate_threads(NULL);
    for (i = 0; i < migrate_multifd_channels(); i++) {
        MultiFDRecvParams *p = &multifd_recv_state->params[i];

        if (p->running) {
            qemu_thread_join(&p->thread);
        }
        object_unref(OBJECT(p->c));
        p->c = NULL;
        qemu_mutex_destroy(&p->mutex);
        qemu_sem_destroy(&p->sem_sync);
        g_free(p->name);
        p->name = NULL;
        multifd_pages_clear(p->pages);
        p->pages = NULL;
        p->packet_len = 0;
        g_free(p->packet);
        p->packet = NULL;
    }
    qemu_sem_destroy(&multifd_recv_state->sem_sync);
    g_free(multifd_recv_state->params);
    multifd_recv_state->params = NULL;
    g_free(multifd_recv_state);
    multifd_recv_state = NULL;

    return ret;
}

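/*
 * Synchronization point on the destination: wait until every receive
 * channel has reached its MULTIFD_FLAG_SYNC packet, record the highest
 * packet number seen, then release all the channel threads again.
 */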
static void multifd_recv_sync_main(void)
{
    int i;

    if (!migrate_use_multifd()) {
        return;
    }
    for (i = 0; i < migrate_multifd_channels(); i++) {
        MultiFDRecvParams *p = &multifd_recv_state->params[i];

        trace_multifd_recv_sync_main_wait(p->id);
        qemu_sem_wait(&multifd_recv_state->sem_sync);
        qemu_mutex_lock(&p->mutex);
        if (multifd_recv_state->packet_num < p->packet_num) {
            multifd_recv_state->packet_num = p->packet_num;
        }
        qemu_mutex_unlock(&p->mutex);
    }
    for (i = 0; i < migrate_multifd_channels(); i++) {
        MultiFDRecvParams *p = &multifd_recv_state->params[i];

        trace_multifd_recv_sync_main_signal(p->id);
        qemu_sem_post(&p->sem_sync);
    }
    trace_multifd_recv_sync_main(multifd_recv_state->packet_num);
}

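/*
 * Per-channel receive thread: read a packet header, unfill and validate
 * it, read the page data straight into guest memory, and coordinate
 * with multifd_recv_sync_main() whenever a SYNC packet is seen, until
 * EOF or error.
 */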
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001309static void *multifd_recv_thread(void *opaque)
1310{
1311 MultiFDRecvParams *p = opaque;
Juan Quintela2a26c972018-04-04 11:26:58 +02001312 Error *local_err = NULL;
1313 int ret;
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001314
Juan Quintela408ea6a2018-04-06 18:28:59 +02001315 trace_multifd_recv_thread_start(p->id);
Lidong Chen74637e62018-08-06 21:29:29 +08001316 rcu_register_thread();
Juan Quintela408ea6a2018-04-06 18:28:59 +02001317
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001318 while (true) {
Juan Quintela6df264a2018-02-28 09:10:07 +01001319 uint32_t used;
1320 uint32_t flags;
1321
Juan Quintela8b2db7f2018-04-11 12:36:13 +02001322 ret = qio_channel_read_all_eof(p->c, (void *)p->packet,
1323 p->packet_len, &local_err);
1324 if (ret == 0) { /* EOF */
1325 break;
1326 }
1327 if (ret == -1) { /* Error */
1328 break;
1329 }
Juan Quintela6df264a2018-02-28 09:10:07 +01001330
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001331 qemu_mutex_lock(&p->mutex);
Juan Quintela6df264a2018-02-28 09:10:07 +01001332 ret = multifd_recv_unfill_packet(p, &local_err);
1333 if (ret) {
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001334 qemu_mutex_unlock(&p->mutex);
1335 break;
1336 }
Juan Quintela6df264a2018-02-28 09:10:07 +01001337
1338 used = p->pages->used;
1339 flags = p->flags;
Juan Quintela2a34ee52019-01-04 19:45:39 +01001340 trace_multifd_recv(p->id, p->packet_num, used, flags,
1341 p->next_packet_size);
Juan Quintela6df264a2018-02-28 09:10:07 +01001342 p->num_packets++;
1343 p->num_pages += used;
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001344 qemu_mutex_unlock(&p->mutex);
Juan Quintela6df264a2018-02-28 09:10:07 +01001345
Juan Quintelaad24c7c2019-01-04 19:12:35 +01001346 if (used) {
1347 ret = qio_channel_readv_all(p->c, p->pages->iov,
1348 used, &local_err);
1349 if (ret != 0) {
1350 break;
1351 }
Juan Quintela8b2db7f2018-04-11 12:36:13 +02001352 }
1353
Juan Quintela6df264a2018-02-28 09:10:07 +01001354 if (flags & MULTIFD_FLAG_SYNC) {
1355 qemu_sem_post(&multifd_recv_state->sem_sync);
1356 qemu_sem_wait(&p->sem_sync);
1357 }
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001358 }
1359
Juan Quintelad82628e2018-04-11 02:44:24 +02001360 if (local_err) {
1361 multifd_recv_terminate_threads(local_err);
1362 }
Juan Quintela66770702018-02-19 19:01:45 +01001363 qemu_mutex_lock(&p->mutex);
1364 p->running = false;
1365 qemu_mutex_unlock(&p->mutex);
1366
Lidong Chen74637e62018-08-06 21:29:29 +08001367 rcu_unregister_thread();
Juan Quintela408ea6a2018-04-06 18:28:59 +02001368 trace_multifd_recv_thread_end(p->id, p->num_packets, p->num_pages);
1369
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001370 return NULL;
1371}
1372
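/*
 * multifd_load_setup: allocate the multifd receive state
 *
 * Sets up multifd_recv_state and one MultiFDRecvParams per channel:
 * mutex, sync semaphore, pages array and a packet buffer large enough
 * for a packet header plus one address per page. The receive threads
 * themselves are started later, from multifd_recv_new_channel().
 */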
1373int multifd_load_setup(void)
1374{
1375 int thread_count;
Juan Quintelaefd1a1d2019-02-20 12:06:03 +01001376 uint32_t page_count = MULTIFD_PACKET_SIZE / qemu_target_page_size();
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001377 uint8_t i;
1378
1379 if (!migrate_use_multifd()) {
1380 return 0;
1381 }
1382 thread_count = migrate_multifd_channels();
1383 multifd_recv_state = g_malloc0(sizeof(*multifd_recv_state));
1384 multifd_recv_state->params = g_new0(MultiFDRecvParams, thread_count);
Juan Quintela66770702018-02-19 19:01:45 +01001385 atomic_set(&multifd_recv_state->count, 0);
Juan Quintela6df264a2018-02-28 09:10:07 +01001386 qemu_sem_init(&multifd_recv_state->sem_sync, 0);
Juan Quintela34c55a92018-04-10 23:35:15 +02001387
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001388 for (i = 0; i < thread_count; i++) {
1389 MultiFDRecvParams *p = &multifd_recv_state->params[i];
1390
1391 qemu_mutex_init(&p->mutex);
Juan Quintela6df264a2018-02-28 09:10:07 +01001392 qemu_sem_init(&p->sem_sync, 0);
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001393 p->id = i;
Juan Quintela34c55a92018-04-10 23:35:15 +02001394 p->pages = multifd_pages_init(page_count);
Juan Quintela2a26c972018-04-04 11:26:58 +02001395 p->packet_len = sizeof(MultiFDPacket_t)
1396 + sizeof(ram_addr_t) * page_count;
1397 p->packet = g_malloc0(p->packet_len);
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001398 p->name = g_strdup_printf("multifdrecv_%d", i);
Juan Quintelaf986c3d2016-01-14 16:52:55 +01001399 }
1400 return 0;
1401}
1402
Juan Quintela62c1e0c2018-02-19 18:59:02 +01001403bool multifd_recv_all_channels_created(void)
1404{
1405 int thread_count = migrate_multifd_channels();
1406
1407 if (!migrate_use_multifd()) {
1408 return true;
1409 }
1410
1411 return thread_count == atomic_read(&multifd_recv_state->count);
1412}
1413
Fei Li49ed0d22019-01-13 22:08:46 +08001414/*
1415 * Try to receive all multifd channels to get ready for the migration.
1416 * - Return true and do not set @errp when correctly receiving all channels;
1417 * - Return false and do not set @errp when correctly receiving the current one;
1418 * - Return false and set @errp when failing to receive the current channel.
1419 */
1420bool multifd_recv_new_channel(QIOChannel *ioc, Error **errp)
Juan Quintela71bb07d2018-02-19 19:01:03 +01001421{
Juan Quintela60df2d42018-03-07 07:56:15 +01001422 MultiFDRecvParams *p;
Juan Quintelaaf8b7d22018-04-06 19:32:12 +02001423 Error *local_err = NULL;
1424 int id;
Juan Quintela60df2d42018-03-07 07:56:15 +01001425
Juan Quintelaaf8b7d22018-04-06 19:32:12 +02001426 id = multifd_recv_initial_packet(ioc, &local_err);
1427 if (id < 0) {
1428 multifd_recv_terminate_threads(local_err);
Fei Li49ed0d22019-01-13 22:08:46 +08001429 error_propagate_prepend(errp, local_err,
1430 "failed to receive packet"
1431 " via multifd channel %d: ",
1432 atomic_read(&multifd_recv_state->count));
Peter Xu81e62052018-06-27 21:22:44 +08001433 return false;
Juan Quintelaaf8b7d22018-04-06 19:32:12 +02001434 }
1435
1436 p = &multifd_recv_state->params[id];
1437 if (p->c != NULL) {
1438 error_setg(&local_err, "multifd: received id '%d' already setup'",
1439 id);
1440 multifd_recv_terminate_threads(local_err);
Fei Li49ed0d22019-01-13 22:08:46 +08001441 error_propagate(errp, local_err);
Peter Xu81e62052018-06-27 21:22:44 +08001442 return false;
Juan Quintelaaf8b7d22018-04-06 19:32:12 +02001443 }
Juan Quintela60df2d42018-03-07 07:56:15 +01001444 p->c = ioc;
1445 object_ref(OBJECT(ioc));
Juan Quintela408ea6a2018-04-06 18:28:59 +02001446 /* initial packet */
1447 p->num_packets = 1;
Juan Quintela60df2d42018-03-07 07:56:15 +01001448
1449 p->running = true;
1450 qemu_thread_create(&p->thread, p->name, multifd_recv_thread, p,
1451 QEMU_THREAD_JOINABLE);
1452 atomic_inc(&multifd_recv_state->count);
Fei Li49ed0d22019-01-13 22:08:46 +08001453 return atomic_read(&multifd_recv_state->count) ==
1454 migrate_multifd_channels();
Juan Quintela71bb07d2018-02-19 19:01:03 +01001455}
1456
Juan Quintela56e93d22015-05-07 19:33:31 +02001457/**
Juan Quintela3d0684b2017-03-23 15:06:39 +01001458 * save_page_header: write page header to wire
Juan Quintela56e93d22015-05-07 19:33:31 +02001459 *
1460 * If this is the 1st block, it also writes the block identification
1461 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01001462 * Returns the number of bytes written
Juan Quintela56e93d22015-05-07 19:33:31 +02001463 *
1464 * @f: QEMUFile where to send the data
1465 * @block: block that contains the page we want to send
1466 * @offset: offset inside the block for the page
1467 * in the lower bits, it contains flags
1468 */
Juan Quintela2bf3aa82017-05-10 13:28:13 +02001469static size_t save_page_header(RAMState *rs, QEMUFile *f, RAMBlock *block,
1470 ram_addr_t offset)
Juan Quintela56e93d22015-05-07 19:33:31 +02001471{
Liang Li9f5f3802015-07-13 17:34:10 +08001472 size_t size, len;
Juan Quintela56e93d22015-05-07 19:33:31 +02001473
Juan Quintela24795692017-03-21 11:45:01 +01001474 if (block == rs->last_sent_block) {
1475 offset |= RAM_SAVE_FLAG_CONTINUE;
1476 }
Juan Quintela2bf3aa82017-05-10 13:28:13 +02001477 qemu_put_be64(f, offset);
Juan Quintela56e93d22015-05-07 19:33:31 +02001478 size = 8;
1479
1480 if (!(offset & RAM_SAVE_FLAG_CONTINUE)) {
Liang Li9f5f3802015-07-13 17:34:10 +08001481 len = strlen(block->idstr);
Juan Quintela2bf3aa82017-05-10 13:28:13 +02001482 qemu_put_byte(f, len);
1483 qemu_put_buffer(f, (uint8_t *)block->idstr, len);
Liang Li9f5f3802015-07-13 17:34:10 +08001484 size += 1 + len;
Juan Quintela24795692017-03-21 11:45:01 +01001485 rs->last_sent_block = block;
Juan Quintela56e93d22015-05-07 19:33:31 +02001486 }
1487 return size;
1488}
1489
Juan Quintela3d0684b2017-03-23 15:06:39 +01001490/**
1491 * mig_throttle_guest_down: throttle down the guest
1492 *
1493 * Reduce amount of guest cpu execution to hopefully slow down memory
1494 * writes. If guest dirty memory rate is reduced below the rate at
1495 * which we can transfer pages to the destination then we should be
1496 * able to complete migration. Some workloads dirty memory way too
1497 * fast and will not effectively converge, even with auto-converge.
Jason J. Herne070afca2015-09-08 13:12:35 -04001498 */
1499static void mig_throttle_guest_down(void)
1500{
1501 MigrationState *s = migrate_get_current();
Daniel P. Berrange2594f562016-04-27 11:05:14 +01001502 uint64_t pct_initial = s->parameters.cpu_throttle_initial;
1503 uint64_t pct_icrement = s->parameters.cpu_throttle_increment;
Li Qiang4cbc9c72018-08-01 06:00:20 -07001504 int pct_max = s->parameters.max_cpu_throttle;
Jason J. Herne070afca2015-09-08 13:12:35 -04001505
1506 /* We have not started throttling yet. Let's start it. */
1507 if (!cpu_throttle_active()) {
1508 cpu_throttle_set(pct_initial);
1509 } else {
1510 /* Throttling already on, just increase the rate */
Li Qiang4cbc9c72018-08-01 06:00:20 -07001511 cpu_throttle_set(MIN(cpu_throttle_get_percentage() + pct_icrement,
1512 pct_max));
Jason J. Herne070afca2015-09-08 13:12:35 -04001513 }
1514}
1515
Juan Quintela3d0684b2017-03-23 15:06:39 +01001516/**
1517 * xbzrle_cache_zero_page: insert a zero page in the XBZRLE cache
1518 *
Juan Quintela6f37bb82017-03-13 19:26:29 +01001519 * @rs: current RAM state
Juan Quintela3d0684b2017-03-23 15:06:39 +01001520 * @current_addr: address for the zero page
1521 *
1522 * Update the xbzrle cache to reflect a page that's been sent as all 0.
Juan Quintela56e93d22015-05-07 19:33:31 +02001523 * The important thing is that a stale (not-yet-0'd) page be replaced
1524 * by the new data.
1525 * As a bonus, if the page wasn't in the cache it gets added so that
Juan Quintela3d0684b2017-03-23 15:06:39 +01001526 * when a small write is made into the 0'd page it gets XBZRLE sent.
Juan Quintela56e93d22015-05-07 19:33:31 +02001527 */
Juan Quintela6f37bb82017-03-13 19:26:29 +01001528static void xbzrle_cache_zero_page(RAMState *rs, ram_addr_t current_addr)
Juan Quintela56e93d22015-05-07 19:33:31 +02001529{
Juan Quintela6f37bb82017-03-13 19:26:29 +01001530 if (rs->ram_bulk_stage || !migrate_use_xbzrle()) {
Juan Quintela56e93d22015-05-07 19:33:31 +02001531 return;
1532 }
1533
1534 /* We don't care if this fails to allocate a new cache page
1535 * as long as it updates an old one */
Juan Quintelac00e0922017-05-09 16:22:01 +02001536 cache_insert(XBZRLE.cache, current_addr, XBZRLE.zero_target_page,
Juan Quintela93604472017-06-06 19:49:03 +02001537 ram_counters.dirty_sync_count);
Juan Quintela56e93d22015-05-07 19:33:31 +02001538}
1539
1540#define ENCODING_FLAG_XBZRLE 0x1
1541
1542/**
1543 * save_xbzrle_page: compress and send current page
1544 *
1545 * Returns: 1 means that we wrote the page
1546 * 0 means that page is identical to the one already sent
1547 * -1 means that xbzrle would be longer than normal
1548 *
Juan Quintela5a987732017-03-13 19:39:02 +01001549 * @rs: current RAM state
Juan Quintela3d0684b2017-03-23 15:06:39 +01001550 * @current_data: pointer to the address of the page contents
1551 * @current_addr: addr of the page
Juan Quintela56e93d22015-05-07 19:33:31 +02001552 * @block: block that contains the page we want to send
1553 * @offset: offset inside the block for the page
1554 * @last_stage: if we are at the completion stage
Juan Quintela56e93d22015-05-07 19:33:31 +02001555 */
Juan Quintela204b88b2017-03-15 09:16:57 +01001556static int save_xbzrle_page(RAMState *rs, uint8_t **current_data,
Juan Quintela56e93d22015-05-07 19:33:31 +02001557 ram_addr_t current_addr, RAMBlock *block,
Juan Quintela072c2512017-03-14 10:27:31 +01001558 ram_addr_t offset, bool last_stage)
Juan Quintela56e93d22015-05-07 19:33:31 +02001559{
1560 int encoded_len = 0, bytes_xbzrle;
1561 uint8_t *prev_cached_page;
1562
Juan Quintela93604472017-06-06 19:49:03 +02001563 if (!cache_is_cached(XBZRLE.cache, current_addr,
1564 ram_counters.dirty_sync_count)) {
1565 xbzrle_counters.cache_miss++;
Juan Quintela56e93d22015-05-07 19:33:31 +02001566 if (!last_stage) {
1567 if (cache_insert(XBZRLE.cache, current_addr, *current_data,
Juan Quintela93604472017-06-06 19:49:03 +02001568 ram_counters.dirty_sync_count) == -1) {
Juan Quintela56e93d22015-05-07 19:33:31 +02001569 return -1;
1570 } else {
1571 /* update *current_data when the page has been
1572 inserted into cache */
1573 *current_data = get_cached_data(XBZRLE.cache, current_addr);
1574 }
1575 }
1576 return -1;
1577 }
1578
1579 prev_cached_page = get_cached_data(XBZRLE.cache, current_addr);
1580
1581 /* save current buffer into memory */
1582 memcpy(XBZRLE.current_buf, *current_data, TARGET_PAGE_SIZE);
1583
1584 /* XBZRLE encoding (if there is no overflow) */
1585 encoded_len = xbzrle_encode_buffer(prev_cached_page, XBZRLE.current_buf,
1586 TARGET_PAGE_SIZE, XBZRLE.encoded_buf,
1587 TARGET_PAGE_SIZE);
1588 if (encoded_len == 0) {
Juan Quintela55c44462017-01-23 22:32:05 +01001589 trace_save_xbzrle_page_skipping();
Juan Quintela56e93d22015-05-07 19:33:31 +02001590 return 0;
1591 } else if (encoded_len == -1) {
Juan Quintela55c44462017-01-23 22:32:05 +01001592 trace_save_xbzrle_page_overflow();
Juan Quintela93604472017-06-06 19:49:03 +02001593 xbzrle_counters.overflow++;
Juan Quintela56e93d22015-05-07 19:33:31 +02001594 /* update data in the cache */
1595 if (!last_stage) {
1596 memcpy(prev_cached_page, *current_data, TARGET_PAGE_SIZE);
1597 *current_data = prev_cached_page;
1598 }
1599 return -1;
1600 }
1601
1602 /* we need to update the data in the cache, in order to get the same data */
1603 if (!last_stage) {
1604 memcpy(prev_cached_page, XBZRLE.current_buf, TARGET_PAGE_SIZE);
1605 }
1606
1607 /* Send XBZRLE based compressed page */
Juan Quintela2bf3aa82017-05-10 13:28:13 +02001608 bytes_xbzrle = save_page_header(rs, rs->f, block,
Juan Quintela204b88b2017-03-15 09:16:57 +01001609 offset | RAM_SAVE_FLAG_XBZRLE);
1610 qemu_put_byte(rs->f, ENCODING_FLAG_XBZRLE);
1611 qemu_put_be16(rs->f, encoded_len);
1612 qemu_put_buffer(rs->f, XBZRLE.encoded_buf, encoded_len);
Juan Quintela56e93d22015-05-07 19:33:31 +02001613 bytes_xbzrle += encoded_len + 1 + 2;
Juan Quintela93604472017-06-06 19:49:03 +02001614 xbzrle_counters.pages++;
1615 xbzrle_counters.bytes += bytes_xbzrle;
1616 ram_counters.transferred += bytes_xbzrle;
Juan Quintela56e93d22015-05-07 19:33:31 +02001617
1618 return 1;
1619}
1620
Juan Quintela3d0684b2017-03-23 15:06:39 +01001621/**
1622 * migration_bitmap_find_dirty: find the next dirty page from start
Dr. David Alan Gilbertf3f491f2015-11-05 18:11:01 +00001623 *
Wei Yanga5f7b1a2019-05-11 07:37:29 +08001624 * Returns the page offset within memory region of the start of a dirty page
Juan Quintela3d0684b2017-03-23 15:06:39 +01001625 *
Juan Quintela6f37bb82017-03-13 19:26:29 +01001626 * @rs: current RAM state
Juan Quintela3d0684b2017-03-23 15:06:39 +01001627 * @rb: RAMBlock where to search for dirty pages
Juan Quintelaa935e302017-03-21 15:36:51 +01001628 * @start: page where we start the search
Dr. David Alan Gilbertf3f491f2015-11-05 18:11:01 +00001629 */
Juan Quintela56e93d22015-05-07 19:33:31 +02001630static inline
Juan Quintelaa935e302017-03-21 15:36:51 +01001631unsigned long migration_bitmap_find_dirty(RAMState *rs, RAMBlock *rb,
Juan Quintelaf20e2862017-03-21 16:19:05 +01001632 unsigned long start)
Juan Quintela56e93d22015-05-07 19:33:31 +02001633{
Juan Quintela6b6712e2017-03-22 15:18:04 +01001634 unsigned long size = rb->used_length >> TARGET_PAGE_BITS;
1635 unsigned long *bitmap = rb->bmap;
Juan Quintela56e93d22015-05-07 19:33:31 +02001636 unsigned long next;
1637
Yury Kotovfbd162e2019-02-15 20:45:46 +03001638 if (ramblock_is_ignored(rb)) {
Cédric Le Goaterb895de52018-05-14 08:57:00 +02001639 return size;
1640 }
1641
Wei Wang6eeb63f2018-12-11 16:24:52 +08001642 /*
1643 * When the free page optimization is enabled, we need to check the bitmap
1644 * to send the non-free pages rather than all the pages in the bulk stage.
1645 */
1646 if (!rs->fpo_enabled && rs->ram_bulk_stage && start > 0) {
Juan Quintela6b6712e2017-03-22 15:18:04 +01001647 next = start + 1;
Juan Quintela56e93d22015-05-07 19:33:31 +02001648 } else {
Juan Quintela6b6712e2017-03-22 15:18:04 +01001649 next = find_next_bit(bitmap, size, start);
Juan Quintela56e93d22015-05-07 19:33:31 +02001650 }
1651
Juan Quintela6b6712e2017-03-22 15:18:04 +01001652 return next;
Juan Quintela56e93d22015-05-07 19:33:31 +02001653}
1654
Juan Quintela06b10682017-03-21 15:18:05 +01001655static inline bool migration_bitmap_clear_dirty(RAMState *rs,
Juan Quintelaf20e2862017-03-21 16:19:05 +01001656 RAMBlock *rb,
1657 unsigned long page)
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00001658{
1659 bool ret;
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00001660
Wei Wang386a9072018-12-11 16:24:49 +08001661 qemu_mutex_lock(&rs->bitmap_mutex);
Juan Quintela6b6712e2017-03-22 15:18:04 +01001662 ret = test_and_clear_bit(page, rb->bmap);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00001663
1664 if (ret) {
Juan Quintela0d8ec882017-03-13 21:21:41 +01001665 rs->migration_dirty_pages--;
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00001666 }
Wei Wang386a9072018-12-11 16:24:49 +08001667 qemu_mutex_unlock(&rs->bitmap_mutex);
1668
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00001669 return ret;
1670}
1671
Juan Quintela15440dd2017-03-21 09:35:04 +01001672static void migration_bitmap_sync_range(RAMState *rs, RAMBlock *rb,
Wei Yangbf212972019-04-30 11:44:10 +08001673 ram_addr_t length)
Juan Quintela56e93d22015-05-07 19:33:31 +02001674{
Juan Quintela0d8ec882017-03-13 21:21:41 +01001675 rs->migration_dirty_pages +=
Wei Yangbf212972019-04-30 11:44:10 +08001676 cpu_physical_memory_sync_dirty_bitmap(rb, 0, length,
Juan Quintela0d8ec882017-03-13 21:21:41 +01001677 &rs->num_dirty_pages_period);
Juan Quintela56e93d22015-05-07 19:33:31 +02001678}
1679
Juan Quintela3d0684b2017-03-23 15:06:39 +01001680/**
1681 * ram_pagesize_summary: calculate all the pagesizes of a VM
1682 *
1683 * Returns a summary bitmap of the page sizes of all RAMBlocks
1684 *
1685 * For VMs with just normal pages this is equivalent to the host page
1686 * size. If it's got some huge pages then it's the OR of all the
1687 * different page sizes.
Dr. David Alan Gilberte8ca1db2017-02-24 18:28:29 +00001688 */
1689uint64_t ram_pagesize_summary(void)
1690{
1691 RAMBlock *block;
1692 uint64_t summary = 0;
1693
Yury Kotovfbd162e2019-02-15 20:45:46 +03001694 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Dr. David Alan Gilberte8ca1db2017-02-24 18:28:29 +00001695 summary |= block->page_size;
1696 }
1697
1698 return summary;
1699}
1700
Xiao Guangrongaecbfe92019-01-11 14:37:30 +08001701uint64_t ram_get_total_transferred_pages(void)
1702{
1703 return ram_counters.normal + ram_counters.duplicate +
1704 compression_counters.pages + xbzrle_counters.pages;
1705}
1706
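/*
 * migration_update_rates: recompute the per-period rate counters
 *
 * Updates dirty_pages_rate and, when the features are in use, the
 * xbzrle cache-miss rate and the compression busy rate and compression
 * ratio for the period ending at @end_time, using the *_prev snapshots
 * kept in @rs.
 */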
Xiao Guangrongb7340352018-06-04 17:55:12 +08001707static void migration_update_rates(RAMState *rs, int64_t end_time)
1708{
Xiao Guangrongbe8b02e2018-09-03 17:26:42 +08001709 uint64_t page_count = rs->target_page_count - rs->target_page_count_prev;
Xiao Guangrong76e03002018-09-06 15:01:00 +08001710 double compressed_size;
Xiao Guangrongb7340352018-06-04 17:55:12 +08001711
1712 /* calculate period counters */
1713 ram_counters.dirty_pages_rate = rs->num_dirty_pages_period * 1000
1714 / (end_time - rs->time_last_bitmap_sync);
1715
Xiao Guangrongbe8b02e2018-09-03 17:26:42 +08001716 if (!page_count) {
Xiao Guangrongb7340352018-06-04 17:55:12 +08001717 return;
1718 }
1719
1720 if (migrate_use_xbzrle()) {
1721 xbzrle_counters.cache_miss_rate = (double)(xbzrle_counters.cache_miss -
Xiao Guangrongbe8b02e2018-09-03 17:26:42 +08001722 rs->xbzrle_cache_miss_prev) / page_count;
Xiao Guangrongb7340352018-06-04 17:55:12 +08001723 rs->xbzrle_cache_miss_prev = xbzrle_counters.cache_miss;
1724 }
Xiao Guangrong76e03002018-09-06 15:01:00 +08001725
1726 if (migrate_use_compression()) {
1727 compression_counters.busy_rate = (double)(compression_counters.busy -
1728 rs->compress_thread_busy_prev) / page_count;
1729 rs->compress_thread_busy_prev = compression_counters.busy;
1730
1731 compressed_size = compression_counters.compressed_size -
1732 rs->compressed_size_prev;
1733 if (compressed_size) {
1734 double uncompressed_size = (compression_counters.pages -
1735 rs->compress_pages_prev) * TARGET_PAGE_SIZE;
1736
1737 /* Compression-Ratio = Uncompressed-size / Compressed-size */
1738 compression_counters.compression_rate =
1739 uncompressed_size / compressed_size;
1740
1741 rs->compress_pages_prev = compression_counters.pages;
1742 rs->compressed_size_prev = compression_counters.compressed_size;
1743 }
1744 }
Xiao Guangrongb7340352018-06-04 17:55:12 +08001745}
1746
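/*
 * migration_bitmap_sync: sync the dirty bitmap of all RAMBlocks
 *
 * Synchronizes the global dirty log into each RAMBlock's bitmap,
 * updates the period counters and, at most once per second, decides
 * whether auto-converge throttling needs to start or be increased.
 */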
Juan Quintela8d820d62017-03-13 19:35:50 +01001747static void migration_bitmap_sync(RAMState *rs)
Juan Quintela56e93d22015-05-07 19:33:31 +02001748{
1749 RAMBlock *block;
Juan Quintela56e93d22015-05-07 19:33:31 +02001750 int64_t end_time;
Juan Quintelac4bdf0c2017-03-28 14:59:54 +02001751 uint64_t bytes_xfer_now;
Juan Quintela56e93d22015-05-07 19:33:31 +02001752
Juan Quintela93604472017-06-06 19:49:03 +02001753 ram_counters.dirty_sync_count++;
Juan Quintela56e93d22015-05-07 19:33:31 +02001754
Juan Quintelaf664da82017-03-13 19:44:57 +01001755 if (!rs->time_last_bitmap_sync) {
1756 rs->time_last_bitmap_sync = qemu_clock_get_ms(QEMU_CLOCK_REALTIME);
Juan Quintela56e93d22015-05-07 19:33:31 +02001757 }
1758
1759 trace_migration_bitmap_sync_start();
Paolo Bonzini9c1f8f42016-09-22 16:08:31 +02001760 memory_global_dirty_log_sync();
Juan Quintela56e93d22015-05-07 19:33:31 +02001761
Juan Quintela108cfae2017-03-13 21:38:09 +01001762 qemu_mutex_lock(&rs->bitmap_mutex);
Juan Quintela56e93d22015-05-07 19:33:31 +02001763 rcu_read_lock();
Yury Kotovfbd162e2019-02-15 20:45:46 +03001764 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Wei Yangbf212972019-04-30 11:44:10 +08001765 migration_bitmap_sync_range(rs, block, block->used_length);
Juan Quintela56e93d22015-05-07 19:33:31 +02001766 }
Balamuruhan S650af892018-06-12 14:20:09 +05301767 ram_counters.remaining = ram_bytes_remaining();
Juan Quintela56e93d22015-05-07 19:33:31 +02001768 rcu_read_unlock();
Juan Quintela108cfae2017-03-13 21:38:09 +01001769 qemu_mutex_unlock(&rs->bitmap_mutex);
Juan Quintela56e93d22015-05-07 19:33:31 +02001770
Juan Quintelaa66cd902017-03-28 15:02:43 +02001771 trace_migration_bitmap_sync_end(rs->num_dirty_pages_period);
Chao Fan1ffb5df2017-03-14 09:55:07 +08001772
Juan Quintela56e93d22015-05-07 19:33:31 +02001773 end_time = qemu_clock_get_ms(QEMU_CLOCK_REALTIME);
1774
1775 /* more than 1 second = 1000 milliseconds */
Juan Quintelaf664da82017-03-13 19:44:57 +01001776 if (end_time > rs->time_last_bitmap_sync + 1000) {
Juan Quintela93604472017-06-06 19:49:03 +02001777 bytes_xfer_now = ram_counters.transferred;
Felipe Franciosid693c6f2017-05-24 17:10:01 +01001778
Peter Lieven9ac78b62017-09-26 12:33:16 +02001779 /* During block migration the auto-converge logic incorrectly detects
1780 * that ram migration makes no progress. Avoid this by disabling the
1781 * throttling logic during the bulk phase of block migration. */
1782 if (migrate_auto_converge() && !blk_mig_bulk_active()) {
Juan Quintela56e93d22015-05-07 19:33:31 +02001783 /* The following detection logic can be refined later. For now:
1784 Check to see if the dirtied bytes are 50% more than the approx.
1785 amount of bytes that just got transferred since the last time we
Jason J. Herne070afca2015-09-08 13:12:35 -04001786 were in this routine. If that happens twice, start or increase
1787 throttling */
Jason J. Herne070afca2015-09-08 13:12:35 -04001788
Felipe Franciosid693c6f2017-05-24 17:10:01 +01001789 if ((rs->num_dirty_pages_period * TARGET_PAGE_SIZE >
Juan Quintelaeac74152017-03-28 14:59:01 +02001790 (bytes_xfer_now - rs->bytes_xfer_prev) / 2) &&
Felipe Franciosib4a3c642017-05-24 17:10:03 +01001791 (++rs->dirty_rate_high_cnt >= 2)) {
Juan Quintela56e93d22015-05-07 19:33:31 +02001792 trace_migration_throttle();
Juan Quintela8d820d62017-03-13 19:35:50 +01001793 rs->dirty_rate_high_cnt = 0;
Jason J. Herne070afca2015-09-08 13:12:35 -04001794 mig_throttle_guest_down();
Felipe Franciosid693c6f2017-05-24 17:10:01 +01001795 }
Juan Quintela56e93d22015-05-07 19:33:31 +02001796 }
Jason J. Herne070afca2015-09-08 13:12:35 -04001797
Xiao Guangrongb7340352018-06-04 17:55:12 +08001798 migration_update_rates(rs, end_time);
1799
Xiao Guangrongbe8b02e2018-09-03 17:26:42 +08001800 rs->target_page_count_prev = rs->target_page_count;
Felipe Franciosid693c6f2017-05-24 17:10:01 +01001801
1802 /* reset period counters */
Juan Quintelaf664da82017-03-13 19:44:57 +01001803 rs->time_last_bitmap_sync = end_time;
Juan Quintelaa66cd902017-03-28 15:02:43 +02001804 rs->num_dirty_pages_period = 0;
Felipe Franciosid2a4d852017-05-24 17:10:02 +01001805 rs->bytes_xfer_prev = bytes_xfer_now;
Juan Quintela56e93d22015-05-07 19:33:31 +02001806 }
Dr. David Alan Gilbert4addcd42015-12-16 11:47:36 +00001807 if (migrate_use_events()) {
Peter Xu3ab72382018-08-15 21:37:37 +08001808 qapi_event_send_migration_pass(ram_counters.dirty_sync_count);
Dr. David Alan Gilbert4addcd42015-12-16 11:47:36 +00001809 }
Juan Quintela56e93d22015-05-07 19:33:31 +02001810}
1811
Wei Wangbd227062018-12-11 16:24:51 +08001812static void migration_bitmap_sync_precopy(RAMState *rs)
1813{
1814 Error *local_err = NULL;
1815
1816 /*
1817 * The current notifier usage is just an optimization to migration, so we
1818 * don't stop the normal migration process in the error case.
1819 */
1820 if (precopy_notify(PRECOPY_NOTIFY_BEFORE_BITMAP_SYNC, &local_err)) {
1821 error_report_err(local_err);
1822 }
1823
1824 migration_bitmap_sync(rs);
1825
1826 if (precopy_notify(PRECOPY_NOTIFY_AFTER_BITMAP_SYNC, &local_err)) {
1827 error_report_err(local_err);
1828 }
1829}
1830
Juan Quintela56e93d22015-05-07 19:33:31 +02001831/**
Xiao Guangrong6c97ec52018-08-21 16:10:22 +08001832 * save_zero_page_to_file: send the zero page to the file
1833 *
1834 * Returns the size of data written to the file, 0 means the page is not
1835 * a zero page
1836 *
1837 * @rs: current RAM state
1838 * @file: the file where the data is saved
1839 * @block: block that contains the page we want to send
1840 * @offset: offset inside the block for the page
1841 */
1842static int save_zero_page_to_file(RAMState *rs, QEMUFile *file,
1843 RAMBlock *block, ram_addr_t offset)
1844{
1845 uint8_t *p = block->host + offset;
1846 int len = 0;
1847
1848 if (is_zero_range(p, TARGET_PAGE_SIZE)) {
1849 len += save_page_header(rs, file, block, offset | RAM_SAVE_FLAG_ZERO);
1850 qemu_put_byte(file, 0);
1851 len += 1;
1852 }
1853 return len;
1854}
1855
1856/**
Juan Quintela3d0684b2017-03-23 15:06:39 +01001857 * save_zero_page: send the zero page to the stream
Juan Quintela56e93d22015-05-07 19:33:31 +02001858 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01001859 * Returns the number of pages written.
Juan Quintela56e93d22015-05-07 19:33:31 +02001860 *
Juan Quintelaf7ccd612017-03-13 20:30:21 +01001861 * @rs: current RAM state
Juan Quintela56e93d22015-05-07 19:33:31 +02001862 * @block: block that contains the page we want to send
1863 * @offset: offset inside the block for the page
Juan Quintela56e93d22015-05-07 19:33:31 +02001864 */
Juan Quintela7faccdc2018-01-08 18:58:17 +01001865static int save_zero_page(RAMState *rs, RAMBlock *block, ram_addr_t offset)
Juan Quintela56e93d22015-05-07 19:33:31 +02001866{
Xiao Guangrong6c97ec52018-08-21 16:10:22 +08001867 int len = save_zero_page_to_file(rs, rs->f, block, offset);
Juan Quintela56e93d22015-05-07 19:33:31 +02001868
Xiao Guangrong6c97ec52018-08-21 16:10:22 +08001869 if (len) {
Juan Quintela93604472017-06-06 19:49:03 +02001870 ram_counters.duplicate++;
Xiao Guangrong6c97ec52018-08-21 16:10:22 +08001871 ram_counters.transferred += len;
1872 return 1;
Juan Quintela56e93d22015-05-07 19:33:31 +02001873 }
Xiao Guangrong6c97ec52018-08-21 16:10:22 +08001874 return -1;
Juan Quintela56e93d22015-05-07 19:33:31 +02001875}
1876
Juan Quintela57273092017-03-20 22:25:28 +01001877static void ram_release_pages(const char *rbname, uint64_t offset, int pages)
Pavel Butsykin53f09a12017-02-03 18:23:20 +03001878{
Juan Quintela57273092017-03-20 22:25:28 +01001879 if (!migrate_release_ram() || !migration_in_postcopy()) {
Pavel Butsykin53f09a12017-02-03 18:23:20 +03001880 return;
1881 }
1882
Juan Quintelaaaa20642017-03-21 11:35:24 +01001883 ram_discard_range(rbname, offset, pages << TARGET_PAGE_BITS);
Pavel Butsykin53f09a12017-02-03 18:23:20 +03001884}
1885
Xiao Guangrong059ff0f2018-03-30 15:51:23 +08001886/*
1887 * @pages: the number of pages written by the control path,
1888 * < 0 - error
1889 * > 0 - number of pages written
1890 *
1891 * Return true if the page has been saved, otherwise false is returned.
1892 */
1893static bool control_save_page(RAMState *rs, RAMBlock *block, ram_addr_t offset,
1894 int *pages)
1895{
1896 uint64_t bytes_xmit = 0;
1897 int ret;
1898
1899 *pages = -1;
1900 ret = ram_control_save_page(rs->f, block->offset, offset, TARGET_PAGE_SIZE,
1901 &bytes_xmit);
1902 if (ret == RAM_SAVE_CONTROL_NOT_SUPP) {
1903 return false;
1904 }
1905
1906 if (bytes_xmit) {
1907 ram_counters.transferred += bytes_xmit;
1908 *pages = 1;
1909 }
1910
1911 if (ret == RAM_SAVE_CONTROL_DELAYED) {
1912 return true;
1913 }
1914
1915 if (bytes_xmit > 0) {
1916 ram_counters.normal++;
1917 } else if (bytes_xmit == 0) {
1918 ram_counters.duplicate++;
1919 }
1920
1921 return true;
1922}
1923
Xiao Guangrong65dacaa2018-03-30 15:51:27 +08001924/*
1925 * directly send the page to the stream
1926 *
1927 * Returns the number of pages written.
1928 *
1929 * @rs: current RAM state
1930 * @block: block that contains the page we want to send
1931 * @offset: offset inside the block for the page
1932 * @buf: the page to be sent
1933 * @async: send the page asynchronously
1934 */
1935static int save_normal_page(RAMState *rs, RAMBlock *block, ram_addr_t offset,
1936 uint8_t *buf, bool async)
1937{
1938 ram_counters.transferred += save_page_header(rs, rs->f, block,
1939 offset | RAM_SAVE_FLAG_PAGE);
1940 if (async) {
1941 qemu_put_buffer_async(rs->f, buf, TARGET_PAGE_SIZE,
1942 migrate_release_ram() &
1943 migration_in_postcopy());
1944 } else {
1945 qemu_put_buffer(rs->f, buf, TARGET_PAGE_SIZE);
1946 }
1947 ram_counters.transferred += TARGET_PAGE_SIZE;
1948 ram_counters.normal++;
1949 return 1;
1950}
1951
Juan Quintela56e93d22015-05-07 19:33:31 +02001952/**
Juan Quintela3d0684b2017-03-23 15:06:39 +01001953 * ram_save_page: send the given page to the stream
Juan Quintela56e93d22015-05-07 19:33:31 +02001954 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01001955 * Returns the number of pages written.
Dr. David Alan Gilbert3fd3c4b2015-12-10 16:31:46 +00001956 * < 0 - error
1957 * >=0 - Number of pages written - this might legally be 0
1958 * if xbzrle noticed the page was the same.
Juan Quintela56e93d22015-05-07 19:33:31 +02001959 *
Juan Quintela6f37bb82017-03-13 19:26:29 +01001960 * @rs: current RAM state
Juan Quintela56e93d22015-05-07 19:33:31 +02001961 * @block: block that contains the page we want to send
1962 * @offset: offset inside the block for the page
1963 * @last_stage: if we are at the completion stage
Juan Quintela56e93d22015-05-07 19:33:31 +02001964 */
Juan Quintelaa0a8aa12017-03-20 22:29:07 +01001965static int ram_save_page(RAMState *rs, PageSearchStatus *pss, bool last_stage)
Juan Quintela56e93d22015-05-07 19:33:31 +02001966{
1967 int pages = -1;
Juan Quintela56e93d22015-05-07 19:33:31 +02001968 uint8_t *p;
Juan Quintela56e93d22015-05-07 19:33:31 +02001969 bool send_async = true;
zhanghailianga08f6892016-01-15 11:37:44 +08001970 RAMBlock *block = pss->block;
Juan Quintelaa935e302017-03-21 15:36:51 +01001971 ram_addr_t offset = pss->page << TARGET_PAGE_BITS;
Xiao Guangrong059ff0f2018-03-30 15:51:23 +08001972 ram_addr_t current_addr = block->offset + offset;
Juan Quintela56e93d22015-05-07 19:33:31 +02001973
Dr. David Alan Gilbert2f68e392015-08-13 11:51:30 +01001974 p = block->host + offset;
Dr. David Alan Gilbert1db9d8e2017-04-26 19:37:21 +01001975 trace_ram_save_page(block->idstr, (uint64_t)offset, p);
Juan Quintela56e93d22015-05-07 19:33:31 +02001976
Juan Quintela56e93d22015-05-07 19:33:31 +02001977 XBZRLE_cache_lock();
Xiao Guangrongd7400a32018-03-30 15:51:26 +08001978 if (!rs->ram_bulk_stage && !migration_in_postcopy() &&
1979 migrate_use_xbzrle()) {
Xiao Guangrong059ff0f2018-03-30 15:51:23 +08001980 pages = save_xbzrle_page(rs, &p, current_addr, block,
1981 offset, last_stage);
1982 if (!last_stage) {
1983 /* Can't send this cached data async, since the cache page
1984 * might get updated before it gets to the wire
Juan Quintela56e93d22015-05-07 19:33:31 +02001985 */
Xiao Guangrong059ff0f2018-03-30 15:51:23 +08001986 send_async = false;
Juan Quintela56e93d22015-05-07 19:33:31 +02001987 }
1988 }
1989
1990 /* XBZRLE overflow or normal page */
1991 if (pages == -1) {
Xiao Guangrong65dacaa2018-03-30 15:51:27 +08001992 pages = save_normal_page(rs, block, offset, p, send_async);
Juan Quintela56e93d22015-05-07 19:33:31 +02001993 }
1994
1995 XBZRLE_cache_unlock();
1996
1997 return pages;
1998}
1999
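/*
 * ram_save_multifd_page: queue one page for the multifd channels
 *
 * The page is not written to the main migration stream here; it is
 * handed to multifd_queue_page() and sent over one of the multifd
 * channels. Always accounted as one normal page.
 */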
Juan Quintelab9ee2f72016-01-15 11:40:13 +01002000static int ram_save_multifd_page(RAMState *rs, RAMBlock *block,
2001 ram_addr_t offset)
2002{
Juan Quintelab9ee2f72016-01-15 11:40:13 +01002003 multifd_queue_page(block, offset);
Juan Quintelab9ee2f72016-01-15 11:40:13 +01002004 ram_counters.normal++;
2005
2006 return 1;
2007}
2008
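/*
 * do_compress_ram_page: compress one page from a compression thread
 *
 * Returns true if the page turned out to be a zero page (only the
 * zero-page marker is written in that case), false otherwise. The page
 * is first copied into @source_buf so that concurrent guest writes
 * cannot change the data while it is being compressed.
 */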
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002009static bool do_compress_ram_page(QEMUFile *f, z_stream *stream, RAMBlock *block,
Xiao Guangrong6ef37712018-08-21 16:10:23 +08002010 ram_addr_t offset, uint8_t *source_buf)
Juan Quintela56e93d22015-05-07 19:33:31 +02002011{
Juan Quintela53518d92017-05-04 11:46:24 +02002012 RAMState *rs = ram_state;
Liang Lia7a9a882016-05-05 15:32:57 +08002013 uint8_t *p = block->host + (offset & TARGET_PAGE_MASK);
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002014 bool zero_page = false;
Xiao Guangrong6ef37712018-08-21 16:10:23 +08002015 int ret;
Juan Quintela56e93d22015-05-07 19:33:31 +02002016
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002017 if (save_zero_page_to_file(rs, f, block, offset)) {
2018 zero_page = true;
2019 goto exit;
2020 }
2021
Xiao Guangrong6ef37712018-08-21 16:10:23 +08002022 save_page_header(rs, f, block, offset | RAM_SAVE_FLAG_COMPRESS_PAGE);
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08002023
2024 /*
2025 * copy it to an internal buffer to avoid it being modified by the VM
2026 * so that we can catch the error during compression and
2027 * decompression
2028 */
2029 memcpy(source_buf, p, TARGET_PAGE_SIZE);
Xiao Guangrong6ef37712018-08-21 16:10:23 +08002030 ret = qemu_put_compression_data(f, stream, source_buf, TARGET_PAGE_SIZE);
2031 if (ret < 0) {
2032 qemu_file_set_error(migrate_get_current()->to_dst_file, ret);
Liang Lib3be2892016-05-05 15:32:54 +08002033 error_report("compressed data failed!");
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002034 return false;
Liang Lib3be2892016-05-05 15:32:54 +08002035 }
Juan Quintela56e93d22015-05-07 19:33:31 +02002036
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002037exit:
Xiao Guangrong6ef37712018-08-21 16:10:23 +08002038 ram_release_pages(block->idstr, offset & TARGET_PAGE_MASK, 1);
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002039 return zero_page;
2040}
2041
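/*
 * update_compress_thread_counts: account for one completed compression
 *
 * @bytes_xmit (including the page header) is always added to the
 * transferred counter; zero pages additionally bump the duplicate
 * counter, while compressed pages update the compressed size (minus
 * the 8 byte RAM_SAVE_FLAG_CONTINUE header) and the page count.
 */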
2042static void
2043update_compress_thread_counts(const CompressParam *param, int bytes_xmit)
2044{
Xiao Guangrong76e03002018-09-06 15:01:00 +08002045 ram_counters.transferred += bytes_xmit;
2046
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002047 if (param->zero_page) {
2048 ram_counters.duplicate++;
Xiao Guangrong76e03002018-09-06 15:01:00 +08002049 return;
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002050 }
Xiao Guangrong76e03002018-09-06 15:01:00 +08002051
2052 /* 8 means a header with RAM_SAVE_FLAG_CONTINUE. */
2053 compression_counters.compressed_size += bytes_xmit - 8;
2054 compression_counters.pages++;
Juan Quintela56e93d22015-05-07 19:33:31 +02002055}
2056
Xiao Guangrong32b05492018-09-06 15:01:01 +08002057static bool save_page_use_compression(RAMState *rs);
2058
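/*
 * flush_compressed_data: drain the compression threads
 *
 * Waits for every compression thread to finish its current page and
 * then flushes each thread's buffered output into the migration
 * stream, updating the counters. Used where ordering matters, e.g.
 * before starting a new RAMBlock.
 */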
Juan Quintelace25d332017-03-15 11:00:51 +01002059static void flush_compressed_data(RAMState *rs)
Juan Quintela56e93d22015-05-07 19:33:31 +02002060{
2061 int idx, len, thread_count;
2062
Xiao Guangrong32b05492018-09-06 15:01:01 +08002063 if (!save_page_use_compression(rs)) {
Juan Quintela56e93d22015-05-07 19:33:31 +02002064 return;
2065 }
2066 thread_count = migrate_compress_threads();
Liang Lia7a9a882016-05-05 15:32:57 +08002067
Liang Li0d9f9a52016-05-05 15:32:59 +08002068 qemu_mutex_lock(&comp_done_lock);
Juan Quintela56e93d22015-05-07 19:33:31 +02002069 for (idx = 0; idx < thread_count; idx++) {
Liang Lia7a9a882016-05-05 15:32:57 +08002070 while (!comp_param[idx].done) {
Liang Li0d9f9a52016-05-05 15:32:59 +08002071 qemu_cond_wait(&comp_done_cond, &comp_done_lock);
Juan Quintela56e93d22015-05-07 19:33:31 +02002072 }
Liang Lia7a9a882016-05-05 15:32:57 +08002073 }
Liang Li0d9f9a52016-05-05 15:32:59 +08002074 qemu_mutex_unlock(&comp_done_lock);
Liang Lia7a9a882016-05-05 15:32:57 +08002075
2076 for (idx = 0; idx < thread_count; idx++) {
2077 qemu_mutex_lock(&comp_param[idx].mutex);
Liang Li90e56fb2016-05-05 15:32:56 +08002078 if (!comp_param[idx].quit) {
Juan Quintelace25d332017-03-15 11:00:51 +01002079 len = qemu_put_qemu_file(rs->f, comp_param[idx].file);
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002080 /*
2081 * it's safe to fetch zero_page without holding comp_done_lock
2082 * as there is no further request submitted to the thread,
2083 * i.e., the thread should be waiting for a request at this point.
2084 */
2085 update_compress_thread_counts(&comp_param[idx], len);
Juan Quintela56e93d22015-05-07 19:33:31 +02002086 }
Liang Lia7a9a882016-05-05 15:32:57 +08002087 qemu_mutex_unlock(&comp_param[idx].mutex);
Juan Quintela56e93d22015-05-07 19:33:31 +02002088 }
2089}
2090
2091static inline void set_compress_params(CompressParam *param, RAMBlock *block,
2092 ram_addr_t offset)
2093{
2094 param->block = block;
2095 param->offset = offset;
2096}
2097
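/*
 * compress_page_with_multi_thread: hand one page to an idle compression thread
 *
 * Returns 1 if a thread accepted the page, or -1 if all threads were
 * busy and 'compress-wait-thread' is off; the caller then sends the
 * page uncompressed. With 'compress-wait-thread' on, the function
 * blocks until a thread becomes free.
 */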
Juan Quintelace25d332017-03-15 11:00:51 +01002098static int compress_page_with_multi_thread(RAMState *rs, RAMBlock *block,
2099 ram_addr_t offset)
Juan Quintela56e93d22015-05-07 19:33:31 +02002100{
2101 int idx, thread_count, bytes_xmit = -1, pages = -1;
Xiao Guangrong1d588722018-08-21 16:10:20 +08002102 bool wait = migrate_compress_wait_thread();
Juan Quintela56e93d22015-05-07 19:33:31 +02002103
2104 thread_count = migrate_compress_threads();
Liang Li0d9f9a52016-05-05 15:32:59 +08002105 qemu_mutex_lock(&comp_done_lock);
Xiao Guangrong1d588722018-08-21 16:10:20 +08002106retry:
2107 for (idx = 0; idx < thread_count; idx++) {
2108 if (comp_param[idx].done) {
2109 comp_param[idx].done = false;
2110 bytes_xmit = qemu_put_qemu_file(rs->f, comp_param[idx].file);
2111 qemu_mutex_lock(&comp_param[idx].mutex);
2112 set_compress_params(&comp_param[idx], block, offset);
2113 qemu_cond_signal(&comp_param[idx].cond);
2114 qemu_mutex_unlock(&comp_param[idx].mutex);
2115 pages = 1;
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002116 update_compress_thread_counts(&comp_param[idx], bytes_xmit);
Juan Quintela56e93d22015-05-07 19:33:31 +02002117 break;
Juan Quintela56e93d22015-05-07 19:33:31 +02002118 }
2119 }
Xiao Guangrong1d588722018-08-21 16:10:20 +08002120
2121 /*
2122 * wait for the free thread if the user specifies 'compress-wait-thread',
2123 * otherwise we will post the page out in the main thread as normal page.
2124 */
2125 if (pages < 0 && wait) {
2126 qemu_cond_wait(&comp_done_cond, &comp_done_lock);
2127 goto retry;
2128 }
Liang Li0d9f9a52016-05-05 15:32:59 +08002129 qemu_mutex_unlock(&comp_done_lock);
Juan Quintela56e93d22015-05-07 19:33:31 +02002130
2131 return pages;
2132}
2133
2134/**
Juan Quintela3d0684b2017-03-23 15:06:39 +01002135 * find_dirty_block: find the next dirty page and update any state
2136 * associated with the search process.
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002137 *
Wei Yanga5f7b1a2019-05-11 07:37:29 +08002138 * Returns true if a page is found
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002139 *
Juan Quintela6f37bb82017-03-13 19:26:29 +01002140 * @rs: current RAM state
Juan Quintela3d0684b2017-03-23 15:06:39 +01002141 * @pss: data about the state of the current dirty page scan
2142 * @again: set to false if the search has scanned the whole of RAM
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002143 */
Juan Quintelaf20e2862017-03-21 16:19:05 +01002144static bool find_dirty_block(RAMState *rs, PageSearchStatus *pss, bool *again)
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002145{
Juan Quintelaf20e2862017-03-21 16:19:05 +01002146 pss->page = migration_bitmap_find_dirty(rs, pss->block, pss->page);
Juan Quintela6f37bb82017-03-13 19:26:29 +01002147 if (pss->complete_round && pss->block == rs->last_seen_block &&
Juan Quintelaa935e302017-03-21 15:36:51 +01002148 pss->page >= rs->last_page) {
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002149 /*
2150 * We've been once around the RAM and haven't found anything.
2151 * Give up.
2152 */
2153 *again = false;
2154 return false;
2155 }
Juan Quintelaa935e302017-03-21 15:36:51 +01002156 if ((pss->page << TARGET_PAGE_BITS) >= pss->block->used_length) {
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002157 /* Didn't find anything in this RAM Block */
Juan Quintelaa935e302017-03-21 15:36:51 +01002158 pss->page = 0;
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002159 pss->block = QLIST_NEXT_RCU(pss->block, next);
2160 if (!pss->block) {
Xiao Guangrong48df9d82018-09-06 15:00:59 +08002161 /*
2162 * If memory migration starts over, we will meet a dirtied page
2163 * which may still exist in the compression threads' ring, so we
2164 * should flush the compressed data to make sure the new page
2165 * is not overwritten by the old one in the destination.
2166 *
2167 * Also, if xbzrle is on, stop using the data compression at this
2168 * point. In theory, xbzrle can do better than compression.
2169 */
2170 flush_compressed_data(rs);
2171
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002172 /* Hit the end of the list */
2173 pss->block = QLIST_FIRST_RCU(&ram_list.blocks);
2174 /* Flag that we've looped */
2175 pss->complete_round = true;
Juan Quintela6f37bb82017-03-13 19:26:29 +01002176 rs->ram_bulk_stage = false;
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002177 }
2178 /* Didn't find anything this time, but try again on the new block */
2179 *again = true;
2180 return false;
2181 } else {
2182 /* Can go around again, but... */
2183 *again = true;
2184 /* We've found something so probably don't need to */
2185 return true;
2186 }
2187}
2188
Juan Quintela3d0684b2017-03-23 15:06:39 +01002189/**
2190 * unqueue_page: gets a page off the queue
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002191 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01002192 * Helper for 'get_queued_page' - gets a page off the queue
2193 *
2194 * Returns the block of the page (or NULL if none available)
2195 *
Juan Quintelaec481c62017-03-20 22:12:40 +01002196 * @rs: current RAM state
Juan Quintela3d0684b2017-03-23 15:06:39 +01002197 * @offset: used to return the offset within the RAMBlock
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002198 */
Juan Quintelaf20e2862017-03-21 16:19:05 +01002199static RAMBlock *unqueue_page(RAMState *rs, ram_addr_t *offset)
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002200{
2201 RAMBlock *block = NULL;
2202
Xiao Guangrongae526e32018-08-21 16:10:25 +08002203 if (QSIMPLEQ_EMPTY_ATOMIC(&rs->src_page_requests)) {
2204 return NULL;
2205 }
2206
Juan Quintelaec481c62017-03-20 22:12:40 +01002207 qemu_mutex_lock(&rs->src_page_req_mutex);
2208 if (!QSIMPLEQ_EMPTY(&rs->src_page_requests)) {
2209 struct RAMSrcPageRequest *entry =
2210 QSIMPLEQ_FIRST(&rs->src_page_requests);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002211 block = entry->rb;
2212 *offset = entry->offset;
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002213
2214 if (entry->len > TARGET_PAGE_SIZE) {
2215 entry->len -= TARGET_PAGE_SIZE;
2216 entry->offset += TARGET_PAGE_SIZE;
2217 } else {
2218 memory_region_unref(block->mr);
Juan Quintelaec481c62017-03-20 22:12:40 +01002219 QSIMPLEQ_REMOVE_HEAD(&rs->src_page_requests, next_req);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002220 g_free(entry);
Dr. David Alan Gilberte03a34f2018-06-13 11:26:42 +01002221 migration_consume_urgent_request();
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002222 }
2223 }
Juan Quintelaec481c62017-03-20 22:12:40 +01002224 qemu_mutex_unlock(&rs->src_page_req_mutex);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002225
2226 return block;
2227}
2228
Juan Quintela3d0684b2017-03-23 15:06:39 +01002229/**
2230 * get_queued_page: unqueue a page from the postcopy requests
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002231 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01002232 * Skips pages that are already sent (!dirty)
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002233 *
Wei Yanga5f7b1a2019-05-11 07:37:29 +08002234 * Returns true if a queued page is found
Juan Quintela3d0684b2017-03-23 15:06:39 +01002235 *
Juan Quintela6f37bb82017-03-13 19:26:29 +01002236 * @rs: current RAM state
Juan Quintela3d0684b2017-03-23 15:06:39 +01002237 * @pss: data about the state of the current dirty page scan
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002238 */
Juan Quintelaf20e2862017-03-21 16:19:05 +01002239static bool get_queued_page(RAMState *rs, PageSearchStatus *pss)
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002240{
2241 RAMBlock *block;
2242 ram_addr_t offset;
2243 bool dirty;
2244
2245 do {
Juan Quintelaf20e2862017-03-21 16:19:05 +01002246 block = unqueue_page(rs, &offset);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002247 /*
2248 * We're sending this page, and since it's postcopy nothing else
2249 * will dirty it, and we must make sure it doesn't get sent again
2250 * even if this queue request was received after the background
2251 * search already sent it.
2252 */
2253 if (block) {
Juan Quintelaf20e2862017-03-21 16:19:05 +01002254 unsigned long page;
2255
Juan Quintela6b6712e2017-03-22 15:18:04 +01002256 page = offset >> TARGET_PAGE_BITS;
2257 dirty = test_bit(page, block->bmap);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002258 if (!dirty) {
Juan Quintela06b10682017-03-21 15:18:05 +01002259 trace_get_queued_page_not_dirty(block->idstr, (uint64_t)offset,
Juan Quintela6b6712e2017-03-22 15:18:04 +01002260 page, test_bit(page, block->unsentmap));
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002261 } else {
Juan Quintelaf20e2862017-03-21 16:19:05 +01002262 trace_get_queued_page(block->idstr, (uint64_t)offset, page);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002263 }
2264 }
2265
2266 } while (block && !dirty);
2267
2268 if (block) {
2269 /*
2270 * As soon as we start servicing pages out of order, then we have
2271 * to kill the bulk stage, since the bulk stage assumes
2272 * in (migration_bitmap_find_and_reset_dirty) that every page is
2273 * dirty, that's no longer true.
2274 */
Juan Quintela6f37bb82017-03-13 19:26:29 +01002275 rs->ram_bulk_stage = false;
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002276
2277 /*
2278 * We want the background search to continue from the queued page
2279 * since the guest is likely to want other pages near to the page
2280 * it just requested.
2281 */
2282 pss->block = block;
Juan Quintelaa935e302017-03-21 15:36:51 +01002283 pss->page = offset >> TARGET_PAGE_BITS;
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002284 }
2285
2286 return !!block;
2287}
2288
Juan Quintela56e93d22015-05-07 19:33:31 +02002289/**
Juan Quintela5e58f962017-04-03 22:06:54 +02002290 * migration_page_queue_free: drop any remaining pages in the ram
2291 * request queue
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002292 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01002293 * It should be empty at the end anyway, but in error cases there may
2294 * be some left. In case any page is left, we drop it.
2295 *
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002296 */
Juan Quintela83c13382017-05-04 11:45:01 +02002297static void migration_page_queue_free(RAMState *rs)
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002298{
Juan Quintelaec481c62017-03-20 22:12:40 +01002299 struct RAMSrcPageRequest *mspr, *next_mspr;
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002300 /* This queue generally should be empty - but in the case of a failed
2301 * migration it might have some droppings left in it.
2302 */
2303 rcu_read_lock();
Juan Quintelaec481c62017-03-20 22:12:40 +01002304 QSIMPLEQ_FOREACH_SAFE(mspr, &rs->src_page_requests, next_req, next_mspr) {
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002305 memory_region_unref(mspr->rb->mr);
Juan Quintelaec481c62017-03-20 22:12:40 +01002306 QSIMPLEQ_REMOVE_HEAD(&rs->src_page_requests, next_req);
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002307 g_free(mspr);
2308 }
2309 rcu_read_unlock();
2310}
2311
2312/**
Juan Quintela3d0684b2017-03-23 15:06:39 +01002313 * ram_save_queue_pages: queue the page for transmission
2314 *
2315 * A request from postcopy destination for example.
2316 *
2317 * Returns zero on success or negative on error
2318 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01002319 * @rbname: Name of the RAMBlock of the request. NULL means the
2320 * same as the last one.
2321 * @start: starting address from the start of the RAMBlock
2322 * @len: length (in bytes) to send
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002323 */
Juan Quintela96506892017-03-14 18:41:03 +01002324int ram_save_queue_pages(const char *rbname, ram_addr_t start, ram_addr_t len)
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002325{
2326 RAMBlock *ramblock;
Juan Quintela53518d92017-05-04 11:46:24 +02002327 RAMState *rs = ram_state;
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002328
Juan Quintela93604472017-06-06 19:49:03 +02002329 ram_counters.postcopy_requests++;
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002330 rcu_read_lock();
2331 if (!rbname) {
2332 /* Reuse last RAMBlock */
Juan Quintela68a098f2017-03-14 13:48:42 +01002333 ramblock = rs->last_req_rb;
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002334
2335 if (!ramblock) {
2336 /*
2337 * Shouldn't happen, we can't reuse the last RAMBlock if
2338 * it's the 1st request.
2339 */
2340 error_report("ram_save_queue_pages no previous block");
2341 goto err;
2342 }
2343 } else {
2344 ramblock = qemu_ram_block_by_name(rbname);
2345
2346 if (!ramblock) {
2347 /* We shouldn't be asked for a non-existent RAMBlock */
2348 error_report("ram_save_queue_pages no block '%s'", rbname);
2349 goto err;
2350 }
Juan Quintela68a098f2017-03-14 13:48:42 +01002351 rs->last_req_rb = ramblock;
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002352 }
2353 trace_ram_save_queue_pages(ramblock->idstr, start, len);
2354 if (start+len > ramblock->used_length) {
Juan Quintela9458ad62015-11-10 17:42:05 +01002355 error_report("%s request overrun start=" RAM_ADDR_FMT " len="
2356 RAM_ADDR_FMT " blocklen=" RAM_ADDR_FMT,
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002357 __func__, start, len, ramblock->used_length);
2358 goto err;
2359 }
2360
Juan Quintelaec481c62017-03-20 22:12:40 +01002361 struct RAMSrcPageRequest *new_entry =
2362 g_malloc0(sizeof(struct RAMSrcPageRequest));
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002363 new_entry->rb = ramblock;
2364 new_entry->offset = start;
2365 new_entry->len = len;
2366
2367 memory_region_ref(ramblock->mr);
Juan Quintelaec481c62017-03-20 22:12:40 +01002368 qemu_mutex_lock(&rs->src_page_req_mutex);
2369 QSIMPLEQ_INSERT_TAIL(&rs->src_page_requests, new_entry, next_req);
Dr. David Alan Gilberte03a34f2018-06-13 11:26:42 +01002370 migration_make_urgent_request();
Juan Quintelaec481c62017-03-20 22:12:40 +01002371 qemu_mutex_unlock(&rs->src_page_req_mutex);
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002372 rcu_read_unlock();
2373
2374 return 0;
2375
2376err:
2377 rcu_read_unlock();
2378 return -1;
2379}
2380
Xiao Guangrongd7400a32018-03-30 15:51:26 +08002381static bool save_page_use_compression(RAMState *rs)
2382{
2383 if (!migrate_use_compression()) {
2384 return false;
2385 }
2386
2387 /*
2388 * If xbzrle is on, stop using the data compression after first
2389 * round of migration even if compression is enabled. In theory,
2390 * xbzrle can do better than compression.
2391 */
2392 if (rs->ram_bulk_stage || !migrate_use_xbzrle()) {
2393 return true;
2394 }
2395
2396 return false;
2397}
2398
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002399/*
2400 * try to compress the page before posting it out, return true if the page
2401 * has been properly handled by compression, otherwise needs other
2402 * paths to handle it
2403 */
2404static bool save_compress_page(RAMState *rs, RAMBlock *block, ram_addr_t offset)
2405{
2406 if (!save_page_use_compression(rs)) {
2407 return false;
2408 }
2409
2410 /*
2411 * When starting the process of a new block, the first page of
2412 * the block should be sent out before other pages in the same
2413 * block, and all the pages in the last block should have been sent
2414 * out. Keeping this order is important, because the 'cont' flag
2415 * is used to avoid resending the block name.
2416 *
2417 * We post the first page as a normal page because compression takes
2418 * a lot of CPU resources.
2419 */
2420 if (block != rs->last_sent_block) {
2421 flush_compressed_data(rs);
2422 return false;
2423 }
2424
2425 if (compress_page_with_multi_thread(rs, block, offset) > 0) {
2426 return true;
2427 }
2428
Xiao Guangrong76e03002018-09-06 15:01:00 +08002429 compression_counters.busy++;
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002430 return false;
2431}
2432
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002433/**
Juan Quintela3d0684b2017-03-23 15:06:39 +01002434 * ram_save_target_page: save one target page
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002435 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01002436 * Returns the number of pages written
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002437 *
Juan Quintela6f37bb82017-03-13 19:26:29 +01002438 * @rs: current RAM state
Juan Quintela3d0684b2017-03-23 15:06:39 +01002439 * @pss: data about the page we want to send
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002440 * @last_stage: if we are at the completion stage
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002441 */
Juan Quintelaa0a8aa12017-03-20 22:29:07 +01002442static int ram_save_target_page(RAMState *rs, PageSearchStatus *pss,
Juan Quintelaf20e2862017-03-21 16:19:05 +01002443 bool last_stage)
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002444{
Xiao Guangronga8ec91f2018-03-30 15:51:25 +08002445 RAMBlock *block = pss->block;
2446 ram_addr_t offset = pss->page << TARGET_PAGE_BITS;
2447 int res;
2448
2449 if (control_save_page(rs, block, offset, &res)) {
2450 return res;
2451 }
2452
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002453 if (save_compress_page(rs, block, offset)) {
2454 return 1;
Xiao Guangrongd7400a32018-03-30 15:51:26 +08002455 }
2456
2457 res = save_zero_page(rs, block, offset);
2458 if (res > 0) {
2459 /* Must let xbzrle know, otherwise a previous (now 0'd) cached
2460 * page would be stale
2461 */
2462 if (!save_page_use_compression(rs)) {
2463 XBZRLE_cache_lock();
2464 xbzrle_cache_zero_page(rs, block->offset + offset);
2465 XBZRLE_cache_unlock();
2466 }
2467 ram_release_pages(block->idstr, offset, res);
2468 return res;
2469 }
2470
Xiao Guangrongda3f56c2018-03-30 15:51:28 +08002471 /*
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002472 * do not use multifd for compression as the first page in the new
2473 * block should be posted out before sending the compressed page
Xiao Guangrongda3f56c2018-03-30 15:51:28 +08002474 */
Xiao Guangrong5e5fdcf2018-08-21 16:10:24 +08002475 if (!save_page_use_compression(rs) && migrate_use_multifd()) {
Juan Quintelab9ee2f72016-01-15 11:40:13 +01002476 return ram_save_multifd_page(rs, block, offset);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002477 }
2478
Xiao Guangrong1faa5662018-03-30 15:51:24 +08002479 return ram_save_page(rs, pss, last_stage);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002480}
2481
2482/**
Juan Quintela3d0684b2017-03-23 15:06:39 +01002483 * ram_save_host_page: save a whole host page
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002484 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01002485 * Starting at @pss->page, send pages up to the end of the current host
2486 * page. It's valid for the initial offset to point into the middle of
2487 * a host page in which case the remainder of the hostpage is sent.
2488 * Only dirty target pages are sent. Note that the host page size may
2489 * be a huge page for this block.
Dr. David Alan Gilbert1eb3fc02017-05-17 17:58:09 +01002490 * The saving stops at the boundary of the used_length of the block
2491 * if the RAMBlock isn't a multiple of the host page size.
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002492 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01002493 * Returns the number of pages written or negative on error
2494 *
Juan Quintela6f37bb82017-03-13 19:26:29 +01002495 * @rs: current RAM state
Juan Quintela3d0684b2017-03-23 15:06:39 +01002497 * @pss: data about the page we want to send
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002498 * @last_stage: if we are at the completion stage
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002499 */
Juan Quintelaa0a8aa12017-03-20 22:29:07 +01002500static int ram_save_host_page(RAMState *rs, PageSearchStatus *pss,
Juan Quintelaf20e2862017-03-21 16:19:05 +01002501 bool last_stage)
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002502{
2503 int tmppages, pages = 0;
Juan Quintelaa935e302017-03-21 15:36:51 +01002504 size_t pagesize_bits =
2505 qemu_ram_pagesize(pss->block) >> TARGET_PAGE_BITS;
Dr. David Alan Gilbert4c011c32017-02-24 18:28:39 +00002506
Yury Kotovfbd162e2019-02-15 20:45:46 +03002507 if (ramblock_is_ignored(pss->block)) {
Cédric Le Goaterb895de52018-05-14 08:57:00 +02002508 error_report("block %s should not be migrated !", pss->block->idstr);
2509 return 0;
2510 }
2511
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002512 do {
Xiao Guangrong1faa5662018-03-30 15:51:24 +08002513        /* Check if the page is dirty and, if it is, send it */
2514 if (!migration_bitmap_clear_dirty(rs, pss->block, pss->page)) {
2515 pss->page++;
2516 continue;
2517 }
2518
Juan Quintelaf20e2862017-03-21 16:19:05 +01002519 tmppages = ram_save_target_page(rs, pss, last_stage);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002520 if (tmppages < 0) {
2521 return tmppages;
2522 }
2523
2524 pages += tmppages;
Xiao Guangrong1faa5662018-03-30 15:51:24 +08002525 if (pss->block->unsentmap) {
2526 clear_bit(pss->page, pss->block->unsentmap);
2527 }
2528
Juan Quintelaa935e302017-03-21 15:36:51 +01002529 pss->page++;
Dr. David Alan Gilbert1eb3fc02017-05-17 17:58:09 +01002530 } while ((pss->page & (pagesize_bits - 1)) &&
2531 offset_in_ramblock(pss->block, pss->page << TARGET_PAGE_BITS));
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002532
2533 /* The offset we leave with is the last one we looked at */
Juan Quintelaa935e302017-03-21 15:36:51 +01002534 pss->page--;
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002535 return pages;
2536}
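/*
 * Worked example for ram_save_host_page() (illustrative, assuming 2 MiB
 * host pages and 4 KiB target pages, so pagesize_bits == 512): if the
 * search enters with pss->page == 1234, the loop sends every dirty target
 * page from 1234 up to 1535 (the last target page of that host page),
 * stops once pss->page reaches 1536, and then backs up by one so the
 * caller resumes from the last page looked at.
 */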
Dr. David Alan Gilbert6c595cd2015-11-05 18:11:08 +00002537
2538/**
Juan Quintela3d0684b2017-03-23 15:06:39 +01002539 * ram_find_and_save_block: finds a dirty page and sends it to f
Juan Quintela56e93d22015-05-07 19:33:31 +02002540 *
2541 * Called within an RCU critical section.
2542 *
Xiao Guangronge8f37352018-09-03 17:26:44 +08002543 * Returns the number of pages written where zero means no dirty pages,
2544 * or negative on error
Juan Quintela56e93d22015-05-07 19:33:31 +02002545 *
Juan Quintela6f37bb82017-03-13 19:26:29 +01002546 * @rs: current RAM state
Juan Quintela56e93d22015-05-07 19:33:31 +02002547 * @last_stage: if we are at the completion stage
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002548 *
2549 * On systems where host-page-size > target-page-size it will send all the
2550 * pages in a host page that are dirty.
Juan Quintela56e93d22015-05-07 19:33:31 +02002551 */
2552
Juan Quintelace25d332017-03-15 11:00:51 +01002553static int ram_find_and_save_block(RAMState *rs, bool last_stage)
Juan Quintela56e93d22015-05-07 19:33:31 +02002554{
Dr. David Alan Gilbertb8fb8cb2015-09-23 15:27:10 +01002555 PageSearchStatus pss;
Juan Quintela56e93d22015-05-07 19:33:31 +02002556 int pages = 0;
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002557 bool again, found;
Juan Quintela56e93d22015-05-07 19:33:31 +02002558
Ashijeet Acharya0827b9e2017-02-08 19:58:45 +05302559 /* No dirty page as there is zero RAM */
2560 if (!ram_bytes_total()) {
2561 return pages;
2562 }
2563
Juan Quintela6f37bb82017-03-13 19:26:29 +01002564 pss.block = rs->last_seen_block;
Juan Quintelaa935e302017-03-21 15:36:51 +01002565 pss.page = rs->last_page;
Dr. David Alan Gilbertb8fb8cb2015-09-23 15:27:10 +01002566 pss.complete_round = false;
2567
2568 if (!pss.block) {
2569 pss.block = QLIST_FIRST_RCU(&ram_list.blocks);
2570 }
Juan Quintela56e93d22015-05-07 19:33:31 +02002571
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002572 do {
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002573 again = true;
Juan Quintelaf20e2862017-03-21 16:19:05 +01002574 found = get_queued_page(rs, &pss);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002575
2576 if (!found) {
2577 /* priority queue empty, so just search for something dirty */
Juan Quintelaf20e2862017-03-21 16:19:05 +01002578 found = find_dirty_block(rs, &pss, &again);
Dr. David Alan Gilberta82d5932015-11-05 18:11:09 +00002579 }
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002580
2581 if (found) {
Juan Quintelaf20e2862017-03-21 16:19:05 +01002582 pages = ram_save_host_page(rs, &pss, last_stage);
Juan Quintela56e93d22015-05-07 19:33:31 +02002583 }
Dr. David Alan Gilbertb9e60922015-09-23 15:27:11 +01002584 } while (!pages && again);
Juan Quintela56e93d22015-05-07 19:33:31 +02002585
Juan Quintela6f37bb82017-03-13 19:26:29 +01002586 rs->last_seen_block = pss.block;
Juan Quintelaa935e302017-03-21 15:36:51 +01002587 rs->last_page = pss.page;
Juan Quintela56e93d22015-05-07 19:33:31 +02002588
2589 return pages;
2590}
2591
2592void acct_update_position(QEMUFile *f, size_t size, bool zero)
2593{
2594 uint64_t pages = size / TARGET_PAGE_SIZE;
Juan Quintelaf7ccd612017-03-13 20:30:21 +01002595
Juan Quintela56e93d22015-05-07 19:33:31 +02002596 if (zero) {
Juan Quintela93604472017-06-06 19:49:03 +02002597 ram_counters.duplicate += pages;
Juan Quintela56e93d22015-05-07 19:33:31 +02002598 } else {
Juan Quintela93604472017-06-06 19:49:03 +02002599 ram_counters.normal += pages;
2600 ram_counters.transferred += size;
Juan Quintela56e93d22015-05-07 19:33:31 +02002601 qemu_update_position(f, size);
2602 }
2603}
2604
Yury Kotovfbd162e2019-02-15 20:45:46 +03002605static uint64_t ram_bytes_total_common(bool count_ignored)
Juan Quintela56e93d22015-05-07 19:33:31 +02002606{
2607 RAMBlock *block;
2608 uint64_t total = 0;
2609
2610 rcu_read_lock();
Yury Kotovfbd162e2019-02-15 20:45:46 +03002611 if (count_ignored) {
2612 RAMBLOCK_FOREACH_MIGRATABLE(block) {
2613 total += block->used_length;
2614 }
2615 } else {
2616 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
2617 total += block->used_length;
2618 }
Peter Xu99e15582017-05-12 12:17:39 +08002619 }
Juan Quintela56e93d22015-05-07 19:33:31 +02002620 rcu_read_unlock();
2621 return total;
2622}
2623
Yury Kotovfbd162e2019-02-15 20:45:46 +03002624uint64_t ram_bytes_total(void)
2625{
2626 return ram_bytes_total_common(false);
2627}
2628
Juan Quintelaf265e0e2017-06-28 11:52:27 +02002629static void xbzrle_load_setup(void)
Juan Quintela56e93d22015-05-07 19:33:31 +02002630{
Juan Quintelaf265e0e2017-06-28 11:52:27 +02002631 XBZRLE.decoded_buf = g_malloc(TARGET_PAGE_SIZE);
Juan Quintela56e93d22015-05-07 19:33:31 +02002632}
2633
Juan Quintelaf265e0e2017-06-28 11:52:27 +02002634static void xbzrle_load_cleanup(void)
2635{
2636 g_free(XBZRLE.decoded_buf);
2637 XBZRLE.decoded_buf = NULL;
2638}
2639
Peter Xu7d7c96b2017-10-19 14:31:58 +08002640static void ram_state_cleanup(RAMState **rsp)
2641{
Dr. David Alan Gilbertb9ccaf62018-02-12 16:03:39 +00002642 if (*rsp) {
2643 migration_page_queue_free(*rsp);
2644 qemu_mutex_destroy(&(*rsp)->bitmap_mutex);
2645 qemu_mutex_destroy(&(*rsp)->src_page_req_mutex);
2646 g_free(*rsp);
2647 *rsp = NULL;
2648 }
Peter Xu7d7c96b2017-10-19 14:31:58 +08002649}
2650
Peter Xu84593a02017-10-19 14:31:59 +08002651static void xbzrle_cleanup(void)
2652{
2653 XBZRLE_cache_lock();
2654 if (XBZRLE.cache) {
2655 cache_fini(XBZRLE.cache);
2656 g_free(XBZRLE.encoded_buf);
2657 g_free(XBZRLE.current_buf);
2658 g_free(XBZRLE.zero_target_page);
2659 XBZRLE.cache = NULL;
2660 XBZRLE.encoded_buf = NULL;
2661 XBZRLE.current_buf = NULL;
2662 XBZRLE.zero_target_page = NULL;
2663 }
2664 XBZRLE_cache_unlock();
2665}
2666
Juan Quintelaf265e0e2017-06-28 11:52:27 +02002667static void ram_save_cleanup(void *opaque)
Juan Quintela56e93d22015-05-07 19:33:31 +02002668{
Juan Quintela53518d92017-05-04 11:46:24 +02002669 RAMState **rsp = opaque;
Juan Quintela6b6712e2017-03-22 15:18:04 +01002670 RAMBlock *block;
Juan Quintelaeb859c52017-03-13 21:51:55 +01002671
Li Zhijian2ff64032015-07-02 20:18:05 +08002672    /* the caller holds the iothread lock or is in a bh, so there is
Yi Wang46334562019-04-15 14:51:29 +08002673 * no writing race against the migration bitmap
Li Zhijian2ff64032015-07-02 20:18:05 +08002674 */
Juan Quintela6b6712e2017-03-22 15:18:04 +01002675 memory_global_dirty_log_stop();
2676
Yury Kotovfbd162e2019-02-15 20:45:46 +03002677 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Juan Quintela6b6712e2017-03-22 15:18:04 +01002678 g_free(block->bmap);
2679 block->bmap = NULL;
2680 g_free(block->unsentmap);
2681 block->unsentmap = NULL;
Juan Quintela56e93d22015-05-07 19:33:31 +02002682 }
2683
Peter Xu84593a02017-10-19 14:31:59 +08002684 xbzrle_cleanup();
Juan Quintelaf0afa332017-06-28 11:52:28 +02002685 compress_threads_save_cleanup();
Peter Xu7d7c96b2017-10-19 14:31:58 +08002686 ram_state_cleanup(rsp);
Juan Quintela56e93d22015-05-07 19:33:31 +02002687}
2688
Juan Quintela6f37bb82017-03-13 19:26:29 +01002689static void ram_state_reset(RAMState *rs)
Juan Quintela56e93d22015-05-07 19:33:31 +02002690{
Juan Quintela6f37bb82017-03-13 19:26:29 +01002691 rs->last_seen_block = NULL;
2692 rs->last_sent_block = NULL;
Juan Quintela269ace22017-03-21 15:23:31 +01002693 rs->last_page = 0;
Juan Quintela6f37bb82017-03-13 19:26:29 +01002694 rs->last_version = ram_list.version;
2695 rs->ram_bulk_stage = true;
Wei Wang6eeb63f2018-12-11 16:24:52 +08002696 rs->fpo_enabled = false;
Juan Quintela56e93d22015-05-07 19:33:31 +02002697}
2698
2699#define MAX_WAIT 50 /* ms, half buffered_file limit */
2700
Dr. David Alan Gilbert4f2e4252015-11-05 18:10:38 +00002701/*
2702 * 'expected' is the value you expect the bitmap mostly to be full
2703 * of; it won't bother printing lines that are all this value.
 2704 * 'todump' is the bitmap to dump and 'pages' is its length in bits.
2705 */
Juan Quintela6b6712e2017-03-22 15:18:04 +01002706void ram_debug_dump_bitmap(unsigned long *todump, bool expected,
2707 unsigned long pages)
Dr. David Alan Gilbert4f2e4252015-11-05 18:10:38 +00002708{
Dr. David Alan Gilbert4f2e4252015-11-05 18:10:38 +00002709 int64_t cur;
2710 int64_t linelen = 128;
2711 char linebuf[129];
2712
Juan Quintela6b6712e2017-03-22 15:18:04 +01002713 for (cur = 0; cur < pages; cur += linelen) {
Dr. David Alan Gilbert4f2e4252015-11-05 18:10:38 +00002714 int64_t curb;
2715 bool found = false;
2716 /*
2717 * Last line; catch the case where the line length
2718 * is longer than remaining ram
2719 */
Juan Quintela6b6712e2017-03-22 15:18:04 +01002720 if (cur + linelen > pages) {
2721 linelen = pages - cur;
Dr. David Alan Gilbert4f2e4252015-11-05 18:10:38 +00002722 }
2723 for (curb = 0; curb < linelen; curb++) {
2724 bool thisbit = test_bit(cur + curb, todump);
2725 linebuf[curb] = thisbit ? '1' : '.';
2726 found = found || (thisbit != expected);
2727 }
2728 if (found) {
2729 linebuf[curb] = '\0';
2730 fprintf(stderr, "0x%08" PRIx64 " : %s\n", cur, linebuf);
2731 }
2732 }
2733}
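/*
 * Example of the output produced above (illustrative): each line covers up
 * to 128 pages and is printed only when it contains a bit differing from
 * 'expected', e.g.
 *   0x00000080 : ........11111111................
 * where '1' is a set bit and '.' a clear one.
 */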
2734
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002735/* **** functions for postcopy ***** */
2736
Pavel Butsykinced1c612017-02-03 18:23:21 +03002737void ram_postcopy_migrated_memory_release(MigrationState *ms)
2738{
2739 struct RAMBlock *block;
Pavel Butsykinced1c612017-02-03 18:23:21 +03002740
Yury Kotovfbd162e2019-02-15 20:45:46 +03002741 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Juan Quintela6b6712e2017-03-22 15:18:04 +01002742 unsigned long *bitmap = block->bmap;
2743 unsigned long range = block->used_length >> TARGET_PAGE_BITS;
2744 unsigned long run_start = find_next_zero_bit(bitmap, range, 0);
Pavel Butsykinced1c612017-02-03 18:23:21 +03002745
2746 while (run_start < range) {
2747 unsigned long run_end = find_next_bit(bitmap, range, run_start + 1);
Juan Quintelaaaa20642017-03-21 11:35:24 +01002748 ram_discard_range(block->idstr, run_start << TARGET_PAGE_BITS,
Pavel Butsykinced1c612017-02-03 18:23:21 +03002749 (run_end - run_start) << TARGET_PAGE_BITS);
2750 run_start = find_next_zero_bit(bitmap, range, run_end + 1);
2751 }
2752 }
2753}
2754
Juan Quintela3d0684b2017-03-23 15:06:39 +01002755/**
2756 * postcopy_send_discard_bm_ram: discard a RAMBlock
2757 *
2758 * Returns zero on success
2759 *
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002760 * Callback from postcopy_each_ram_send_discard for each RAMBlock
2761 * Note: At this point the 'unsentmap' is the processed bitmap combined
2762 * with the dirtymap; so a '1' means it's either dirty or unsent.
Juan Quintela3d0684b2017-03-23 15:06:39 +01002763 *
2764 * @ms: current migration state
2765 * @pds: state for postcopy
 2766 * @block: RAMBlock being discarded
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002768 */
2769static int postcopy_send_discard_bm_ram(MigrationState *ms,
2770 PostcopyDiscardState *pds,
Juan Quintela6b6712e2017-03-22 15:18:04 +01002771 RAMBlock *block)
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002772{
Juan Quintela6b6712e2017-03-22 15:18:04 +01002773 unsigned long end = block->used_length >> TARGET_PAGE_BITS;
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002774 unsigned long current;
Juan Quintela6b6712e2017-03-22 15:18:04 +01002775 unsigned long *unsentmap = block->unsentmap;
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002776
Juan Quintela6b6712e2017-03-22 15:18:04 +01002777 for (current = 0; current < end; ) {
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002778 unsigned long one = find_next_bit(unsentmap, end, current);
2779
2780 if (one <= end) {
2781 unsigned long zero = find_next_zero_bit(unsentmap, end, one + 1);
2782 unsigned long discard_length;
2783
2784 if (zero >= end) {
2785 discard_length = end - one;
2786 } else {
2787 discard_length = zero - one;
2788 }
Dr. David Alan Gilbertd688c622016-06-13 12:16:40 +01002789 if (discard_length) {
2790 postcopy_discard_send_range(ms, pds, one, discard_length);
2791 }
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002792 current = one + discard_length;
2793 } else {
2794 current = one;
2795 }
2796 }
2797
2798 return 0;
2799}
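/*
 * Worked example for postcopy_send_discard_bm_ram() (illustrative): for a
 * block of 8 target pages whose unsentmap bits are 1 1 0 0 1 1 1 0, the
 * loop above emits two discard ranges: (start 0, length 2) and
 * (start 4, length 3).
 */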
2800
Juan Quintela3d0684b2017-03-23 15:06:39 +01002801/**
2802 * postcopy_each_ram_send_discard: discard all RAMBlocks
2803 *
2804 * Returns 0 for success or negative for error
2805 *
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002806 * Utility for the outgoing postcopy code.
2807 * Calls postcopy_send_discard_bm_ram for each RAMBlock
2808 * passing it bitmap indexes and name.
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002809 * (qemu_ram_foreach_block ends up passing unscaled lengths
2810 * which would mean postcopy code would have to deal with target page)
Juan Quintela3d0684b2017-03-23 15:06:39 +01002811 *
2812 * @ms: current migration state
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002813 */
2814static int postcopy_each_ram_send_discard(MigrationState *ms)
2815{
2816 struct RAMBlock *block;
2817 int ret;
2818
Yury Kotovfbd162e2019-02-15 20:45:46 +03002819 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Juan Quintela6b6712e2017-03-22 15:18:04 +01002820 PostcopyDiscardState *pds =
2821 postcopy_discard_send_init(ms, block->idstr);
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002822
2823 /*
2824 * Postcopy sends chunks of bitmap over the wire, but it
 2825 * just needs indexes at this point, which avoids it having
2826 * target page specific code.
2827 */
Juan Quintela6b6712e2017-03-22 15:18:04 +01002828 ret = postcopy_send_discard_bm_ram(ms, pds, block);
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00002829 postcopy_discard_send_finish(ms, pds);
2830 if (ret) {
2831 return ret;
2832 }
2833 }
2834
2835 return 0;
2836}
2837
Juan Quintela3d0684b2017-03-23 15:06:39 +01002838/**
 2839 * postcopy_chunk_hostpages_pass: canonicalize bitmap in hostpages
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002840 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01002841 * Helper for postcopy_chunk_hostpages; it's called twice to
2842 * canonicalize the two bitmaps, that are similar, but one is
2843 * inverted.
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002844 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01002845 * Postcopy requires that all target pages in a hostpage are dirty or
2846 * clean, not a mix. This function canonicalizes the bitmaps.
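 *
 * Worked example (illustrative): with 2 MiB host pages and 4 KiB target
 * pages, host_ratio is 512. A dirty run starting at target page 1000 is
 * 1000 % 512 = 488 pages into its host page, so the whole host page
 * (target pages 512..1023) is treated as a unit: it is discarded on the
 * destination if any of it had been sent, and re-marked dirty/unsent on
 * the source.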
2847 *
2848 * @ms: current migration state
2849 * @unsent_pass: if true we need to canonicalize partially unsent host pages
2850 * otherwise we need to canonicalize partially dirty host pages
2851 * @block: block that contains the page we want to canonicalize
2852 * @pds: state for postcopy
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002853 */
2854static void postcopy_chunk_hostpages_pass(MigrationState *ms, bool unsent_pass,
2855 RAMBlock *block,
2856 PostcopyDiscardState *pds)
2857{
Juan Quintela53518d92017-05-04 11:46:24 +02002858 RAMState *rs = ram_state;
Juan Quintela6b6712e2017-03-22 15:18:04 +01002859 unsigned long *bitmap = block->bmap;
2860 unsigned long *unsentmap = block->unsentmap;
Dr. David Alan Gilbert29c59172017-02-24 18:28:31 +00002861 unsigned int host_ratio = block->page_size / TARGET_PAGE_SIZE;
Juan Quintela6b6712e2017-03-22 15:18:04 +01002862 unsigned long pages = block->used_length >> TARGET_PAGE_BITS;
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002863 unsigned long run_start;
2864
Dr. David Alan Gilbert29c59172017-02-24 18:28:31 +00002865 if (block->page_size == TARGET_PAGE_SIZE) {
2866 /* Easy case - TPS==HPS for a non-huge page RAMBlock */
2867 return;
2868 }
2869
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002870 if (unsent_pass) {
2871 /* Find a sent page */
Juan Quintela6b6712e2017-03-22 15:18:04 +01002872 run_start = find_next_zero_bit(unsentmap, pages, 0);
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002873 } else {
2874 /* Find a dirty page */
Juan Quintela6b6712e2017-03-22 15:18:04 +01002875 run_start = find_next_bit(bitmap, pages, 0);
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002876 }
2877
Juan Quintela6b6712e2017-03-22 15:18:04 +01002878 while (run_start < pages) {
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002879 bool do_fixup = false;
2880 unsigned long fixup_start_addr;
2881 unsigned long host_offset;
2882
2883 /*
2884 * If the start of this run of pages is in the middle of a host
2885 * page, then we need to fixup this host page.
2886 */
2887 host_offset = run_start % host_ratio;
2888 if (host_offset) {
2889 do_fixup = true;
2890 run_start -= host_offset;
2891 fixup_start_addr = run_start;
2892 /* For the next pass */
2893 run_start = run_start + host_ratio;
2894 } else {
2895 /* Find the end of this run */
2896 unsigned long run_end;
2897 if (unsent_pass) {
Juan Quintela6b6712e2017-03-22 15:18:04 +01002898 run_end = find_next_bit(unsentmap, pages, run_start + 1);
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002899 } else {
Juan Quintela6b6712e2017-03-22 15:18:04 +01002900 run_end = find_next_zero_bit(bitmap, pages, run_start + 1);
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002901 }
2902 /*
2903 * If the end isn't at the start of a host page, then the
2904 * run doesn't finish at the end of a host page
2905 * and we need to discard.
2906 */
2907 host_offset = run_end % host_ratio;
2908 if (host_offset) {
2909 do_fixup = true;
2910 fixup_start_addr = run_end - host_offset;
2911 /*
2912 * This host page has gone, the next loop iteration starts
2913 * from after the fixup
2914 */
2915 run_start = fixup_start_addr + host_ratio;
2916 } else {
2917 /*
2918 * No discards on this iteration, next loop starts from
2919 * next sent/dirty page
2920 */
2921 run_start = run_end + 1;
2922 }
2923 }
2924
2925 if (do_fixup) {
2926 unsigned long page;
2927
2928 /* Tell the destination to discard this page */
2929 if (unsent_pass || !test_bit(fixup_start_addr, unsentmap)) {
2930 /* For the unsent_pass we:
2931 * discard partially sent pages
2932 * For the !unsent_pass (dirty) we:
2933 * discard partially dirty pages that were sent
2934 * (any partially sent pages were already discarded
2935 * by the previous unsent_pass)
2936 */
2937 postcopy_discard_send_range(ms, pds, fixup_start_addr,
2938 host_ratio);
2939 }
2940
2941 /* Clean up the bitmap */
2942 for (page = fixup_start_addr;
2943 page < fixup_start_addr + host_ratio; page++) {
2944 /* All pages in this host page are now not sent */
2945 set_bit(page, unsentmap);
2946
2947 /*
2948 * Remark them as dirty, updating the count for any pages
2949 * that weren't previously dirty.
2950 */
Juan Quintela0d8ec882017-03-13 21:21:41 +01002951 rs->migration_dirty_pages += !test_and_set_bit(page, bitmap);
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002952 }
2953 }
2954
2955 if (unsent_pass) {
2956 /* Find the next sent page for the next iteration */
Juan Quintela6b6712e2017-03-22 15:18:04 +01002957 run_start = find_next_zero_bit(unsentmap, pages, run_start);
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002958 } else {
2959 /* Find the next dirty page for the next iteration */
Juan Quintela6b6712e2017-03-22 15:18:04 +01002960 run_start = find_next_bit(bitmap, pages, run_start);
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002961 }
2962 }
2963}
2964
Juan Quintela3d0684b2017-03-23 15:06:39 +01002965/**
 2966 * postcopy_chunk_hostpages: discard any partially sent host page
2967 *
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002968 * Utility for the outgoing postcopy code.
2969 *
2970 * Discard any partially sent host-page size chunks, mark any partially
Dr. David Alan Gilbert29c59172017-02-24 18:28:31 +00002971 * dirty host-page size chunks as all dirty. In this case the host-page
2972 * is the host-page for the particular RAMBlock, i.e. it might be a huge page
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002973 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01002974 * Returns zero on success
2975 *
2976 * @ms: current migration state
Juan Quintela6b6712e2017-03-22 15:18:04 +01002977 * @block: block we want to work with
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002978 */
Juan Quintela6b6712e2017-03-22 15:18:04 +01002979static int postcopy_chunk_hostpages(MigrationState *ms, RAMBlock *block)
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002980{
Juan Quintela6b6712e2017-03-22 15:18:04 +01002981 PostcopyDiscardState *pds =
2982 postcopy_discard_send_init(ms, block->idstr);
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002983
Juan Quintela6b6712e2017-03-22 15:18:04 +01002984 /* First pass: Discard all partially sent host pages */
2985 postcopy_chunk_hostpages_pass(ms, true, block, pds);
2986 /*
2987 * Second pass: Ensure that all partially dirty host pages are made
2988 * fully dirty.
2989 */
2990 postcopy_chunk_hostpages_pass(ms, false, block, pds);
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002991
Juan Quintela6b6712e2017-03-22 15:18:04 +01002992 postcopy_discard_send_finish(ms, pds);
Dr. David Alan Gilbert99e314e2015-11-05 18:11:15 +00002993 return 0;
2994}
2995
Juan Quintela3d0684b2017-03-23 15:06:39 +01002996/**
2997 * ram_postcopy_send_discard_bitmap: transmit the discard bitmap
2998 *
2999 * Returns zero on success
3000 *
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003001 * Transmit the set of pages to be discarded after precopy to the target;
3002 * these are pages that:
3003 * a) Have been previously transmitted but are now dirty again
 3004 * b) Pages that have never been transmitted; this ensures that
3005 * any pages on the destination that have been mapped by background
3006 * tasks get discarded (transparent huge pages is the specific concern)
3007 * Hopefully this is pretty sparse
Juan Quintela3d0684b2017-03-23 15:06:39 +01003008 *
3009 * @ms: current migration state
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003010 */
3011int ram_postcopy_send_discard_bitmap(MigrationState *ms)
3012{
Juan Quintela53518d92017-05-04 11:46:24 +02003013 RAMState *rs = ram_state;
Juan Quintela6b6712e2017-03-22 15:18:04 +01003014 RAMBlock *block;
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003015 int ret;
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003016
3017 rcu_read_lock();
3018
3019 /* This should be our last sync, the src is now paused */
Juan Quintelaeb859c52017-03-13 21:51:55 +01003020 migration_bitmap_sync(rs);
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003021
Juan Quintela6b6712e2017-03-22 15:18:04 +01003022 /* Easiest way to make sure we don't resume in the middle of a host-page */
3023 rs->last_seen_block = NULL;
3024 rs->last_sent_block = NULL;
3025 rs->last_page = 0;
3026
Yury Kotovfbd162e2019-02-15 20:45:46 +03003027 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Juan Quintela6b6712e2017-03-22 15:18:04 +01003028 unsigned long pages = block->used_length >> TARGET_PAGE_BITS;
3029 unsigned long *bitmap = block->bmap;
3030 unsigned long *unsentmap = block->unsentmap;
3031
3032 if (!unsentmap) {
 3033 /* We don't have a safe way to resize the unsentmap, so
3034 * if the bitmap was resized it will be NULL at this
3035 * point.
3036 */
3037 error_report("migration ram resized during precopy phase");
3038 rcu_read_unlock();
3039 return -EINVAL;
3040 }
3041 /* Deal with TPS != HPS and huge pages */
3042 ret = postcopy_chunk_hostpages(ms, block);
3043 if (ret) {
3044 rcu_read_unlock();
3045 return ret;
3046 }
3047
3048 /*
3049 * Update the unsentmap to be unsentmap = unsentmap | dirty
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003050 */
Juan Quintela6b6712e2017-03-22 15:18:04 +01003051 bitmap_or(unsentmap, unsentmap, bitmap, pages);
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003052#ifdef DEBUG_POSTCOPY
Juan Quintela6b6712e2017-03-22 15:18:04 +01003053 ram_debug_dump_bitmap(unsentmap, true, pages);
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003054#endif
Juan Quintela6b6712e2017-03-22 15:18:04 +01003055 }
3056 trace_ram_postcopy_send_discard_bitmap();
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003057
3058 ret = postcopy_each_ram_send_discard(ms);
3059 rcu_read_unlock();
3060
3061 return ret;
3062}
3063
Juan Quintela3d0684b2017-03-23 15:06:39 +01003064/**
3065 * ram_discard_range: discard dirtied pages at the beginning of postcopy
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003066 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01003067 * Returns zero on success
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003068 *
Juan Quintela36449152017-03-23 15:11:59 +01003069 * @rbname: name of the RAMBlock of the request. NULL means the
 3070 * same as the last one.
Juan Quintela3d0684b2017-03-23 15:06:39 +01003071 * @start: byte offset within the RAMBlock
 3072 * @length: number of bytes to discard
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003073 */
Juan Quintelaaaa20642017-03-21 11:35:24 +01003074int ram_discard_range(const char *rbname, uint64_t start, size_t length)
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003075{
3076 int ret = -1;
3077
Juan Quintela36449152017-03-23 15:11:59 +01003078 trace_ram_discard_range(rbname, start, length);
Dr. David Alan Gilbertd3a50382017-02-24 18:28:32 +00003079
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003080 rcu_read_lock();
Juan Quintela36449152017-03-23 15:11:59 +01003081 RAMBlock *rb = qemu_ram_block_by_name(rbname);
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003082
3083 if (!rb) {
Juan Quintela36449152017-03-23 15:11:59 +01003084 error_report("ram_discard_range: Failed to find block '%s'", rbname);
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003085 goto err;
3086 }
3087
Peter Xu814bb082018-07-23 20:33:02 +08003088 /*
3089 * On source VM, we don't need to update the received bitmap since
3090 * we don't even have one.
3091 */
3092 if (rb->receivedmap) {
3093 bitmap_clear(rb->receivedmap, start >> qemu_target_page_bits(),
3094 length >> qemu_target_page_bits());
3095 }
3096
Dr. David Alan Gilbertd3a50382017-02-24 18:28:32 +00003097 ret = ram_block_discard_range(rb, start, length);
Dr. David Alan Gilberte0b266f2015-11-05 18:11:02 +00003098
3099err:
3100 rcu_read_unlock();
3101
3102 return ret;
3103}
3104
Peter Xu84593a02017-10-19 14:31:59 +08003105/*
3106 * For every allocation, we will try not to crash the VM if the
 3107 * allocation fails.
3108 */
3109static int xbzrle_init(void)
3110{
3111 Error *local_err = NULL;
3112
3113 if (!migrate_use_xbzrle()) {
3114 return 0;
3115 }
3116
3117 XBZRLE_cache_lock();
3118
3119 XBZRLE.zero_target_page = g_try_malloc0(TARGET_PAGE_SIZE);
3120 if (!XBZRLE.zero_target_page) {
3121 error_report("%s: Error allocating zero page", __func__);
3122 goto err_out;
3123 }
3124
3125 XBZRLE.cache = cache_init(migrate_xbzrle_cache_size(),
3126 TARGET_PAGE_SIZE, &local_err);
3127 if (!XBZRLE.cache) {
3128 error_report_err(local_err);
3129 goto free_zero_page;
3130 }
3131
3132 XBZRLE.encoded_buf = g_try_malloc0(TARGET_PAGE_SIZE);
3133 if (!XBZRLE.encoded_buf) {
3134 error_report("%s: Error allocating encoded_buf", __func__);
3135 goto free_cache;
3136 }
3137
3138 XBZRLE.current_buf = g_try_malloc(TARGET_PAGE_SIZE);
3139 if (!XBZRLE.current_buf) {
3140 error_report("%s: Error allocating current_buf", __func__);
3141 goto free_encoded_buf;
3142 }
3143
3144 /* We are all good */
3145 XBZRLE_cache_unlock();
3146 return 0;
3147
3148free_encoded_buf:
3149 g_free(XBZRLE.encoded_buf);
3150 XBZRLE.encoded_buf = NULL;
3151free_cache:
3152 cache_fini(XBZRLE.cache);
3153 XBZRLE.cache = NULL;
3154free_zero_page:
3155 g_free(XBZRLE.zero_target_page);
3156 XBZRLE.zero_target_page = NULL;
3157err_out:
3158 XBZRLE_cache_unlock();
3159 return -ENOMEM;
3160}
3161
Juan Quintela53518d92017-05-04 11:46:24 +02003162static int ram_state_init(RAMState **rsp)
Juan Quintela56e93d22015-05-07 19:33:31 +02003163{
Peter Xu7d00ee62017-10-19 14:31:57 +08003164 *rsp = g_try_new0(RAMState, 1);
3165
3166 if (!*rsp) {
3167 error_report("%s: Init ramstate fail", __func__);
3168 return -1;
3169 }
Juan Quintela53518d92017-05-04 11:46:24 +02003170
3171 qemu_mutex_init(&(*rsp)->bitmap_mutex);
3172 qemu_mutex_init(&(*rsp)->src_page_req_mutex);
3173 QSIMPLEQ_INIT(&(*rsp)->src_page_requests);
Juan Quintela56e93d22015-05-07 19:33:31 +02003174
Peter Xu7d00ee62017-10-19 14:31:57 +08003175 /*
Wei Yang03158512019-06-04 14:17:27 +08003176     * This must match the initial values of the dirty bitmap.
3177 * Currently we initialize the dirty bitmap to all zeros so
3178 * here the total dirty page count is zero.
Peter Xu7d00ee62017-10-19 14:31:57 +08003179 */
Wei Yang03158512019-06-04 14:17:27 +08003180 (*rsp)->migration_dirty_pages = 0;
Peter Xu7d00ee62017-10-19 14:31:57 +08003181 ram_state_reset(*rsp);
3182
3183 return 0;
3184}
3185
Peter Xud6eff5d2017-10-19 14:32:00 +08003186static void ram_list_init_bitmaps(void)
3187{
3188 RAMBlock *block;
3189 unsigned long pages;
3190
3191 /* Skip setting bitmap if there is no RAM */
3192 if (ram_bytes_total()) {
Yury Kotovfbd162e2019-02-15 20:45:46 +03003193 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Peter Xud6eff5d2017-10-19 14:32:00 +08003194 pages = block->max_length >> TARGET_PAGE_BITS;
Wei Yang03158512019-06-04 14:17:27 +08003195 /*
3196 * The initial dirty bitmap for migration must be set with all
3197 * ones to make sure we'll migrate every guest RAM page to
3198 * destination.
3199 * Here we didn't set RAMBlock.bmap simply because it is already
3200 * set in ram_list.dirty_memory[DIRTY_MEMORY_MIGRATION] in
3201 * ram_block_add, and that's where we'll sync the dirty bitmaps.
3202 * Here setting RAMBlock.bmap would be fine too but not necessary.
3203 */
Peter Xud6eff5d2017-10-19 14:32:00 +08003204 block->bmap = bitmap_new(pages);
Peter Xud6eff5d2017-10-19 14:32:00 +08003205 if (migrate_postcopy_ram()) {
3206 block->unsentmap = bitmap_new(pages);
3207 bitmap_set(block->unsentmap, 0, pages);
3208 }
3209 }
3210 }
3211}
3212
3213static void ram_init_bitmaps(RAMState *rs)
3214{
3215 /* For memory_global_dirty_log_start below. */
3216 qemu_mutex_lock_iothread();
3217 qemu_mutex_lock_ramlist();
3218 rcu_read_lock();
3219
3220 ram_list_init_bitmaps();
3221 memory_global_dirty_log_start();
Wei Wangbd227062018-12-11 16:24:51 +08003222 migration_bitmap_sync_precopy(rs);
Peter Xud6eff5d2017-10-19 14:32:00 +08003223
3224 rcu_read_unlock();
3225 qemu_mutex_unlock_ramlist();
3226 qemu_mutex_unlock_iothread();
3227}
3228
Peter Xu7d00ee62017-10-19 14:31:57 +08003229static int ram_init_all(RAMState **rsp)
3230{
Peter Xu7d00ee62017-10-19 14:31:57 +08003231 if (ram_state_init(rsp)) {
3232 return -1;
3233 }
3234
Peter Xu84593a02017-10-19 14:31:59 +08003235 if (xbzrle_init()) {
3236 ram_state_cleanup(rsp);
3237 return -1;
Juan Quintela56e93d22015-05-07 19:33:31 +02003238 }
3239
Peter Xud6eff5d2017-10-19 14:32:00 +08003240 ram_init_bitmaps(*rsp);
zhanghailianga91246c2016-10-27 14:42:59 +08003241
3242 return 0;
3243}
3244
Peter Xu08614f32018-05-02 18:47:33 +08003245static void ram_state_resume_prepare(RAMState *rs, QEMUFile *out)
3246{
3247 RAMBlock *block;
3248 uint64_t pages = 0;
3249
3250 /*
3251 * Postcopy is not using xbzrle/compression, so no need for that.
 3252 * Also, since the source is already halted, we don't need to care
 3253 * about dirty page logging either.
3254 */
3255
Yury Kotovfbd162e2019-02-15 20:45:46 +03003256 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Peter Xu08614f32018-05-02 18:47:33 +08003257 pages += bitmap_count_one(block->bmap,
3258 block->used_length >> TARGET_PAGE_BITS);
3259 }
3260
3261 /* This may not be aligned with current bitmaps. Recalculate. */
3262 rs->migration_dirty_pages = pages;
3263
3264 rs->last_seen_block = NULL;
3265 rs->last_sent_block = NULL;
3266 rs->last_page = 0;
3267 rs->last_version = ram_list.version;
3268 /*
3269 * Disable the bulk stage, otherwise we'll resend the whole RAM no
3270 * matter what we have sent.
3271 */
3272 rs->ram_bulk_stage = false;
3273
3274 /* Update RAMState cache of output QEMUFile */
3275 rs->f = out;
3276
3277 trace_ram_state_resume_prepare(pages);
3278}
3279
Juan Quintela3d0684b2017-03-23 15:06:39 +01003280/*
Wei Wang6bcb05f2018-12-11 16:24:50 +08003281 * This function clears bits of the free pages reported by the caller from the
3282 * migration dirty bitmap. @addr is the host address corresponding to the
3283 * start of the continuous guest free pages, and @len is the total bytes of
3284 * those pages.
3285 */
3286void qemu_guest_free_page_hint(void *addr, size_t len)
3287{
3288 RAMBlock *block;
3289 ram_addr_t offset;
3290 size_t used_len, start, npages;
3291 MigrationState *s = migrate_get_current();
3292
3293 /* This function is currently expected to be used during live migration */
3294 if (!migration_is_setup_or_active(s->state)) {
3295 return;
3296 }
3297
3298 for (; len > 0; len -= used_len, addr += used_len) {
3299 block = qemu_ram_block_from_host(addr, false, &offset);
3300 if (unlikely(!block || offset >= block->used_length)) {
3301 /*
3302 * The implementation might not support RAMBlock resize during
3303 * live migration, but it could happen in theory with future
3304 * updates. So we add a check here to capture that case.
3305 */
3306 error_report_once("%s unexpected error", __func__);
3307 return;
3308 }
3309
3310 if (len <= block->used_length - offset) {
3311 used_len = len;
3312 } else {
3313 used_len = block->used_length - offset;
3314 }
3315
3316 start = offset >> TARGET_PAGE_BITS;
3317 npages = used_len >> TARGET_PAGE_BITS;
3318
3319 qemu_mutex_lock(&ram_state->bitmap_mutex);
3320 ram_state->migration_dirty_pages -=
3321 bitmap_count_one_with_offset(block->bmap, start, npages);
3322 bitmap_clear(block->bmap, start, npages);
3323 qemu_mutex_unlock(&ram_state->bitmap_mutex);
3324 }
3325}
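/*
 * Worked example for qemu_guest_free_page_hint() (illustrative): a hint
 * covering 1 MiB that starts 64 KiB into a RAMBlock clears, with 4 KiB
 * target pages, 256 bits starting at bit 16 of that block's bmap and
 * reduces migration_dirty_pages by however many of those bits were set.
 */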
3326
3327/*
Juan Quintela3d0684b2017-03-23 15:06:39 +01003328 * Each of ram_save_setup, ram_save_iterate and ram_save_complete has
zhanghailianga91246c2016-10-27 14:42:59 +08003329 * long-running RCU critical section. When rcu-reclaims in the code
3330 * start to become numerous it will be necessary to reduce the
3331 * granularity of these critical sections.
3332 */
3333
Juan Quintela3d0684b2017-03-23 15:06:39 +01003334/**
3335 * ram_save_setup: Setup RAM for migration
3336 *
3337 * Returns zero to indicate success and negative for error
3338 *
3339 * @f: QEMUFile where to send the data
3340 * @opaque: RAMState pointer
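 *
 * Sketch of the setup-stage wire format, as emitted below: a be64 of the
 * total RAM size tagged with RAM_SAVE_FLAG_MEM_SIZE, then for each
 * migratable block a length byte plus idstr, a be64 used_length,
 * optionally a be64 page size (postcopy with non-host-sized pages) and,
 * with ignore-shared enabled, the be64 mr address plus an "ignored" byte,
 * terminated by RAM_SAVE_FLAG_EOS.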
3341 */
zhanghailianga91246c2016-10-27 14:42:59 +08003342static int ram_save_setup(QEMUFile *f, void *opaque)
3343{
Juan Quintela53518d92017-05-04 11:46:24 +02003344 RAMState **rsp = opaque;
zhanghailianga91246c2016-10-27 14:42:59 +08003345 RAMBlock *block;
3346
Xiao Guangrongdcaf4462018-03-30 15:51:20 +08003347 if (compress_threads_save_setup()) {
3348 return -1;
3349 }
3350
zhanghailianga91246c2016-10-27 14:42:59 +08003351 /* migration has already setup the bitmap, reuse it. */
3352 if (!migration_in_colo_state()) {
Peter Xu7d00ee62017-10-19 14:31:57 +08003353 if (ram_init_all(rsp) != 0) {
Xiao Guangrongdcaf4462018-03-30 15:51:20 +08003354 compress_threads_save_cleanup();
zhanghailianga91246c2016-10-27 14:42:59 +08003355 return -1;
Juan Quintela53518d92017-05-04 11:46:24 +02003356 }
zhanghailianga91246c2016-10-27 14:42:59 +08003357 }
Juan Quintela53518d92017-05-04 11:46:24 +02003358 (*rsp)->f = f;
zhanghailianga91246c2016-10-27 14:42:59 +08003359
3360 rcu_read_lock();
Juan Quintela56e93d22015-05-07 19:33:31 +02003361
Yury Kotovfbd162e2019-02-15 20:45:46 +03003362 qemu_put_be64(f, ram_bytes_total_common(true) | RAM_SAVE_FLAG_MEM_SIZE);
Juan Quintela56e93d22015-05-07 19:33:31 +02003363
Cédric Le Goaterb895de52018-05-14 08:57:00 +02003364 RAMBLOCK_FOREACH_MIGRATABLE(block) {
Juan Quintela56e93d22015-05-07 19:33:31 +02003365 qemu_put_byte(f, strlen(block->idstr));
3366 qemu_put_buffer(f, (uint8_t *)block->idstr, strlen(block->idstr));
3367 qemu_put_be64(f, block->used_length);
Dr. David Alan Gilbertef08fb32017-02-24 18:28:30 +00003368 if (migrate_postcopy_ram() && block->page_size != qemu_host_page_size) {
3369 qemu_put_be64(f, block->page_size);
3370 }
Yury Kotovfbd162e2019-02-15 20:45:46 +03003371 if (migrate_ignore_shared()) {
3372 qemu_put_be64(f, block->mr->addr);
3373 qemu_put_byte(f, ramblock_is_ignored(block) ? 1 : 0);
3374 }
Juan Quintela56e93d22015-05-07 19:33:31 +02003375 }
3376
3377 rcu_read_unlock();
3378
3379 ram_control_before_iterate(f, RAM_CONTROL_SETUP);
3380 ram_control_after_iterate(f, RAM_CONTROL_SETUP);
3381
Juan Quintela6df264a2018-02-28 09:10:07 +01003382 multifd_send_sync_main();
Juan Quintela56e93d22015-05-07 19:33:31 +02003383 qemu_put_be64(f, RAM_SAVE_FLAG_EOS);
Juan Quintela35374cb2018-04-18 10:13:21 +02003384 qemu_fflush(f);
Juan Quintela56e93d22015-05-07 19:33:31 +02003385
3386 return 0;
3387}
3388
Juan Quintela3d0684b2017-03-23 15:06:39 +01003389/**
3390 * ram_save_iterate: iterative stage for migration
3391 *
3392 * Returns zero to indicate success and negative for error
3393 *
3394 * @f: QEMUFile where to send the data
3395 * @opaque: RAMState pointer
3396 */
Juan Quintela56e93d22015-05-07 19:33:31 +02003397static int ram_save_iterate(QEMUFile *f, void *opaque)
3398{
Juan Quintela53518d92017-05-04 11:46:24 +02003399 RAMState **temp = opaque;
3400 RAMState *rs = *temp;
Juan Quintela56e93d22015-05-07 19:33:31 +02003401 int ret;
3402 int i;
3403 int64_t t0;
Thomas Huth5c903082016-11-04 14:10:17 +01003404 int done = 0;
Juan Quintela56e93d22015-05-07 19:33:31 +02003405
Peter Lievenb2557342018-03-08 12:18:24 +01003406 if (blk_mig_bulk_active()) {
3407 /* Avoid transferring ram during bulk phase of block migration as
3408 * the bulk phase will usually take a long time and transferring
3409 * ram updates during that time is pointless. */
3410 goto out;
3411 }
3412
Juan Quintela56e93d22015-05-07 19:33:31 +02003413 rcu_read_lock();
Juan Quintela6f37bb82017-03-13 19:26:29 +01003414 if (ram_list.version != rs->last_version) {
3415 ram_state_reset(rs);
Juan Quintela56e93d22015-05-07 19:33:31 +02003416 }
3417
3418 /* Read version before ram_list.blocks */
3419 smp_rmb();
3420
3421 ram_control_before_iterate(f, RAM_CONTROL_ROUND);
3422
3423 t0 = qemu_clock_get_ns(QEMU_CLOCK_REALTIME);
3424 i = 0;
Dr. David Alan Gilberte03a34f2018-06-13 11:26:42 +01003425 while ((ret = qemu_file_rate_limit(f)) == 0 ||
3426 !QSIMPLEQ_EMPTY(&rs->src_page_requests)) {
Juan Quintela56e93d22015-05-07 19:33:31 +02003427 int pages;
3428
Dr. David Alan Gilberte03a34f2018-06-13 11:26:42 +01003429 if (qemu_file_get_error(f)) {
3430 break;
3431 }
3432
Juan Quintelace25d332017-03-15 11:00:51 +01003433 pages = ram_find_and_save_block(rs, false);
Juan Quintela56e93d22015-05-07 19:33:31 +02003434        /* no more pages to send */
3435 if (pages == 0) {
Thomas Huth5c903082016-11-04 14:10:17 +01003436 done = 1;
Juan Quintela56e93d22015-05-07 19:33:31 +02003437 break;
3438 }
Xiao Guangronge8f37352018-09-03 17:26:44 +08003439
3440 if (pages < 0) {
3441 qemu_file_set_error(f, pages);
3442 break;
3443 }
3444
Xiao Guangrongbe8b02e2018-09-03 17:26:42 +08003445 rs->target_page_count += pages;
Jason J. Herne070afca2015-09-08 13:12:35 -04003446
Juan Quintela56e93d22015-05-07 19:33:31 +02003447 /* we want to check in the 1st loop, just in case it was the 1st time
3448 and we had to sync the dirty bitmap.
Wei Yanga5f7b1a2019-05-11 07:37:29 +08003449           qemu_clock_get_ns() is a bit expensive, so we only check once every
Juan Quintela56e93d22015-05-07 19:33:31 +02003450           few iterations
3451 */
3452 if ((i & 63) == 0) {
3453 uint64_t t1 = (qemu_clock_get_ns(QEMU_CLOCK_REALTIME) - t0) / 1000000;
3454 if (t1 > MAX_WAIT) {
Juan Quintela55c44462017-01-23 22:32:05 +01003455 trace_ram_save_iterate_big_wait(t1, i);
Juan Quintela56e93d22015-05-07 19:33:31 +02003456 break;
3457 }
3458 }
3459 i++;
3460 }
Juan Quintela56e93d22015-05-07 19:33:31 +02003461 rcu_read_unlock();
3462
3463 /*
3464 * Must occur before EOS (or any QEMUFile operation)
3465 * because of RDMA protocol.
3466 */
3467 ram_control_after_iterate(f, RAM_CONTROL_ROUND);
3468
Juan Quintela6df264a2018-02-28 09:10:07 +01003469 multifd_send_sync_main();
Peter Lievenb2557342018-03-08 12:18:24 +01003470out:
Juan Quintela56e93d22015-05-07 19:33:31 +02003471 qemu_put_be64(f, RAM_SAVE_FLAG_EOS);
Juan Quintela35374cb2018-04-18 10:13:21 +02003472 qemu_fflush(f);
Juan Quintela93604472017-06-06 19:49:03 +02003473 ram_counters.transferred += 8;
Juan Quintela56e93d22015-05-07 19:33:31 +02003474
3475 ret = qemu_file_get_error(f);
3476 if (ret < 0) {
3477 return ret;
3478 }
3479
Thomas Huth5c903082016-11-04 14:10:17 +01003480 return done;
Juan Quintela56e93d22015-05-07 19:33:31 +02003481}
3482
Juan Quintela3d0684b2017-03-23 15:06:39 +01003483/**
3484 * ram_save_complete: function called to send the remaining amount of ram
3485 *
Xiao Guangronge8f37352018-09-03 17:26:44 +08003486 * Returns zero to indicate success or negative on error
Juan Quintela3d0684b2017-03-23 15:06:39 +01003487 *
3488 * Called with iothread lock
3489 *
3490 * @f: QEMUFile where to send the data
3491 * @opaque: RAMState pointer
3492 */
Juan Quintela56e93d22015-05-07 19:33:31 +02003493static int ram_save_complete(QEMUFile *f, void *opaque)
3494{
Juan Quintela53518d92017-05-04 11:46:24 +02003495 RAMState **temp = opaque;
3496 RAMState *rs = *temp;
Xiao Guangronge8f37352018-09-03 17:26:44 +08003497 int ret = 0;
Juan Quintela6f37bb82017-03-13 19:26:29 +01003498
Juan Quintela56e93d22015-05-07 19:33:31 +02003499 rcu_read_lock();
3500
Juan Quintela57273092017-03-20 22:25:28 +01003501 if (!migration_in_postcopy()) {
Wei Wangbd227062018-12-11 16:24:51 +08003502 migration_bitmap_sync_precopy(rs);
Dr. David Alan Gilbert663e6c12015-11-05 18:11:13 +00003503 }
Juan Quintela56e93d22015-05-07 19:33:31 +02003504
3505 ram_control_before_iterate(f, RAM_CONTROL_FINISH);
3506
3507 /* try transferring iterative blocks of memory */
3508
3509 /* flush all remaining blocks regardless of rate limiting */
3510 while (true) {
3511 int pages;
3512
Juan Quintelace25d332017-03-15 11:00:51 +01003513 pages = ram_find_and_save_block(rs, !migration_in_colo_state());
Juan Quintela56e93d22015-05-07 19:33:31 +02003514        /* no more blocks to send */
3515 if (pages == 0) {
3516 break;
3517 }
Xiao Guangronge8f37352018-09-03 17:26:44 +08003518 if (pages < 0) {
3519 ret = pages;
3520 break;
3521 }
Juan Quintela56e93d22015-05-07 19:33:31 +02003522 }
3523
Juan Quintelace25d332017-03-15 11:00:51 +01003524 flush_compressed_data(rs);
Juan Quintela56e93d22015-05-07 19:33:31 +02003525 ram_control_after_iterate(f, RAM_CONTROL_FINISH);
Juan Quintela56e93d22015-05-07 19:33:31 +02003526
3527 rcu_read_unlock();
Paolo Bonzinid09a6fd2015-07-09 08:47:58 +02003528
Juan Quintela6df264a2018-02-28 09:10:07 +01003529 multifd_send_sync_main();
Juan Quintela56e93d22015-05-07 19:33:31 +02003530 qemu_put_be64(f, RAM_SAVE_FLAG_EOS);
Juan Quintela35374cb2018-04-18 10:13:21 +02003531 qemu_fflush(f);
Juan Quintela56e93d22015-05-07 19:33:31 +02003532
Xiao Guangronge8f37352018-09-03 17:26:44 +08003533 return ret;
Juan Quintela56e93d22015-05-07 19:33:31 +02003534}
3535
Dr. David Alan Gilbertc31b0982015-11-05 18:10:54 +00003536static void ram_save_pending(QEMUFile *f, void *opaque, uint64_t max_size,
Vladimir Sementsov-Ogievskiy47995022018-03-13 15:34:00 -04003537 uint64_t *res_precopy_only,
3538 uint64_t *res_compatible,
3539 uint64_t *res_postcopy_only)
Juan Quintela56e93d22015-05-07 19:33:31 +02003540{
Juan Quintela53518d92017-05-04 11:46:24 +02003541 RAMState **temp = opaque;
3542 RAMState *rs = *temp;
Juan Quintela56e93d22015-05-07 19:33:31 +02003543 uint64_t remaining_size;
3544
Juan Quintela9edabd42017-03-14 12:02:16 +01003545 remaining_size = rs->migration_dirty_pages * TARGET_PAGE_SIZE;
Juan Quintela56e93d22015-05-07 19:33:31 +02003546
Juan Quintela57273092017-03-20 22:25:28 +01003547 if (!migration_in_postcopy() &&
Dr. David Alan Gilbert663e6c12015-11-05 18:11:13 +00003548 remaining_size < max_size) {
Juan Quintela56e93d22015-05-07 19:33:31 +02003549 qemu_mutex_lock_iothread();
3550 rcu_read_lock();
Wei Wangbd227062018-12-11 16:24:51 +08003551 migration_bitmap_sync_precopy(rs);
Juan Quintela56e93d22015-05-07 19:33:31 +02003552 rcu_read_unlock();
3553 qemu_mutex_unlock_iothread();
Juan Quintela9edabd42017-03-14 12:02:16 +01003554 remaining_size = rs->migration_dirty_pages * TARGET_PAGE_SIZE;
Juan Quintela56e93d22015-05-07 19:33:31 +02003555 }
Dr. David Alan Gilbertc31b0982015-11-05 18:10:54 +00003556
Vladimir Sementsov-Ogievskiy86e11672017-07-10 19:30:15 +03003557 if (migrate_postcopy_ram()) {
3558 /* We can do postcopy, and all the data is postcopiable */
Vladimir Sementsov-Ogievskiy47995022018-03-13 15:34:00 -04003559 *res_compatible += remaining_size;
Vladimir Sementsov-Ogievskiy86e11672017-07-10 19:30:15 +03003560 } else {
Vladimir Sementsov-Ogievskiy47995022018-03-13 15:34:00 -04003561 *res_precopy_only += remaining_size;
Vladimir Sementsov-Ogievskiy86e11672017-07-10 19:30:15 +03003562 }
Juan Quintela56e93d22015-05-07 19:33:31 +02003563}
3564
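/*
 * Stream layout consumed by load_xbzrle() below: one byte of flags that
 * must be ENCODING_FLAG_XBZRLE, a big-endian 16-bit length no larger than
 * TARGET_PAGE_SIZE, then that many bytes of XBZRLE-encoded delta which is
 * decoded against the existing contents of 'host'.
 */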
3565static int load_xbzrle(QEMUFile *f, ram_addr_t addr, void *host)
3566{
3567 unsigned int xh_len;
3568 int xh_flags;
Dr. David Alan Gilbert063e7602015-12-16 11:47:37 +00003569 uint8_t *loaded_data;
Juan Quintela56e93d22015-05-07 19:33:31 +02003570
Juan Quintela56e93d22015-05-07 19:33:31 +02003571 /* extract RLE header */
3572 xh_flags = qemu_get_byte(f);
3573 xh_len = qemu_get_be16(f);
3574
3575 if (xh_flags != ENCODING_FLAG_XBZRLE) {
3576 error_report("Failed to load XBZRLE page - wrong compression!");
3577 return -1;
3578 }
3579
3580 if (xh_len > TARGET_PAGE_SIZE) {
3581 error_report("Failed to load XBZRLE page - len overflow!");
3582 return -1;
3583 }
Juan Quintelaf265e0e2017-06-28 11:52:27 +02003584 loaded_data = XBZRLE.decoded_buf;
Juan Quintela56e93d22015-05-07 19:33:31 +02003585 /* load data and decode */
Juan Quintelaf265e0e2017-06-28 11:52:27 +02003586 /* it can change loaded_data to point to an internal buffer */
Dr. David Alan Gilbert063e7602015-12-16 11:47:37 +00003587 qemu_get_buffer_in_place(f, &loaded_data, xh_len);
Juan Quintela56e93d22015-05-07 19:33:31 +02003588
3589 /* decode RLE */
Dr. David Alan Gilbert063e7602015-12-16 11:47:37 +00003590 if (xbzrle_decode_buffer(loaded_data, xh_len, host,
Juan Quintela56e93d22015-05-07 19:33:31 +02003591 TARGET_PAGE_SIZE) == -1) {
3592 error_report("Failed to load XBZRLE page - decode error!");
3593 return -1;
3594 }
3595
3596 return 0;
3597}
3598
Juan Quintela3d0684b2017-03-23 15:06:39 +01003599/**
3600 * ram_block_from_stream: read a RAMBlock id from the migration stream
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00003601 *
Juan Quintela3d0684b2017-03-23 15:06:39 +01003602 * Must be called from within a rcu critical section.
3603 *
3604 * Returns a pointer from within the RCU-protected ram_list.
3605 *
3606 * @f: QEMUFile where to read the data from
3607 * @flags: Page flags (mostly to see if it's a continuation of previous block)
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00003608 */
Juan Quintela3d0684b2017-03-23 15:06:39 +01003609static inline RAMBlock *ram_block_from_stream(QEMUFile *f, int flags)
Juan Quintela56e93d22015-05-07 19:33:31 +02003610{
3611 static RAMBlock *block = NULL;
3612 char id[256];
3613 uint8_t len;
3614
3615 if (flags & RAM_SAVE_FLAG_CONTINUE) {
zhanghailiang4c4bad42016-01-15 11:37:41 +08003616 if (!block) {
Juan Quintela56e93d22015-05-07 19:33:31 +02003617 error_report("Ack, bad migration stream!");
3618 return NULL;
3619 }
zhanghailiang4c4bad42016-01-15 11:37:41 +08003620 return block;
Juan Quintela56e93d22015-05-07 19:33:31 +02003621 }
3622
3623 len = qemu_get_byte(f);
3624 qemu_get_buffer(f, (uint8_t *)id, len);
3625 id[len] = 0;
3626
Dr. David Alan Gilberte3dd7492015-11-05 18:10:33 +00003627 block = qemu_ram_block_by_name(id);
zhanghailiang4c4bad42016-01-15 11:37:41 +08003628 if (!block) {
3629 error_report("Can't find block %s", id);
3630 return NULL;
Juan Quintela56e93d22015-05-07 19:33:31 +02003631 }
3632
Yury Kotovfbd162e2019-02-15 20:45:46 +03003633 if (ramblock_is_ignored(block)) {
Cédric Le Goaterb895de52018-05-14 08:57:00 +02003634 error_report("block %s should not be migrated !", id);
3635 return NULL;
3636 }
3637
zhanghailiang4c4bad42016-01-15 11:37:41 +08003638 return block;
3639}
3640
3641static inline void *host_from_ram_block_offset(RAMBlock *block,
3642 ram_addr_t offset)
3643{
3644 if (!offset_in_ramblock(block, offset)) {
3645 return NULL;
3646 }
3647
3648 return block->host + offset;
Juan Quintela56e93d22015-05-07 19:33:31 +02003649}
3650
Zhang Chen13af18f2018-09-03 12:38:48 +08003651static inline void *colo_cache_from_block_offset(RAMBlock *block,
3652 ram_addr_t offset)
3653{
3654 if (!offset_in_ramblock(block, offset)) {
3655 return NULL;
3656 }
3657 if (!block->colo_cache) {
3658 error_report("%s: colo_cache is NULL in block :%s",
3659 __func__, block->idstr);
3660 return NULL;
3661 }
Zhang Chen7d9acaf2018-09-03 12:38:49 +08003662
3663 /*
 3664     * During colo checkpoint, we need a bitmap of these migrated pages.
 3665     * It helps us to decide which pages in the ram cache should be flushed
3666 * into VM's RAM later.
3667 */
3668 if (!test_and_set_bit(offset >> TARGET_PAGE_BITS, block->bmap)) {
3669 ram_state->migration_dirty_pages++;
3670 }
Zhang Chen13af18f2018-09-03 12:38:48 +08003671 return block->colo_cache + offset;
3672}
3673
Juan Quintela3d0684b2017-03-23 15:06:39 +01003674/**
3675 * ram_handle_compressed: handle the zero page case
3676 *
Juan Quintela56e93d22015-05-07 19:33:31 +02003677 * If a page (or a whole RDMA chunk) has been
3678 * determined to be zero, then zap it.
Juan Quintela3d0684b2017-03-23 15:06:39 +01003679 *
3680 * @host: host address for the zero page
3681 * @ch: what the page is filled from. We only support zero
3682 * @size: size of the zero page
Juan Quintela56e93d22015-05-07 19:33:31 +02003683 */
3684void ram_handle_compressed(void *host, uint8_t ch, uint64_t size)
3685{
3686 if (ch != 0 || !is_zero_range(host, size)) {
3687 memset(host, ch, size);
3688 }
3689}
3690
Xiao Guangrong797ca152018-03-30 15:51:21 +08003691/* return the size after decompression, or negative value on error */
3692static int
3693qemu_uncompress_data(z_stream *stream, uint8_t *dest, size_t dest_len,
3694 const uint8_t *source, size_t source_len)
3695{
3696 int err;
3697
3698 err = inflateReset(stream);
3699 if (err != Z_OK) {
3700 return -1;
3701 }
3702
3703 stream->avail_in = source_len;
3704 stream->next_in = (uint8_t *)source;
3705 stream->avail_out = dest_len;
3706 stream->next_out = dest;
3707
3708 err = inflate(stream, Z_NO_FLUSH);
3709 if (err != Z_STREAM_END) {
3710 return -1;
3711 }
3712
3713 return stream->total_out;
3714}
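/*
 * For reference only, an illustrative sketch of the matching compression
 * step using plain zlib (the real sender side lives earlier in this file
 * and manages its own streams and buffering; nothing calls this sketch).
 * It assumes 'stream' was set up with deflateInit().
 */
static int __attribute__((unused))
example_compress_data(z_stream *stream, uint8_t *dest, size_t dest_len,
                      const uint8_t *source, size_t source_len)
{
    int err;

    err = deflateReset(stream);
    if (err != Z_OK) {
        return -1;
    }

    stream->avail_in = source_len;
    stream->next_in = (uint8_t *)source;
    stream->avail_out = dest_len;
    stream->next_out = dest;

    /* Z_FINISH: either the page compresses into 'dest' in one go or we fail */
    err = deflate(stream, Z_FINISH);
    if (err != Z_STREAM_END) {
        return -1;
    }

    return stream->total_out;
}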
3715
Juan Quintela56e93d22015-05-07 19:33:31 +02003716static void *do_data_decompress(void *opaque)
3717{
3718 DecompressParam *param = opaque;
3719 unsigned long pagesize;
Liang Li33d151f2016-05-05 15:32:58 +08003720 uint8_t *des;
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08003721 int len, ret;
Juan Quintela56e93d22015-05-07 19:33:31 +02003722
Liang Li33d151f2016-05-05 15:32:58 +08003723 qemu_mutex_lock(&param->mutex);
Liang Li90e56fb2016-05-05 15:32:56 +08003724 while (!param->quit) {
Liang Li33d151f2016-05-05 15:32:58 +08003725 if (param->des) {
3726 des = param->des;
3727 len = param->len;
3728 param->des = 0;
3729 qemu_mutex_unlock(&param->mutex);
3730
Liang Li73a89122016-05-05 15:32:51 +08003731 pagesize = TARGET_PAGE_SIZE;
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08003732
3733 ret = qemu_uncompress_data(&param->stream, des, pagesize,
3734 param->compbuf, len);
Xiao Guangrongf5482222018-05-03 16:06:11 +08003735 if (ret < 0 && migrate_get_current()->decompress_error_check) {
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08003736 error_report("decompress data failed");
3737 qemu_file_set_error(decomp_file, ret);
3738 }
Liang Li73a89122016-05-05 15:32:51 +08003739
Liang Li33d151f2016-05-05 15:32:58 +08003740 qemu_mutex_lock(&decomp_done_lock);
3741 param->done = true;
3742 qemu_cond_signal(&decomp_done_cond);
3743 qemu_mutex_unlock(&decomp_done_lock);
3744
3745 qemu_mutex_lock(&param->mutex);
3746 } else {
3747 qemu_cond_wait(&param->cond, &param->mutex);
3748 }
Juan Quintela56e93d22015-05-07 19:33:31 +02003749 }
Liang Li33d151f2016-05-05 15:32:58 +08003750 qemu_mutex_unlock(&param->mutex);
Juan Quintela56e93d22015-05-07 19:33:31 +02003751
3752 return NULL;
3753}
3754
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08003755static int wait_for_decompress_done(void)
Liang Li5533b2e2016-05-05 15:32:52 +08003756{
3757 int idx, thread_count;
3758
3759 if (!migrate_use_compression()) {
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08003760 return 0;
Liang Li5533b2e2016-05-05 15:32:52 +08003761 }
3762
3763 thread_count = migrate_decompress_threads();
3764 qemu_mutex_lock(&decomp_done_lock);
3765 for (idx = 0; idx < thread_count; idx++) {
3766 while (!decomp_param[idx].done) {
3767 qemu_cond_wait(&decomp_done_cond, &decomp_done_lock);
3768 }
3769 }
3770 qemu_mutex_unlock(&decomp_done_lock);
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08003771 return qemu_file_get_error(decomp_file);
Liang Li5533b2e2016-05-05 15:32:52 +08003772}
3773
Juan Quintelaf0afa332017-06-28 11:52:28 +02003774static void compress_threads_load_cleanup(void)
Juan Quintela56e93d22015-05-07 19:33:31 +02003775{
3776 int i, thread_count;
3777
Juan Quintela3416ab52016-04-20 11:56:01 +02003778 if (!migrate_use_compression()) {
3779 return;
3780 }
Juan Quintela56e93d22015-05-07 19:33:31 +02003781 thread_count = migrate_decompress_threads();
3782 for (i = 0; i < thread_count; i++) {
Xiao Guangrong797ca152018-03-30 15:51:21 +08003783 /*
 3784         * we use it as an indicator which shows if the thread is
3785 * properly init'd or not
3786 */
3787 if (!decomp_param[i].compbuf) {
3788 break;
3789 }
3790
Juan Quintela56e93d22015-05-07 19:33:31 +02003791 qemu_mutex_lock(&decomp_param[i].mutex);
Liang Li90e56fb2016-05-05 15:32:56 +08003792 decomp_param[i].quit = true;
Juan Quintela56e93d22015-05-07 19:33:31 +02003793 qemu_cond_signal(&decomp_param[i].cond);
3794 qemu_mutex_unlock(&decomp_param[i].mutex);
3795 }
3796 for (i = 0; i < thread_count; i++) {
Xiao Guangrong797ca152018-03-30 15:51:21 +08003797 if (!decomp_param[i].compbuf) {
3798 break;
3799 }
3800
Juan Quintela56e93d22015-05-07 19:33:31 +02003801 qemu_thread_join(decompress_threads + i);
3802 qemu_mutex_destroy(&decomp_param[i].mutex);
3803 qemu_cond_destroy(&decomp_param[i].cond);
Xiao Guangrong797ca152018-03-30 15:51:21 +08003804 inflateEnd(&decomp_param[i].stream);
Juan Quintela56e93d22015-05-07 19:33:31 +02003805 g_free(decomp_param[i].compbuf);
Xiao Guangrong797ca152018-03-30 15:51:21 +08003806 decomp_param[i].compbuf = NULL;
Juan Quintela56e93d22015-05-07 19:33:31 +02003807 }
3808 g_free(decompress_threads);
3809 g_free(decomp_param);
Juan Quintela56e93d22015-05-07 19:33:31 +02003810 decompress_threads = NULL;
3811 decomp_param = NULL;
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08003812 decomp_file = NULL;
Juan Quintela56e93d22015-05-07 19:33:31 +02003813}
3814
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08003815static int compress_threads_load_setup(QEMUFile *f)
Xiao Guangrong797ca152018-03-30 15:51:21 +08003816{
3817 int i, thread_count;
3818
3819 if (!migrate_use_compression()) {
3820 return 0;
3821 }
3822
3823 thread_count = migrate_decompress_threads();
3824 decompress_threads = g_new0(QemuThread, thread_count);
3825 decomp_param = g_new0(DecompressParam, thread_count);
3826 qemu_mutex_init(&decomp_done_lock);
3827 qemu_cond_init(&decomp_done_cond);
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08003828 decomp_file = f;
Xiao Guangrong797ca152018-03-30 15:51:21 +08003829 for (i = 0; i < thread_count; i++) {
3830 if (inflateInit(&decomp_param[i].stream) != Z_OK) {
3831 goto exit;
3832 }
3833
3834 decomp_param[i].compbuf = g_malloc0(compressBound(TARGET_PAGE_SIZE));
3835 qemu_mutex_init(&decomp_param[i].mutex);
3836 qemu_cond_init(&decomp_param[i].cond);
3837 decomp_param[i].done = true;
3838 decomp_param[i].quit = false;
3839 qemu_thread_create(decompress_threads + i, "decompress",
3840 do_data_decompress, decomp_param + i,
3841 QEMU_THREAD_JOINABLE);
3842 }
3843 return 0;
3844exit:
3845 compress_threads_load_cleanup();
3846 return -1;
3847}
3848
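/*
 * decompress_data_with_multi_threads: queue one compressed page
 *
 * Reads 'len' bytes of compressed data from 'f' and hands them to an
 * idle decompression thread; blocks on decomp_done_cond until one of
 * the threads becomes available.
 */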
Dr. David Alan Gilbertc1bc6622015-12-16 11:47:38 +00003849static void decompress_data_with_multi_threads(QEMUFile *f,
Juan Quintela56e93d22015-05-07 19:33:31 +02003850 void *host, int len)
3851{
3852 int idx, thread_count;
3853
3854 thread_count = migrate_decompress_threads();
Liang Li73a89122016-05-05 15:32:51 +08003855 qemu_mutex_lock(&decomp_done_lock);
Juan Quintela56e93d22015-05-07 19:33:31 +02003856 while (true) {
3857 for (idx = 0; idx < thread_count; idx++) {
Liang Li73a89122016-05-05 15:32:51 +08003858 if (decomp_param[idx].done) {
Liang Li33d151f2016-05-05 15:32:58 +08003859 decomp_param[idx].done = false;
3860 qemu_mutex_lock(&decomp_param[idx].mutex);
Dr. David Alan Gilbertc1bc6622015-12-16 11:47:38 +00003861 qemu_get_buffer(f, decomp_param[idx].compbuf, len);
Juan Quintela56e93d22015-05-07 19:33:31 +02003862 decomp_param[idx].des = host;
3863 decomp_param[idx].len = len;
Liang Li33d151f2016-05-05 15:32:58 +08003864 qemu_cond_signal(&decomp_param[idx].cond);
3865 qemu_mutex_unlock(&decomp_param[idx].mutex);
Juan Quintela56e93d22015-05-07 19:33:31 +02003866 break;
3867 }
3868 }
3869 if (idx < thread_count) {
3870 break;
Liang Li73a89122016-05-05 15:32:51 +08003871 } else {
3872 qemu_cond_wait(&decomp_done_cond, &decomp_done_lock);
Juan Quintela56e93d22015-05-07 19:33:31 +02003873 }
3874 }
Liang Li73a89122016-05-05 15:32:51 +08003875 qemu_mutex_unlock(&decomp_done_lock);
Juan Quintela56e93d22015-05-07 19:33:31 +02003876}
3877
Zhang Chen13af18f2018-09-03 12:38:48 +08003878/*
3879 * colo cache: this is for the secondary VM, where we cache the whole
3880 * memory of the secondary VM.  The global lock must be held when
3881 * calling this helper.
3882 */
3883int colo_init_ram_cache(void)
3884{
3885 RAMBlock *block;
3886
3887 rcu_read_lock();
Yury Kotovfbd162e2019-02-15 20:45:46 +03003888 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Zhang Chen13af18f2018-09-03 12:38:48 +08003889 block->colo_cache = qemu_anon_ram_alloc(block->used_length,
3890 NULL,
3891 false);
3892 if (!block->colo_cache) {
3893 error_report("%s: Can't alloc memory for COLO cache of block %s, "
3894 "size 0x" RAM_ADDR_FMT, __func__, block->idstr,
3895 block->used_length);
3896 goto out_locked;
3897 }
3898 memcpy(block->colo_cache, block->host, block->used_length);
3899 }
3900 rcu_read_unlock();
Zhang Chen7d9acaf2018-09-03 12:38:49 +08003901 /*
3902 * Record the dirty pages sent by the PVM; this dirty bitmap is used
3903 * to decide which pages in the cache should be flushed into the SVM's
3904 * RAM.  Here we use the same name 'ram_bitmap' as for migration.
3905 */
3906 if (ram_bytes_total()) {
3907 RAMBlock *block;
3908
Yury Kotovfbd162e2019-02-15 20:45:46 +03003909 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Zhang Chen7d9acaf2018-09-03 12:38:49 +08003910 unsigned long pages = block->max_length >> TARGET_PAGE_BITS;
3911
3912 block->bmap = bitmap_new(pages);
3913 bitmap_set(block->bmap, 0, pages);
3914 }
3915 }
3916 ram_state = g_new0(RAMState, 1);
3917 ram_state->migration_dirty_pages = 0;
Zhang Chenc6e5baf2019-03-30 06:29:51 +08003918 qemu_mutex_init(&ram_state->bitmap_mutex);
zhanghailiangd1955d22018-09-03 12:38:55 +08003919 memory_global_dirty_log_start();
Zhang Chen7d9acaf2018-09-03 12:38:49 +08003920
Zhang Chen13af18f2018-09-03 12:38:48 +08003921 return 0;
3922
3923out_locked:
Zhang Chen7d9acaf2018-09-03 12:38:49 +08003924
Yury Kotovfbd162e2019-02-15 20:45:46 +03003925 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Zhang Chen13af18f2018-09-03 12:38:48 +08003926 if (block->colo_cache) {
3927 qemu_anon_ram_free(block->colo_cache, block->used_length);
3928 block->colo_cache = NULL;
3929 }
3930 }
3931
3932 rcu_read_unlock();
3933 return -errno;
3934}
3935
3936/* The global lock must be held when calling this helper */
3937void colo_release_ram_cache(void)
3938{
3939 RAMBlock *block;
3940
zhanghailiangd1955d22018-09-03 12:38:55 +08003941 memory_global_dirty_log_stop();
Yury Kotovfbd162e2019-02-15 20:45:46 +03003942 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Zhang Chen7d9acaf2018-09-03 12:38:49 +08003943 g_free(block->bmap);
3944 block->bmap = NULL;
3945 }
3946
Zhang Chen13af18f2018-09-03 12:38:48 +08003947 rcu_read_lock();
Zhang Chen7d9acaf2018-09-03 12:38:49 +08003948
Yury Kotovfbd162e2019-02-15 20:45:46 +03003949 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Zhang Chen13af18f2018-09-03 12:38:48 +08003950 if (block->colo_cache) {
3951 qemu_anon_ram_free(block->colo_cache, block->used_length);
3952 block->colo_cache = NULL;
3953 }
3954 }
Zhang Chen7d9acaf2018-09-03 12:38:49 +08003955
Zhang Chen13af18f2018-09-03 12:38:48 +08003956 rcu_read_unlock();
Zhang Chenc6e5baf2019-03-30 06:29:51 +08003957 qemu_mutex_destroy(&ram_state->bitmap_mutex);
Zhang Chen7d9acaf2018-09-03 12:38:49 +08003958 g_free(ram_state);
3959 ram_state = NULL;
Zhang Chen13af18f2018-09-03 12:38:48 +08003960}
3961
Juan Quintela3d0684b2017-03-23 15:06:39 +01003962/**
Juan Quintelaf265e0e2017-06-28 11:52:27 +02003963 * ram_load_setup: Setup RAM for migration incoming side
3964 *
3965 * Returns zero to indicate success and negative for error
3966 *
3967 * @f: QEMUFile where to receive the data
3968 * @opaque: RAMState pointer
3969 */
3970static int ram_load_setup(QEMUFile *f, void *opaque)
3971{
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08003972 if (compress_threads_load_setup(f)) {
Xiao Guangrong797ca152018-03-30 15:51:21 +08003973 return -1;
3974 }
3975
Juan Quintelaf265e0e2017-06-28 11:52:27 +02003976 xbzrle_load_setup();
Alexey Perevalovf9494612017-10-05 14:13:20 +03003977 ramblock_recv_map_init();
Zhang Chen13af18f2018-09-03 12:38:48 +08003978
Juan Quintelaf265e0e2017-06-28 11:52:27 +02003979 return 0;
3980}
3981
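/*
 * ram_load_cleanup: free incoming-side RAM state
 *
 * Persists pmem-backed blocks, tears down the xbzrle and decompression
 * state, and releases each block's receivedmap.
 */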
3982static int ram_load_cleanup(void *opaque)
3983{
Alexey Perevalovf9494612017-10-05 14:13:20 +03003984 RAMBlock *rb;
Junyan He56eb90a2018-07-18 15:48:03 +08003985
Yury Kotovfbd162e2019-02-15 20:45:46 +03003986 RAMBLOCK_FOREACH_NOT_IGNORED(rb) {
Junyan He56eb90a2018-07-18 15:48:03 +08003987 if (ramblock_is_pmem(rb)) {
3988 pmem_persist(rb->host, rb->used_length);
3989 }
3990 }
3991
Juan Quintelaf265e0e2017-06-28 11:52:27 +02003992 xbzrle_load_cleanup();
Juan Quintelaf0afa332017-06-28 11:52:28 +02003993 compress_threads_load_cleanup();
Alexey Perevalovf9494612017-10-05 14:13:20 +03003994
Yury Kotovfbd162e2019-02-15 20:45:46 +03003995 RAMBLOCK_FOREACH_NOT_IGNORED(rb) {
Alexey Perevalovf9494612017-10-05 14:13:20 +03003996 g_free(rb->receivedmap);
3997 rb->receivedmap = NULL;
3998 }
Zhang Chen13af18f2018-09-03 12:38:48 +08003999
Juan Quintelaf265e0e2017-06-28 11:52:27 +02004000 return 0;
4001}
4002
4003/**
Juan Quintela3d0684b2017-03-23 15:06:39 +01004004 * ram_postcopy_incoming_init: allocate postcopy data structures
4005 *
4006 * Returns 0 for success and negative on error
4007 *
4008 * @mis: current migration incoming state
4009 *
4010 * Allocate data structures etc needed by incoming migration with
4011 * postcopy-ram. postcopy-ram's similarly named
4012 * postcopy_ram_incoming_init does the work.
Dr. David Alan Gilbert1caddf82015-11-05 18:11:03 +00004013 */
4014int ram_postcopy_incoming_init(MigrationIncomingState *mis)
4015{
David Hildenbrandc1361802018-06-20 22:27:36 +02004016 return postcopy_ram_incoming_init(mis);
Dr. David Alan Gilbert1caddf82015-11-05 18:11:03 +00004017}
4018
Juan Quintela3d0684b2017-03-23 15:06:39 +01004019/**
4020 * ram_load_postcopy: load a page in postcopy case
4021 *
4022 * Returns 0 for success or -errno in case of error
4023 *
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004024 * Called in postcopy mode by ram_load().
4025 * rcu_read_lock is taken prior to this being called.
Juan Quintela3d0684b2017-03-23 15:06:39 +01004026 *
4027 * @f: QEMUFile to receive the data from
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004028 */
4029static int ram_load_postcopy(QEMUFile *f)
4030{
4031 int flags = 0, ret = 0;
4032 bool place_needed = false;
Peter Xu1aa83672018-07-10 17:18:53 +08004033 bool matches_target_page_size = false;
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004034 MigrationIncomingState *mis = migration_incoming_get_current();
4035 /* Temporary page that is later 'placed' */
4036 void *postcopy_host_page = postcopy_get_tmp_page(mis);
Dr. David Alan Gilbertc53b7dd2015-11-05 18:11:12 +00004037 void *last_host = NULL;
Dr. David Alan Gilberta3b6ff62015-11-11 14:02:28 +00004038 bool all_zero = false;
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004039
4040 while (!ret && !(flags & RAM_SAVE_FLAG_EOS)) {
4041 ram_addr_t addr;
4042 void *host = NULL;
4043 void *page_buffer = NULL;
4044 void *place_source = NULL;
Dr. David Alan Gilbertdf9ff5e2017-02-24 18:28:35 +00004045 RAMBlock *block = NULL;
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004046 uint8_t ch;
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004047
4048 addr = qemu_get_be64(f);
Peter Xu7a9ddfb2018-02-08 18:31:05 +08004049
4050 /*
4051 * If there is a qemu file error, we should stop here; "addr"
4052 * may then be invalid
4053 */
4054 ret = qemu_file_get_error(f);
4055 if (ret) {
4056 break;
4057 }
4058
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004059 flags = addr & ~TARGET_PAGE_MASK;
4060 addr &= TARGET_PAGE_MASK;
4061
4062 trace_ram_load_postcopy_loop((uint64_t)addr, flags);
4063 place_needed = false;
Juan Quintelabb890ed2017-04-28 09:39:55 +02004064 if (flags & (RAM_SAVE_FLAG_ZERO | RAM_SAVE_FLAG_PAGE)) {
Dr. David Alan Gilbertdf9ff5e2017-02-24 18:28:35 +00004065 block = ram_block_from_stream(f, flags);
zhanghailiang4c4bad42016-01-15 11:37:41 +08004066
4067 host = host_from_ram_block_offset(block, addr);
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004068 if (!host) {
4069 error_report("Illegal RAM offset " RAM_ADDR_FMT, addr);
4070 ret = -EINVAL;
4071 break;
4072 }
Peter Xu1aa83672018-07-10 17:18:53 +08004073 matches_target_page_size = block->page_size == TARGET_PAGE_SIZE;
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004074 /*
Dr. David Alan Gilbert28abd202017-02-24 18:28:37 +00004075 * Postcopy requires that we place whole host pages atomically;
4076 * these may be huge pages for RAMBlocks that are backed by
4077 * hugetlbfs.
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004078 * To make it atomic, the data is read into a temporary page
4079 * that's moved into place later.
4080 * The migration protocol uses, possibly smaller, target-pages
4081 * however the source ensures it always sends all the components
4082 * of a host page in order.
4083 */
4084 page_buffer = postcopy_host_page +
Dr. David Alan Gilbert28abd202017-02-24 18:28:37 +00004085 ((uintptr_t)host & (block->page_size - 1));
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004086 /* If all target pages are zero then we can optimise the place */
Dr. David Alan Gilbert28abd202017-02-24 18:28:37 +00004087 if (!((uintptr_t)host & (block->page_size - 1))) {
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004088 all_zero = true;
Dr. David Alan Gilbertc53b7dd2015-11-05 18:11:12 +00004089 } else {
4090 /* not the first target page within the host page */
4091 if (host != (last_host + TARGET_PAGE_SIZE)) {
Markus Armbruster9af9e0f2015-12-18 16:35:19 +01004092 error_report("Non-sequential target page %p/%p",
Dr. David Alan Gilbertc53b7dd2015-11-05 18:11:12 +00004093 host, last_host);
4094 ret = -EINVAL;
4095 break;
4096 }
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004097 }
4098
Dr. David Alan Gilbertc53b7dd2015-11-05 18:11:12 +00004099
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004100 /*
4101 * If it's the last part of a host page then we place the host
4102 * page
4103 */
4104 place_needed = (((uintptr_t)host + TARGET_PAGE_SIZE) &
Dr. David Alan Gilbert28abd202017-02-24 18:28:37 +00004105 (block->page_size - 1)) == 0;
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004106 place_source = postcopy_host_page;
4107 }
Dr. David Alan Gilbertc53b7dd2015-11-05 18:11:12 +00004108 last_host = host;
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004109
4110 switch (flags & ~RAM_SAVE_FLAG_CONTINUE) {
Juan Quintelabb890ed2017-04-28 09:39:55 +02004111 case RAM_SAVE_FLAG_ZERO:
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004112 ch = qemu_get_byte(f);
4113 memset(page_buffer, ch, TARGET_PAGE_SIZE);
4114 if (ch) {
4115 all_zero = false;
4116 }
4117 break;
4118
4119 case RAM_SAVE_FLAG_PAGE:
4120 all_zero = false;
Peter Xu1aa83672018-07-10 17:18:53 +08004121 if (!matches_target_page_size) {
4122 /* For huge pages, we always use temporary buffer */
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004123 qemu_get_buffer(f, page_buffer, TARGET_PAGE_SIZE);
4124 } else {
Peter Xu1aa83672018-07-10 17:18:53 +08004125 /*
4126 * For small pages that match the target page size, we
4127 * avoid the qemu_file copy. Instead we directly use
4128 * the buffer of QEMUFile to place the page. Note: we
4129 * must not perform any other QEMUFile operation before
4130 * using that buffer, to make sure it is still valid when
4131 * placing the page.
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004132 */
4133 qemu_get_buffer_in_place(f, (uint8_t **)&place_source,
4134 TARGET_PAGE_SIZE);
4135 }
4136 break;
4137 case RAM_SAVE_FLAG_EOS:
4138 /* normal exit */
Juan Quintela6df264a2018-02-28 09:10:07 +01004139 multifd_recv_sync_main();
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004140 break;
4141 default:
4142 error_report("Unknown combination of migration flags: %#x"
4143 " (postcopy mode)", flags);
4144 ret = -EINVAL;
Peter Xu7a9ddfb2018-02-08 18:31:05 +08004145 break;
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004146 }
4147
Peter Xu7a9ddfb2018-02-08 18:31:05 +08004148 /* Detect for any possible file errors */
4149 if (!ret && qemu_file_get_error(f)) {
4150 ret = qemu_file_get_error(f);
4151 }
4152
4153 if (!ret && place_needed) {
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004154 /* This gets called at the last target page in the host page */
Dr. David Alan Gilbertdf9ff5e2017-02-24 18:28:35 +00004155 void *place_dest = host + TARGET_PAGE_SIZE - block->page_size;
4156
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004157 if (all_zero) {
Dr. David Alan Gilbertdf9ff5e2017-02-24 18:28:35 +00004158 ret = postcopy_place_page_zero(mis, place_dest,
Alexey Perevalov8be46202017-10-05 14:13:18 +03004159 block);
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004160 } else {
Dr. David Alan Gilbertdf9ff5e2017-02-24 18:28:35 +00004161 ret = postcopy_place_page(mis, place_dest,
Alexey Perevalov8be46202017-10-05 14:13:18 +03004162 place_source, block);
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004163 }
4164 }
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004165 }
4166
4167 return ret;
4168}
4169
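/*
 * Helpers that query the incoming postcopy state machine: "advised"
 * means the source has announced the postcopy capability, "running"
 * means we have already reached the listening phase or later.
 */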
Daniel Henrique Barbozaacab30b2017-11-16 20:35:26 -02004170static bool postcopy_is_advised(void)
4171{
4172 PostcopyState ps = postcopy_state_get();
4173 return ps >= POSTCOPY_INCOMING_ADVISE && ps < POSTCOPY_INCOMING_END;
4174}
4175
4176static bool postcopy_is_running(void)
4177{
4178 PostcopyState ps = postcopy_state_get();
4179 return ps >= POSTCOPY_INCOMING_LISTENING && ps < POSTCOPY_INCOMING_END;
4180}
4181
Zhang Chene6f4aa12018-09-03 12:38:50 +08004182/*
4183 * Flush the content of the RAM cache into the SVM's memory.
4184 * Only flush the pages that have been dirtied by the PVM, the SVM, or both.
4185 */
4186static void colo_flush_ram_cache(void)
4187{
4188 RAMBlock *block = NULL;
4189 void *dst_host;
4190 void *src_host;
4191 unsigned long offset = 0;
4192
zhanghailiangd1955d22018-09-03 12:38:55 +08004193 memory_global_dirty_log_sync();
4194 rcu_read_lock();
Yury Kotovfbd162e2019-02-15 20:45:46 +03004195 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Wei Yangbf212972019-04-30 11:44:10 +08004196 migration_bitmap_sync_range(ram_state, block, block->used_length);
zhanghailiangd1955d22018-09-03 12:38:55 +08004197 }
4198 rcu_read_unlock();
4199
Zhang Chene6f4aa12018-09-03 12:38:50 +08004200 trace_colo_flush_ram_cache_begin(ram_state->migration_dirty_pages);
4201 rcu_read_lock();
4202 block = QLIST_FIRST_RCU(&ram_list.blocks);
4203
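    /*
     * Walk the dirty bitmap of every block and copy each dirty page
     * from the colo_cache back into the SVM's RAM.
     */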
4204 while (block) {
4205 offset = migration_bitmap_find_dirty(ram_state, block, offset);
4206
4207 if (offset << TARGET_PAGE_BITS >= block->used_length) {
4208 offset = 0;
4209 block = QLIST_NEXT_RCU(block, next);
4210 } else {
4211 migration_bitmap_clear_dirty(ram_state, block, offset);
4212 dst_host = block->host + (offset << TARGET_PAGE_BITS);
4213 src_host = block->colo_cache + (offset << TARGET_PAGE_BITS);
4214 memcpy(dst_host, src_host, TARGET_PAGE_SIZE);
4215 }
4216 }
4217
4218 rcu_read_unlock();
4219 trace_colo_flush_ram_cache_end();
4220}
4221
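/**
 * ram_load: load RAM pages from the migration stream
 *
 * Returns 0 for success or a negative error code
 *
 * The whole loading loop runs inside one RCU critical section; in
 * postcopy mode the per-page work is delegated to ram_load_postcopy().
 *
 * @f: QEMUFile to receive the data from
 * @opaque: RAMState pointer
 * @version_id: stream version, only 4 is accepted
 */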
Juan Quintela56e93d22015-05-07 19:33:31 +02004222static int ram_load(QEMUFile *f, void *opaque, int version_id)
4223{
Juan Quintelaedc60122016-11-02 12:40:46 +01004224 int flags = 0, ret = 0, invalid_flags = 0;
Juan Quintela56e93d22015-05-07 19:33:31 +02004225 static uint64_t seq_iter;
4226 int len = 0;
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004227 /*
4228 * If system is running in postcopy mode, page inserts to host memory must
4229 * be atomic
4230 */
Daniel Henrique Barbozaacab30b2017-11-16 20:35:26 -02004231 bool postcopy_running = postcopy_is_running();
Dr. David Alan Gilbertef08fb32017-02-24 18:28:30 +00004232 /* ADVISE is earlier, it shows the source has the postcopy capability on */
Daniel Henrique Barbozaacab30b2017-11-16 20:35:26 -02004233 bool postcopy_advised = postcopy_is_advised();
Juan Quintela56e93d22015-05-07 19:33:31 +02004234
4235 seq_iter++;
4236
4237 if (version_id != 4) {
4238 ret = -EINVAL;
4239 }
4240
Juan Quintelaedc60122016-11-02 12:40:46 +01004241 if (!migrate_use_compression()) {
4242 invalid_flags |= RAM_SAVE_FLAG_COMPRESS_PAGE;
4243 }
Juan Quintela56e93d22015-05-07 19:33:31 +02004244 /* This RCU critical section can be very long running.
4245 * If RCU reclamations in this code become numerous,
4246 * it will be necessary to reduce the granularity of this
4247 * critical section.
4248 */
4249 rcu_read_lock();
Dr. David Alan Gilberta7180872015-11-05 18:11:11 +00004250
4251 if (postcopy_running) {
4252 ret = ram_load_postcopy(f);
4253 }
4254
4255 while (!postcopy_running && !ret && !(flags & RAM_SAVE_FLAG_EOS)) {
Juan Quintela56e93d22015-05-07 19:33:31 +02004256 ram_addr_t addr, total_ram_bytes;
Dr. David Alan Gilberta776aa12015-11-05 18:10:39 +00004257 void *host = NULL;
Juan Quintela56e93d22015-05-07 19:33:31 +02004258 uint8_t ch;
4259
4260 addr = qemu_get_be64(f);
4261 flags = addr & ~TARGET_PAGE_MASK;
4262 addr &= TARGET_PAGE_MASK;
4263
Juan Quintelaedc60122016-11-02 12:40:46 +01004264 if (flags & invalid_flags) {
4265 if (flags & invalid_flags & RAM_SAVE_FLAG_COMPRESS_PAGE) {
4266 error_report("Received an unexpected compressed page");
4267 }
4268
4269 ret = -EINVAL;
4270 break;
4271 }
4272
Juan Quintelabb890ed2017-04-28 09:39:55 +02004273 if (flags & (RAM_SAVE_FLAG_ZERO | RAM_SAVE_FLAG_PAGE |
Dr. David Alan Gilberta776aa12015-11-05 18:10:39 +00004274 RAM_SAVE_FLAG_COMPRESS_PAGE | RAM_SAVE_FLAG_XBZRLE)) {
zhanghailiang4c4bad42016-01-15 11:37:41 +08004275 RAMBlock *block = ram_block_from_stream(f, flags);
4276
Zhang Chen13af18f2018-09-03 12:38:48 +08004277 /*
4278 * After going into COLO, we should load the page into colo_cache.
4279 */
4280 if (migration_incoming_in_colo_state()) {
4281 host = colo_cache_from_block_offset(block, addr);
4282 } else {
4283 host = host_from_ram_block_offset(block, addr);
4284 }
Dr. David Alan Gilberta776aa12015-11-05 18:10:39 +00004285 if (!host) {
4286 error_report("Illegal RAM offset " RAM_ADDR_FMT, addr);
4287 ret = -EINVAL;
4288 break;
4289 }
Zhang Chen13af18f2018-09-03 12:38:48 +08004290
4291 if (!migration_incoming_in_colo_state()) {
4292 ramblock_recv_bitmap_set(block, host);
4293 }
4294
Dr. David Alan Gilbert1db9d8e2017-04-26 19:37:21 +01004295 trace_ram_load_loop(block->idstr, (uint64_t)addr, flags, host);
Dr. David Alan Gilberta776aa12015-11-05 18:10:39 +00004296 }
4297
Juan Quintela56e93d22015-05-07 19:33:31 +02004298 switch (flags & ~RAM_SAVE_FLAG_CONTINUE) {
4299 case RAM_SAVE_FLAG_MEM_SIZE:
4300 /* Synchronize RAM block list */
4301 total_ram_bytes = addr;
4302 while (!ret && total_ram_bytes) {
4303 RAMBlock *block;
Juan Quintela56e93d22015-05-07 19:33:31 +02004304 char id[256];
4305 ram_addr_t length;
4306
4307 len = qemu_get_byte(f);
4308 qemu_get_buffer(f, (uint8_t *)id, len);
4309 id[len] = 0;
4310 length = qemu_get_be64(f);
4311
Dr. David Alan Gilberte3dd7492015-11-05 18:10:33 +00004312 block = qemu_ram_block_by_name(id);
Cédric Le Goaterb895de52018-05-14 08:57:00 +02004313 if (block && !qemu_ram_is_migratable(block)) {
4314 error_report("block %s should not be migrated !", id);
4315 ret = -EINVAL;
4316 } else if (block) {
Dr. David Alan Gilberte3dd7492015-11-05 18:10:33 +00004317 if (length != block->used_length) {
4318 Error *local_err = NULL;
Juan Quintela56e93d22015-05-07 19:33:31 +02004319
Gongleifa53a0e2016-05-10 10:04:59 +08004320 ret = qemu_ram_resize(block, length,
Dr. David Alan Gilberte3dd7492015-11-05 18:10:33 +00004321 &local_err);
4322 if (local_err) {
4323 error_report_err(local_err);
Juan Quintela56e93d22015-05-07 19:33:31 +02004324 }
Juan Quintela56e93d22015-05-07 19:33:31 +02004325 }
Dr. David Alan Gilbertef08fb32017-02-24 18:28:30 +00004326 /* For postcopy we need to check hugepage sizes match */
4327 if (postcopy_advised &&
4328 block->page_size != qemu_host_page_size) {
4329 uint64_t remote_page_size = qemu_get_be64(f);
4330 if (remote_page_size != block->page_size) {
4331 error_report("Mismatched RAM page size %s "
4332 "(local) %zd != %" PRId64,
4333 id, block->page_size,
4334 remote_page_size);
4335 ret = -EINVAL;
4336 }
4337 }
Yury Kotovfbd162e2019-02-15 20:45:46 +03004338 if (migrate_ignore_shared()) {
4339 hwaddr addr = qemu_get_be64(f);
4340 bool ignored = qemu_get_byte(f);
4341 if (ignored != ramblock_is_ignored(block)) {
4342 error_report("RAM block %s should %s be migrated",
4343 id, ignored ? "" : "not");
4344 ret = -EINVAL;
4345 }
4346 if (ramblock_is_ignored(block) &&
4347 block->mr->addr != addr) {
4348 error_report("Mismatched GPAs for block %s "
4349 "%" PRId64 "!= %" PRId64,
4350 id, (uint64_t)addr,
4351 (uint64_t)block->mr->addr);
4352 ret = -EINVAL;
4353 }
4354 }
Dr. David Alan Gilberte3dd7492015-11-05 18:10:33 +00004355 ram_control_load_hook(f, RAM_CONTROL_BLOCK_REG,
4356 block->idstr);
4357 } else {
Juan Quintela56e93d22015-05-07 19:33:31 +02004358 error_report("Unknown ramblock \"%s\", cannot "
4359 "accept migration", id);
4360 ret = -EINVAL;
4361 }
4362
4363 total_ram_bytes -= length;
4364 }
4365 break;
Dr. David Alan Gilberta776aa12015-11-05 18:10:39 +00004366
Juan Quintelabb890ed2017-04-28 09:39:55 +02004367 case RAM_SAVE_FLAG_ZERO:
Juan Quintela56e93d22015-05-07 19:33:31 +02004368 ch = qemu_get_byte(f);
4369 ram_handle_compressed(host, ch, TARGET_PAGE_SIZE);
4370 break;
Dr. David Alan Gilberta776aa12015-11-05 18:10:39 +00004371
Juan Quintela56e93d22015-05-07 19:33:31 +02004372 case RAM_SAVE_FLAG_PAGE:
Juan Quintela56e93d22015-05-07 19:33:31 +02004373 qemu_get_buffer(f, host, TARGET_PAGE_SIZE);
4374 break;
Juan Quintela56e93d22015-05-07 19:33:31 +02004375
Dr. David Alan Gilberta776aa12015-11-05 18:10:39 +00004376 case RAM_SAVE_FLAG_COMPRESS_PAGE:
Juan Quintela56e93d22015-05-07 19:33:31 +02004377 len = qemu_get_be32(f);
4378 if (len < 0 || len > compressBound(TARGET_PAGE_SIZE)) {
4379 error_report("Invalid compressed data length: %d", len);
4380 ret = -EINVAL;
4381 break;
4382 }
Dr. David Alan Gilbertc1bc6622015-12-16 11:47:38 +00004383 decompress_data_with_multi_threads(f, host, len);
Juan Quintela56e93d22015-05-07 19:33:31 +02004384 break;
Dr. David Alan Gilberta776aa12015-11-05 18:10:39 +00004385
Juan Quintela56e93d22015-05-07 19:33:31 +02004386 case RAM_SAVE_FLAG_XBZRLE:
Juan Quintela56e93d22015-05-07 19:33:31 +02004387 if (load_xbzrle(f, addr, host) < 0) {
4388 error_report("Failed to decompress XBZRLE page at "
4389 RAM_ADDR_FMT, addr);
4390 ret = -EINVAL;
4391 break;
4392 }
4393 break;
4394 case RAM_SAVE_FLAG_EOS:
4395 /* normal exit */
Juan Quintela6df264a2018-02-28 09:10:07 +01004396 multifd_recv_sync_main();
Juan Quintela56e93d22015-05-07 19:33:31 +02004397 break;
4398 default:
4399 if (flags & RAM_SAVE_FLAG_HOOK) {
Dr. David Alan Gilbert632e3a52015-06-11 18:17:23 +01004400 ram_control_load_hook(f, RAM_CONTROL_HOOK, NULL);
Juan Quintela56e93d22015-05-07 19:33:31 +02004401 } else {
4402 error_report("Unknown combination of migration flags: %#x",
4403 flags);
4404 ret = -EINVAL;
4405 }
4406 }
4407 if (!ret) {
4408 ret = qemu_file_get_error(f);
4409 }
4410 }
4411
Xiao Guangrong34ab9e92018-03-30 15:51:22 +08004412 ret |= wait_for_decompress_done();
Juan Quintela56e93d22015-05-07 19:33:31 +02004413 rcu_read_unlock();
Juan Quintela55c44462017-01-23 22:32:05 +01004414 trace_ram_load_complete(ret, seq_iter);
Zhang Chene6f4aa12018-09-03 12:38:50 +08004415
4416 if (!ret && migration_incoming_in_colo_state()) {
4417 colo_flush_ram_cache();
4418 }
Juan Quintela56e93d22015-05-07 19:33:31 +02004419 return ret;
4420}
4421
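/*
 * ram_has_postcopy: whether postcopy can be used for RAM
 *
 * Refuses postcopy if any non-ignored RAMBlock is backed by pmem,
 * otherwise follows the postcopy-ram capability.
 */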
Vladimir Sementsov-Ogievskiyc6467622017-07-10 19:30:14 +03004422static bool ram_has_postcopy(void *opaque)
4423{
Junyan He469dd512018-07-18 15:48:02 +08004424 RAMBlock *rb;
Yury Kotovfbd162e2019-02-15 20:45:46 +03004425 RAMBLOCK_FOREACH_NOT_IGNORED(rb) {
Junyan He469dd512018-07-18 15:48:02 +08004426 if (ramblock_is_pmem(rb)) {
4427 info_report("Block: %s, host: %p is a nvdimm memory, postcopy"
4428 "is not supported now!", rb->idstr, rb->host);
4429 return false;
4430 }
4431 }
4432
Vladimir Sementsov-Ogievskiyc6467622017-07-10 19:30:14 +03004433 return migrate_postcopy_ram();
4434}
4435
Peter Xuedd090c2018-05-02 18:47:32 +08004436/* Sync all the dirty bitmaps with the destination VM. */
4437static int ram_dirty_bitmap_sync_all(MigrationState *s, RAMState *rs)
4438{
4439 RAMBlock *block;
4440 QEMUFile *file = s->to_dst_file;
4441 int ramblock_count = 0;
4442
4443 trace_ram_dirty_bitmap_sync_start();
4444
Yury Kotovfbd162e2019-02-15 20:45:46 +03004445 RAMBLOCK_FOREACH_NOT_IGNORED(block) {
Peter Xuedd090c2018-05-02 18:47:32 +08004446 qemu_savevm_send_recv_bitmap(file, block->idstr);
4447 trace_ram_dirty_bitmap_request(block->idstr);
4448 ramblock_count++;
4449 }
4450
4451 trace_ram_dirty_bitmap_sync_wait();
4452
4453 /* Wait until all the ramblocks' dirty bitmap synced */
4454 while (ramblock_count--) {
4455 qemu_sem_wait(&s->rp_state.rp_sem);
4456 }
4457
4458 trace_ram_dirty_bitmap_sync_complete();
4459
4460 return 0;
4461}
4462
4463static void ram_dirty_bitmap_reload_notify(MigrationState *s)
4464{
4465 qemu_sem_post(&s->rp_state.rp_sem);
4466}
4467
Peter Xua335deb2018-05-02 18:47:28 +08004468/*
4469 * Read the received bitmap, revert it as the initial dirty bitmap.
4470 * This is only used when the postcopy migration is paused but wants
4471 * to resume from a middle point.
4472 */
4473int ram_dirty_bitmap_reload(MigrationState *s, RAMBlock *block)
4474{
4475 int ret = -EINVAL;
4476 QEMUFile *file = s->rp_state.from_dst_file;
4477 unsigned long *le_bitmap, nbits = block->used_length >> TARGET_PAGE_BITS;
Peter Xua725ef92018-07-10 17:18:55 +08004478 uint64_t local_size = DIV_ROUND_UP(nbits, 8);
Peter Xua335deb2018-05-02 18:47:28 +08004479 uint64_t size, end_mark;
4480
4481 trace_ram_dirty_bitmap_reload_begin(block->idstr);
4482
4483 if (s->state != MIGRATION_STATUS_POSTCOPY_RECOVER) {
4484 error_report("%s: incorrect state %s", __func__,
4485 MigrationStatus_str(s->state));
4486 return -EINVAL;
4487 }
4488
4489 /*
4490 * Note: see comments in ramblock_recv_bitmap_send() on why we
4491 * need the endianness conversion, and the paddings.
4492 */
4493 local_size = ROUND_UP(local_size, 8);
4494
4495 /* Add paddings */
4496 le_bitmap = bitmap_new(nbits + BITS_PER_LONG);
4497
4498 size = qemu_get_be64(file);
4499
4500 /* The size of the bitmap should match with our ramblock */
4501 if (size != local_size) {
4502 error_report("%s: ramblock '%s' bitmap size mismatch "
4503 "(0x%"PRIx64" != 0x%"PRIx64")", __func__,
4504 block->idstr, size, local_size);
4505 ret = -EINVAL;
4506 goto out;
4507 }
4508
4509 size = qemu_get_buffer(file, (uint8_t *)le_bitmap, local_size);
4510 end_mark = qemu_get_be64(file);
4511
4512 ret = qemu_file_get_error(file);
4513 if (ret || size != local_size) {
4514 error_report("%s: read bitmap failed for ramblock '%s': %d"
4515 " (size 0x%"PRIx64", got: 0x%"PRIx64")",
4516 __func__, block->idstr, ret, local_size, size);
4517 ret = -EIO;
4518 goto out;
4519 }
4520
4521 if (end_mark != RAMBLOCK_RECV_BITMAP_ENDING) {
4522 error_report("%s: ramblock '%s' end mark incorrect: 0x%"PRIu64,
4523 __func__, block->idstr, end_mark);
4524 ret = -EINVAL;
4525 goto out;
4526 }
4527
4528 /*
4529 * Endianness conversion. We are in postcopy (though paused).
4530 * The dirty bitmap won't change. We can directly modify it.
4531 */
4532 bitmap_from_le(block->bmap, le_bitmap, nbits);
4533
4534 /*
4535 * What we received is "received bitmap". Revert it as the initial
4536 * dirty bitmap for this ramblock.
4537 */
4538 bitmap_complement(block->bmap, block->bmap, nbits);
4539
4540 trace_ram_dirty_bitmap_reload_complete(block->idstr);
4541
Peter Xuedd090c2018-05-02 18:47:32 +08004542 /*
4543 * We succeeded in syncing the bitmap for the current ramblock. If this is
4544 * the last one to sync, we need to notify the main send thread.
4545 */
4546 ram_dirty_bitmap_reload_notify(s);
4547
Peter Xua335deb2018-05-02 18:47:28 +08004548 ret = 0;
4549out:
Peter Xubf269902018-05-25 09:50:42 +08004550 g_free(le_bitmap);
Peter Xua335deb2018-05-02 18:47:28 +08004551 return ret;
4552}
4553
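/*
 * ram_resume_prepare: prepare for a postcopy recovery
 *
 * Re-syncs the dirty bitmaps with the destination and then prepares
 * the RAMState for resuming the interrupted migration.
 */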
Peter Xuedd090c2018-05-02 18:47:32 +08004554static int ram_resume_prepare(MigrationState *s, void *opaque)
4555{
4556 RAMState *rs = *(RAMState **)opaque;
Peter Xu08614f32018-05-02 18:47:33 +08004557 int ret;
Peter Xuedd090c2018-05-02 18:47:32 +08004558
Peter Xu08614f32018-05-02 18:47:33 +08004559 ret = ram_dirty_bitmap_sync_all(s, rs);
4560 if (ret) {
4561 return ret;
4562 }
4563
4564 ram_state_resume_prepare(rs, s->to_dst_file);
4565
4566 return 0;
Peter Xuedd090c2018-05-02 18:47:32 +08004567}
4568
Juan Quintela56e93d22015-05-07 19:33:31 +02004569static SaveVMHandlers savevm_ram_handlers = {
Juan Quintela9907e842017-06-28 11:52:24 +02004570 .save_setup = ram_save_setup,
Juan Quintela56e93d22015-05-07 19:33:31 +02004571 .save_live_iterate = ram_save_iterate,
Dr. David Alan Gilbert763c9062015-11-05 18:11:00 +00004572 .save_live_complete_postcopy = ram_save_complete,
Dr. David Alan Gilberta3e06c32015-11-05 18:10:41 +00004573 .save_live_complete_precopy = ram_save_complete,
Vladimir Sementsov-Ogievskiyc6467622017-07-10 19:30:14 +03004574 .has_postcopy = ram_has_postcopy,
Juan Quintela56e93d22015-05-07 19:33:31 +02004575 .save_live_pending = ram_save_pending,
4576 .load_state = ram_load,
Juan Quintelaf265e0e2017-06-28 11:52:27 +02004577 .save_cleanup = ram_save_cleanup,
4578 .load_setup = ram_load_setup,
4579 .load_cleanup = ram_load_cleanup,
Peter Xuedd090c2018-05-02 18:47:32 +08004580 .resume_prepare = ram_resume_prepare,
Juan Quintela56e93d22015-05-07 19:33:31 +02004581};
4582
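/*
 * ram_mig_init: register the "ram" live migration section (version 4)
 * with the handlers defined above.
 */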
4583void ram_mig_init(void)
4584{
4585 qemu_mutex_init(&XBZRLE.lock);
Juan Quintela6f37bb82017-03-13 19:26:29 +01004586 register_savevm_live(NULL, "ram", 0, 4, &savevm_ram_handlers, &ram_state);
Juan Quintela56e93d22015-05-07 19:33:31 +02004587}