diff --git a/migration/ram.c b/migration/ram.c
index c07a9c08d94d0449609a37a0272cae2389f563b2..8620aa400ab80a3ce7be41cddf86fb6ccb5ebb67 100644
--- a/migration/ram.c
+++ b/migration/ram.c
  * THE SOFTWARE.
  */
 #include "qemu/osdep.h"
-#include "qemu-common.h"
 #include "cpu.h"
 #include <zlib.h>
 #include "qapi-event.h"
 #include "qemu/cutils.h"
 #include "qemu/bitops.h"
 #include "qemu/bitmap.h"
-#include "qemu/timer.h"
 #include "qemu/main-loop.h"
 #include "xbzrle.h"
-#include "migration/migration.h"
-#include "migration/qemu-file.h"
-#include "migration/vmstate.h"
+#include "ram.h"
+#include "migration.h"
+#include "migration/register.h"
+#include "migration/misc.h"
+#include "qemu-file.h"
 #include "postcopy-ram.h"
-#include "exec/address-spaces.h"
 #include "migration/page_cache.h"
 #include "qemu/error-report.h"
+#include "qapi/qmp/qerror.h"
 #include "trace.h"
 #include "exec/ram_addr.h"
+#include "exec/target_page.h"
 #include "qemu/rcu_queue.h"
 #include "migration/colo.h"
+#include "migration/block.h"
 
 /***********************************************************/
 /* ram save/restore */
 /* 0x80 is reserved in migration.h; start with 0x100 next */
 #define RAM_SAVE_FLAG_COMPRESS_PAGE    0x100
 
-static uint8_t *ZERO_TARGET_PAGE;
-
 static inline bool is_zero_range(uint8_t *p, uint64_t size)
 {
     return buffer_is_zero(p, size);
 }
 
+XBZRLECacheStats xbzrle_counters;
+
 /* This struct contains the XBZRLE cache and a static page
    used by the compression */
 static struct {
@@ -84,11 +86,12 @@ static struct {
     /* Cache for XBZRLE, Protected by lock. */
     PageCache *cache;
     QemuMutex lock;
+    /* it will store a page full of zeros */
+    uint8_t *zero_target_page;
+    /* buffer used for XBZRLE decoding */
+    uint8_t *decoded_buf;
 } XBZRLE;
 
-/* buffer used for XBZRLE decoding */
-static uint8_t *xbzrle_decoded_buf;
-
 static void XBZRLE_cache_lock(void)
 {
     if (migrate_use_xbzrle())
@@ -109,29 +112,33 @@ static void XBZRLE_cache_unlock(void)
  * migration may be using the cache and might finish during this call,
  * hence changes to the cache are protected by XBZRLE.lock().
  *
- * Returns the new_size or negative in case of error.
+ * Returns 0 for success or -1 for error
  *
  * @new_size: new cache size
+ * @errp: set *errp if the check fails, with the reason
  */
-int64_t xbzrle_cache_resize(int64_t new_size)
+int xbzrle_cache_resize(int64_t new_size, Error **errp)
 {
     PageCache *new_cache;
-    int64_t ret;
+    int64_t ret = 0;
 
-    if (new_size < TARGET_PAGE_SIZE) {
+    /* Check for truncation */
+    if (new_size != (size_t)new_size) {
+        error_setg(errp, QERR_INVALID_PARAMETER_VALUE, "cache size",
+                   "exceeding address space");
         return -1;
     }
 
+    if (new_size == migrate_xbzrle_cache_size()) {
+        /* nothing to do */
+        return 0;
+    }
+
     XBZRLE_cache_lock();
 
     if (XBZRLE.cache != NULL) {
-        if (pow2floor(new_size) == migrate_xbzrle_cache_size()) {
-            goto out_new_size;
-        }
-        new_cache = cache_init(new_size / TARGET_PAGE_SIZE,
-                                        TARGET_PAGE_SIZE);
+        new_cache = cache_init(new_size, TARGET_PAGE_SIZE, errp);
         if (!new_cache) {
-            error_report("Error creating cache");
             ret = -1;
             goto out;
         }
@@ -139,14 +146,40 @@ int64_t xbzrle_cache_resize(int64_t new_size)
         cache_fini(XBZRLE.cache);
         XBZRLE.cache = new_cache;
     }
-
-out_new_size:
-    ret = pow2floor(new_size);
 out:
     XBZRLE_cache_unlock();
     return ret;
 }
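
The new_size != (size_t)new_size test added above guards against truncation when the int64_t cache size is narrowed to size_t for the allocator, which matters on 32-bit hosts. A minimal standalone sketch of the same check, with no QEMU dependencies:

#include <stdint.h>
#include <stdio.h>

/* True if 'value' survives a round-trip through size_t, i.e. it can be
 * handed to an allocator without truncation. */
static int fits_in_size_t(int64_t value)
{
    return value == (int64_t)(size_t)value;
}

int main(void)
{
    /* With a 4-byte size_t (32-bit host), 8 GiB would be truncated and
     * this prints 0; with an 8-byte size_t it prints 1. */
    printf("%d\n", fits_in_size_t(INT64_C(8) << 30));
    return 0;
}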
 
+static void ramblock_recv_map_init(void)
+{
+    RAMBlock *rb;
+
+    RAMBLOCK_FOREACH(rb) {
+        assert(!rb->receivedmap);
+        rb->receivedmap = bitmap_new(rb->max_length >> qemu_target_page_bits());
+    }
+}
+
+int ramblock_recv_bitmap_test(RAMBlock *rb, void *host_addr)
+{
+    return test_bit(ramblock_recv_bitmap_offset(host_addr, rb),
+                    rb->receivedmap);
+}
+
+void ramblock_recv_bitmap_set(RAMBlock *rb, void *host_addr)
+{
+    set_bit_atomic(ramblock_recv_bitmap_offset(host_addr, rb), rb->receivedmap);
+}
+
+void ramblock_recv_bitmap_set_range(RAMBlock *rb, void *host_addr,
+                                    size_t nr)
+{
+    bitmap_set_atomic(rb->receivedmap,
+                      ramblock_recv_bitmap_offset(host_addr, rb),
+                      nr);
+}
+
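ramblock_recv_bitmap_offset() itself is not part of this hunk; presumably it maps a host pointer back to a target-page index within its RAMBlock. A self-contained sketch of the receivedmap bookkeeping under that assumption (the helper names here are illustrative, not QEMU's):

#include <limits.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>

#define PAGE_BITS 12                          /* assumption: 4 KiB pages */
#define BITS_PER_LONG (sizeof(unsigned long) * CHAR_BIT)

/* Stand-in for ramblock_recv_bitmap_offset(): host address -> page index */
static unsigned long recv_offset(uint8_t *host, uint8_t *block_host)
{
    return (unsigned long)(host - block_host) >> PAGE_BITS;
}

static void recv_set(unsigned long *map, unsigned long nr)
{
    map[nr / BITS_PER_LONG] |= 1UL << (nr % BITS_PER_LONG);
}

static int recv_test(const unsigned long *map, unsigned long nr)
{
    return !!(map[nr / BITS_PER_LONG] & (1UL << (nr % BITS_PER_LONG)));
}

int main(void)
{
    enum { PAGES = 64 };
    uint8_t *ram = calloc(PAGES << PAGE_BITS, 1);
    unsigned long map[PAGES / BITS_PER_LONG + 1] = { 0 };

    /* Mark the page containing a just-written host address as received. */
    recv_set(map, recv_offset(ram + (5 << PAGE_BITS) + 123, ram));
    printf("page 5 received: %d\n", recv_test(map, 5));    /* prints 1 */
    free(ram);
    return 0;
}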
 /*
  * An outstanding page request, on the source, having been received
  * and queued
@@ -175,8 +208,6 @@ struct RAMState {
     bool ram_bulk_stage;
     /* How many times we have dirty too many pages */
     int dirty_rate_high_cnt;
-    /* How many times we have synchronized the bitmap */
-    uint64_t bitmap_sync_count;
     /* these variables are used for bitmap sync */
     /* last time we did a full bitmap_sync */
     int64_t time_last_bitmap_sync;
@@ -188,32 +219,10 @@ struct RAMState {
     uint64_t xbzrle_cache_miss_prev;
     /* number of iterations at the beginning of period */
     uint64_t iterations_prev;
-    /* Accounting fields */
-    /* number of zero pages.  It used to be pages filled by the same char. */
-    uint64_t zero_pages;
-    /* number of normal transferred pages */
-    uint64_t norm_pages;
     /* Iterations since start */
     uint64_t iterations;
-    /* xbzrle transmitted bytes.  Notice that this is with
-     * compression, they can't be calculated from the pages */
-    uint64_t xbzrle_bytes;
-    /* xbzrle transmmited pages */
-    uint64_t xbzrle_pages;
-    /* xbzrle number of cache miss */
-    uint64_t xbzrle_cache_miss;
-    /* xbzrle miss rate */
-    double xbzrle_cache_miss_rate;
-    /* xbzrle number of overflows */
-    uint64_t xbzrle_overflows;
     /* number of dirty bits in the bitmap */
     uint64_t migration_dirty_pages;
-    /* total number of bytes transferred */
-    uint64_t bytes_transferred;
-    /* number of dirtied pages in the last second */
-    uint64_t dirty_pages_rate;
-    /* Count of requests incoming from destination */
-    uint64_t postcopy_requests;
     /* protects modification of the bitmap */
     QemuMutex bitmap_mutex;
     /* The RAMBlock used in the last src_page_requests */
@@ -224,67 +233,14 @@ struct RAMState {
 };
 typedef struct RAMState RAMState;
 
-static RAMState ram_state;
-
-uint64_t dup_mig_pages_transferred(void)
-{
-    return ram_state.zero_pages;
-}
-
-uint64_t norm_mig_pages_transferred(void)
-{
-    return ram_state.norm_pages;
-}
-
-uint64_t xbzrle_mig_bytes_transferred(void)
-{
-    return ram_state.xbzrle_bytes;
-}
-
-uint64_t xbzrle_mig_pages_transferred(void)
-{
-    return ram_state.xbzrle_pages;
-}
-
-uint64_t xbzrle_mig_pages_cache_miss(void)
-{
-    return ram_state.xbzrle_cache_miss;
-}
-
-double xbzrle_mig_cache_miss_rate(void)
-{
-    return ram_state.xbzrle_cache_miss_rate;
-}
-
-uint64_t xbzrle_mig_pages_overflow(void)
-{
-    return ram_state.xbzrle_overflows;
-}
-
-uint64_t ram_bytes_transferred(void)
-{
-    return ram_state.bytes_transferred;
-}
+static RAMState *ram_state;
 
 uint64_t ram_bytes_remaining(void)
 {
-    return ram_state.migration_dirty_pages * TARGET_PAGE_SIZE;
-}
-
-uint64_t ram_dirty_sync_count(void)
-{
-    return ram_state.bitmap_sync_count;
+    return ram_state->migration_dirty_pages * TARGET_PAGE_SIZE;
 }
 
-uint64_t ram_dirty_pages_rate(void)
-{
-    return ram_state.dirty_pages_rate;
-}
-
-uint64_t ram_postcopy_requests(void)
-{
-    return ram_state.postcopy_requests;
-}
+MigrationStats ram_counters;
 
 /* used by the search for pages to send */
 struct PageSearchStatus {
@@ -383,7 +339,7 @@ static inline void terminate_compression_threads(void)
     }
 }
 
-void migrate_compress_threads_join(void)
+static void compress_threads_save_cleanup(void)
 {
     int i, thread_count;
 
@@ -406,7 +362,7 @@ void migrate_compress_threads_join(void)
     comp_param = NULL;
 }
 
-void migrate_compress_threads_create(void)
+static void compress_threads_save_setup(void)
 {
     int i, thread_count;
 
@@ -433,6 +389,208 @@ void migrate_compress_threads_create(void)
     }
 }
 
+/* Multiple fds */
+
+struct MultiFDSendParams {
+    uint8_t id;
+    char *name;
+    QemuThread thread;
+    QemuSemaphore sem;
+    QemuMutex mutex;
+    bool quit;
+};
+typedef struct MultiFDSendParams MultiFDSendParams;
+
+struct {
+    MultiFDSendParams *params;
+    /* number of created threads */
+    int count;
+} *multifd_send_state;
+
+static void terminate_multifd_send_threads(Error *errp)
+{
+    int i;
+
+    for (i = 0; i < multifd_send_state->count; i++) {
+        MultiFDSendParams *p = &multifd_send_state->params[i];
+
+        qemu_mutex_lock(&p->mutex);
+        p->quit = true;
+        qemu_sem_post(&p->sem);
+        qemu_mutex_unlock(&p->mutex);
+    }
+}
+
+int multifd_save_cleanup(Error **errp)
+{
+    int i;
+    int ret = 0;
+
+    if (!migrate_use_multifd()) {
+        return 0;
+    }
+    terminate_multifd_send_threads(NULL);
+    for (i = 0; i < multifd_send_state->count; i++) {
+        MultiFDSendParams *p = &multifd_send_state->params[i];
+
+        qemu_thread_join(&p->thread);
+        qemu_mutex_destroy(&p->mutex);
+        qemu_sem_destroy(&p->sem);
+        g_free(p->name);
+        p->name = NULL;
+    }
+    g_free(multifd_send_state->params);
+    multifd_send_state->params = NULL;
+    g_free(multifd_send_state);
+    multifd_send_state = NULL;
+    return ret;
+}
+
+static void *multifd_send_thread(void *opaque)
+{
+    MultiFDSendParams *p = opaque;
+
+    while (true) {
+        qemu_mutex_lock(&p->mutex);
+        if (p->quit) {
+            qemu_mutex_unlock(&p->mutex);
+            break;
+        }
+        qemu_mutex_unlock(&p->mutex);
+        qemu_sem_wait(&p->sem);
+    }
+
+    return NULL;
+}
+
+int multifd_save_setup(void)
+{
+    int thread_count;
+    uint8_t i;
+
+    if (!migrate_use_multifd()) {
+        return 0;
+    }
+    thread_count = migrate_multifd_channels();
+    multifd_send_state = g_malloc0(sizeof(*multifd_send_state));
+    multifd_send_state->params = g_new0(MultiFDSendParams, thread_count);
+    multifd_send_state->count = 0;
+    for (i = 0; i < thread_count; i++) {
+        MultiFDSendParams *p = &multifd_send_state->params[i];
+
+        qemu_mutex_init(&p->mutex);
+        qemu_sem_init(&p->sem, 0);
+        p->quit = false;
+        p->id = i;
+        p->name = g_strdup_printf("multifdsend_%d", i);
+        qemu_thread_create(&p->thread, p->name, multifd_send_thread, p,
+                           QEMU_THREAD_JOINABLE);
+
+        multifd_send_state->count++;
+    }
+    return 0;
+}
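
Each multifd worker above parks on its semaphore until it is given work or asked to quit. The same quit/wake handshake, reduced to plain POSIX primitives as an illustration (sem_t standing in for QemuSemaphore, a mutex-protected flag for p->quit):

#include <pthread.h>
#include <semaphore.h>
#include <stdbool.h>
#include <stdio.h>

typedef struct {
    pthread_mutex_t mutex;
    sem_t sem;
    bool quit;
} Worker;

static void *worker_thread(void *opaque)
{
    Worker *w = opaque;

    for (;;) {
        pthread_mutex_lock(&w->mutex);
        if (w->quit) {
            pthread_mutex_unlock(&w->mutex);
            break;
        }
        pthread_mutex_unlock(&w->mutex);
        sem_wait(&w->sem);              /* park until woken */
    }
    return NULL;
}

int main(void)
{
    Worker w = { .quit = false };
    pthread_t t;

    pthread_mutex_init(&w.mutex, NULL);
    sem_init(&w.sem, 0, 0);
    pthread_create(&t, NULL, worker_thread, &w);

    /* The terminate_multifd_*_threads() equivalent: flag, then wake. */
    pthread_mutex_lock(&w.mutex);
    w.quit = true;
    sem_post(&w.sem);
    pthread_mutex_unlock(&w.mutex);

    pthread_join(t, NULL);
    puts("worker joined");
    return 0;
}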
+
+struct MultiFDRecvParams {
+    uint8_t id;
+    char *name;
+    QemuThread thread;
+    QemuSemaphore sem;
+    QemuMutex mutex;
+    bool quit;
+};
+typedef struct MultiFDRecvParams MultiFDRecvParams;
+
+struct {
+    MultiFDRecvParams *params;
+    /* number of created threads */
+    int count;
+} *multifd_recv_state;
+
+static void terminate_multifd_recv_threads(Error *errp)
+{
+    int i;
+
+    for (i = 0; i < multifd_recv_state->count; i++) {
+        MultiFDRecvParams *p = &multifd_recv_state->params[i];
+
+        qemu_mutex_lock(&p->mutex);
+        p->quit = true;
+        qemu_sem_post(&p->sem);
+        qemu_mutex_unlock(&p->mutex);
+    }
+}
+
+int multifd_load_cleanup(Error **errp)
+{
+    int i;
+    int ret = 0;
+
+    if (!migrate_use_multifd()) {
+        return 0;
+    }
+    terminate_multifd_recv_threads(NULL);
+    for (i = 0; i < multifd_recv_state->count; i++) {
+        MultiFDRecvParams *p = &multifd_recv_state->params[i];
+
+        qemu_thread_join(&p->thread);
+        qemu_mutex_destroy(&p->mutex);
+        qemu_sem_destroy(&p->sem);
+        g_free(p->name);
+        p->name = NULL;
+    }
+    g_free(multifd_recv_state->params);
+    multifd_recv_state->params = NULL;
+    g_free(multifd_recv_state);
+    multifd_recv_state = NULL;
+
+    return ret;
+}
+
+static void *multifd_recv_thread(void *opaque)
+{
+    MultiFDRecvParams *p = opaque;
+
+    while (true) {
+        qemu_mutex_lock(&p->mutex);
+        if (p->quit) {
+            qemu_mutex_unlock(&p->mutex);
+            break;
+        }
+        qemu_mutex_unlock(&p->mutex);
+        qemu_sem_wait(&p->sem);
+    }
+
+    return NULL;
+}
+
+int multifd_load_setup(void)
+{
+    int thread_count;
+    uint8_t i;
+
+    if (!migrate_use_multifd()) {
+        return 0;
+    }
+    thread_count = migrate_multifd_channels();
+    multifd_recv_state = g_malloc0(sizeof(*multifd_recv_state));
+    multifd_recv_state->params = g_new0(MultiFDRecvParams, thread_count);
+    multifd_recv_state->count = 0;
+    for (i = 0; i < thread_count; i++) {
+        MultiFDRecvParams *p = &multifd_recv_state->params[i];
+
+        qemu_mutex_init(&p->mutex);
+        qemu_sem_init(&p->sem, 0);
+        p->quit = false;
+        p->id = i;
+        p->name = g_strdup_printf("multifdrecv_%d", i);
+        qemu_thread_create(&p->thread, p->name, multifd_recv_thread, p,
+                           QEMU_THREAD_JOINABLE);
+        multifd_recv_state->count++;
+    }
+    return 0;
+}
+
 /**
  * save_page_header: write page header to wire
  *
@@ -510,8 +668,8 @@ static void xbzrle_cache_zero_page(RAMState *rs, ram_addr_t current_addr)
 
     /* We don't care if this fails to allocate a new cache page
      * as long as it updates an old one */
-    cache_insert(XBZRLE.cache, current_addr, ZERO_TARGET_PAGE,
-                 rs->bitmap_sync_count);
+    cache_insert(XBZRLE.cache, current_addr, XBZRLE.zero_target_page,
+                 ram_counters.dirty_sync_count);
 }
 
 #define ENCODING_FLAG_XBZRLE 0x1
@@ -537,11 +695,12 @@ static int save_xbzrle_page(RAMState *rs, uint8_t **current_data,
     int encoded_len = 0, bytes_xbzrle;
     uint8_t *prev_cached_page;
 
-    if (!cache_is_cached(XBZRLE.cache, current_addr, rs->bitmap_sync_count)) {
-        rs->xbzrle_cache_miss++;
+    if (!cache_is_cached(XBZRLE.cache, current_addr,
+                         ram_counters.dirty_sync_count)) {
+        xbzrle_counters.cache_miss++;
         if (!last_stage) {
             if (cache_insert(XBZRLE.cache, current_addr, *current_data,
-                             rs->bitmap_sync_count) == -1) {
+                             ram_counters.dirty_sync_count) == -1) {
                 return -1;
             } else {
                 /* update *current_data when the page has been
@@ -566,7 +725,7 @@ static int save_xbzrle_page(RAMState *rs, uint8_t **current_data,
         return 0;
     } else if (encoded_len == -1) {
         trace_save_xbzrle_page_overflow();
-        rs->xbzrle_overflows++;
+        xbzrle_counters.overflow++;
         /* update data in the cache */
         if (!last_stage) {
             memcpy(prev_cached_page, *current_data, TARGET_PAGE_SIZE);
@@ -587,9 +746,9 @@ static int save_xbzrle_page(RAMState *rs, uint8_t **current_data,
     qemu_put_be16(rs->f, encoded_len);
     qemu_put_buffer(rs->f, XBZRLE.encoded_buf, encoded_len);
     bytes_xbzrle += encoded_len + 1 + 2;
-    rs->xbzrle_pages++;
-    rs->xbzrle_bytes += bytes_xbzrle;
-    rs->bytes_transferred += bytes_xbzrle;
+    xbzrle_counters.pages++;
+    xbzrle_counters.bytes += bytes_xbzrle;
+    ram_counters.transferred += bytes_xbzrle;
 
     return 1;
 }
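
On the wire, each XBZRLE page costs the generic page header plus one encoding-flag byte, a big-endian 16-bit length, and the encoded payload, which is where the encoded_len + 1 + 2 accounting above comes from. A sketch of just that record layout (buffer management and the page header omitted):

#include <stdint.h>
#include <stdio.h>
#include <string.h>

#define ENCODING_FLAG_XBZRLE 0x1

/* Serialize one XBZRLE record the way save_xbzrle_page() does: flag byte,
 * big-endian 16-bit length, then the payload. Returns bytes written. */
static size_t put_xbzrle_record(uint8_t *out, const uint8_t *enc, uint16_t len)
{
    out[0] = ENCODING_FLAG_XBZRLE;
    out[1] = len >> 8;                  /* qemu_put_be16() equivalent */
    out[2] = len & 0xff;
    memcpy(out + 3, enc, len);
    return (size_t)len + 1 + 2;
}

int main(void)
{
    uint8_t payload[130] = { 0 }, wire[4096];

    /* A page XBZRLE squeezed down to 130 bytes costs 133 on the wire. */
    printf("%zu bytes\n", put_xbzrle_record(wire, payload, sizeof(payload)));
    return 0;
}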
@@ -671,11 +830,7 @@ static void migration_bitmap_sync(RAMState *rs)
     int64_t end_time;
     uint64_t bytes_xfer_now;
 
-    rs->bitmap_sync_count++;
-
-    if (!rs->bytes_xfer_prev) {
-        rs->bytes_xfer_prev = ram_bytes_transferred();
-    }
+    ram_counters.dirty_sync_count++;
 
     if (!rs->time_last_bitmap_sync) {
         rs->time_last_bitmap_sync = qemu_clock_get_ms(QEMU_CLOCK_REALTIME);
@@ -698,42 +853,48 @@ static void migration_bitmap_sync(RAMState *rs)
 
     /* more than 1 second = 1000 milliseconds */
     if (end_time > rs->time_last_bitmap_sync + 1000) {
-        if (migrate_auto_converge()) {
+        /* calculate period counters */
+        ram_counters.dirty_pages_rate = rs->num_dirty_pages_period * 1000
+            / (end_time - rs->time_last_bitmap_sync);
+        bytes_xfer_now = ram_counters.transferred;
+
+        /* During block migration the auto-converge logic incorrectly detects
+         * that ram migration makes no progress. Avoid this by disabling the
+         * throttling logic during the bulk phase of block migration. */
+        if (migrate_auto_converge() && !blk_mig_bulk_active()) {
             /* The following detection logic can be refined later. For now:
                Check to see if the dirtied bytes is 50% more than the approx.
                amount of bytes that just got transferred since the last time we
                were in this routine. If that happens twice, start or increase
                throttling */
-            bytes_xfer_now = ram_bytes_transferred();
 
-            if (rs->dirty_pages_rate &&
-               (rs->num_dirty_pages_period * TARGET_PAGE_SIZE >
+            if ((rs->num_dirty_pages_period * TARGET_PAGE_SIZE >
                    (bytes_xfer_now - rs->bytes_xfer_prev) / 2) &&
-               (rs->dirty_rate_high_cnt++ >= 2)) {
+                (++rs->dirty_rate_high_cnt >= 2)) {
                     trace_migration_throttle();
                     rs->dirty_rate_high_cnt = 0;
                     mig_throttle_guest_down();
-             }
-             rs->bytes_xfer_prev = bytes_xfer_now;
+            }
         }
 
         if (migrate_use_xbzrle()) {
             if (rs->iterations_prev != rs->iterations) {
-                rs->xbzrle_cache_miss_rate =
-                   (double)(rs->xbzrle_cache_miss -
+                xbzrle_counters.cache_miss_rate =
+                   (double)(xbzrle_counters.cache_miss -
                             rs->xbzrle_cache_miss_prev) /
                    (rs->iterations - rs->iterations_prev);
             }
             rs->iterations_prev = rs->iterations;
-            rs->xbzrle_cache_miss_prev = rs->xbzrle_cache_miss;
+            rs->xbzrle_cache_miss_prev = xbzrle_counters.cache_miss;
         }
-        rs->dirty_pages_rate = rs->num_dirty_pages_period * 1000
-            / (end_time - rs->time_last_bitmap_sync);
+
+        /* reset period counters */
         rs->time_last_bitmap_sync = end_time;
         rs->num_dirty_pages_period = 0;
+        rs->bytes_xfer_prev = bytes_xfer_now;
     }
     if (migrate_use_events()) {
-        qapi_event_send_migration_pass(rs->bitmap_sync_count, NULL);
+        qapi_event_send_migration_pass(ram_counters.dirty_sync_count, NULL);
     }
 }
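
The auto-converge trigger above fires when the bytes dirtied during the period exceed half the bytes transferred in the same period, and only throttles on the second consecutive hit. The detection logic isolated as a pure function (the 4 KiB page size is an assumption of the sketch):

#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>

#define TARGET_PAGE_SIZE 4096

/* Dirtying outpaced transfer by the 50% mark twice in a row? Throttle. */
static bool should_throttle(uint64_t dirty_pages_period,
                            uint64_t bytes_xfer_now,
                            uint64_t bytes_xfer_prev,
                            int *dirty_rate_high_cnt)
{
    uint64_t dirtied = dirty_pages_period * TARGET_PAGE_SIZE;

    if (dirtied > (bytes_xfer_now - bytes_xfer_prev) / 2 &&
        ++*dirty_rate_high_cnt >= 2) {
        *dirty_rate_high_cnt = 0;
        return true;
    }
    return false;
}

int main(void)
{
    int cnt = 0;
    uint64_t mb = 1024 * 1024;

    /* ~400 MB dirtied vs 500 MB transferred per period: the first hit
     * arms the counter, the second one actually throttles. */
    printf("%d\n", should_throttle(100000, 500 * mb, 0, &cnt));         /* 0 */
    printf("%d\n", should_throttle(100000, 1000 * mb, 500 * mb, &cnt)); /* 1 */
    return 0;
}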
 
@@ -753,11 +914,11 @@ static int save_zero_page(RAMState *rs, RAMBlock *block, ram_addr_t offset,
     int pages = -1;
 
     if (is_zero_range(p, TARGET_PAGE_SIZE)) {
-        rs->zero_pages++;
-        rs->bytes_transferred +=
+        ram_counters.duplicate++;
+        ram_counters.transferred +=
             save_page_header(rs, rs->f, block, offset | RAM_SAVE_FLAG_ZERO);
         qemu_put_byte(rs->f, 0);
-        rs->bytes_transferred += 1;
+        ram_counters.transferred += 1;
         pages = 1;
     }
 
@@ -805,7 +966,7 @@ static int ram_save_page(RAMState *rs, PageSearchStatus *pss, bool last_stage)
     ret = ram_control_save_page(rs->f, block->offset,
                            offset, TARGET_PAGE_SIZE, &bytes_xmit);
     if (bytes_xmit) {
-        rs->bytes_transferred += bytes_xmit;
+        ram_counters.transferred += bytes_xmit;
         pages = 1;
     }
 
@@ -816,9 +977,9 @@ static int ram_save_page(RAMState *rs, PageSearchStatus *pss, bool last_stage)
     if (ret != RAM_SAVE_CONTROL_NOT_SUPP) {
         if (ret != RAM_SAVE_CONTROL_DELAYED) {
             if (bytes_xmit > 0) {
-                rs->norm_pages++;
+                ram_counters.normal++;
             } else if (bytes_xmit == 0) {
-                rs->zero_pages++;
+                ram_counters.duplicate++;
             }
         }
     } else {
@@ -844,8 +1005,8 @@ static int ram_save_page(RAMState *rs, PageSearchStatus *pss, bool last_stage)
 
     /* XBZRLE overflow or normal page */
     if (pages == -1) {
-        rs->bytes_transferred += save_page_header(rs, rs->f, block,
-                                                  offset | RAM_SAVE_FLAG_PAGE);
+        ram_counters.transferred +=
+            save_page_header(rs, rs->f, block, offset | RAM_SAVE_FLAG_PAGE);
         if (send_async) {
             qemu_put_buffer_async(rs->f, p, TARGET_PAGE_SIZE,
                                   migrate_release_ram() &
@@ -853,9 +1014,9 @@ static int ram_save_page(RAMState *rs, PageSearchStatus *pss, bool last_stage)
         } else {
             qemu_put_buffer(rs->f, p, TARGET_PAGE_SIZE);
         }
-        rs->bytes_transferred += TARGET_PAGE_SIZE;
+        ram_counters.transferred += TARGET_PAGE_SIZE;
         pages = 1;
-        rs->norm_pages++;
+        ram_counters.normal++;
     }
 
     XBZRLE_cache_unlock();
@@ -866,7 +1027,7 @@ static int ram_save_page(RAMState *rs, PageSearchStatus *pss, bool last_stage)
 static int do_compress_ram_page(QEMUFile *f, RAMBlock *block,
                                 ram_addr_t offset)
 {
-    RAMState *rs = &ram_state;
+    RAMState *rs = ram_state;
     int bytes_sent, blen;
     uint8_t *p = block->host + (offset & TARGET_PAGE_MASK);
 
@@ -907,7 +1068,7 @@ static void flush_compressed_data(RAMState *rs)
         qemu_mutex_lock(&comp_param[idx].mutex);
         if (!comp_param[idx].quit) {
             len = qemu_put_qemu_file(rs->f, comp_param[idx].file);
-            rs->bytes_transferred += len;
+            ram_counters.transferred += len;
         }
         qemu_mutex_unlock(&comp_param[idx].mutex);
     }
@@ -937,8 +1098,8 @@ static int compress_page_with_multi_thread(RAMState *rs, RAMBlock *block,
                 qemu_cond_signal(&comp_param[idx].cond);
                 qemu_mutex_unlock(&comp_param[idx].mutex);
                 pages = 1;
-                rs->norm_pages++;
-                rs->bytes_transferred += bytes_xmit;
+                ram_counters.normal++;
+                ram_counters.transferred += bytes_xmit;
                 break;
             }
         }
@@ -978,15 +1139,15 @@ static int ram_save_compressed_page(RAMState *rs, PageSearchStatus *pss,
     ret = ram_control_save_page(rs->f, block->offset,
                                 offset, TARGET_PAGE_SIZE, &bytes_xmit);
     if (bytes_xmit) {
-        rs->bytes_transferred += bytes_xmit;
+        ram_counters.transferred += bytes_xmit;
         pages = 1;
     }
     if (ret != RAM_SAVE_CONTROL_NOT_SUPP) {
         if (ret != RAM_SAVE_CONTROL_DELAYED) {
             if (bytes_xmit > 0) {
-                rs->norm_pages++;
+                ram_counters.normal++;
             } else if (bytes_xmit == 0) {
-                rs->zero_pages++;
+                ram_counters.duplicate++;
             }
         }
     } else {
@@ -1006,8 +1167,8 @@ static int ram_save_compressed_page(RAMState *rs, PageSearchStatus *pss,
                 blen = qemu_put_compression_data(rs->f, p, TARGET_PAGE_SIZE,
                                                  migrate_compress_level());
                 if (blen > 0) {
-                    rs->bytes_transferred += bytes_xmit + blen;
-                    rs->norm_pages++;
+                    ram_counters.transferred += bytes_xmit + blen;
+                    ram_counters.normal++;
                     pages = 1;
                 } else {
                     qemu_file_set_error(rs->f, blen);
@@ -1183,10 +1344,9 @@ static bool get_queued_page(RAMState *rs, PageSearchStatus *pss)
  * be some left.  If any pages are left, we drop them.
  *
  */
-void migration_page_queue_free(void)
+static void migration_page_queue_free(RAMState *rs)
 {
     struct RAMSrcPageRequest *mspr, *next_mspr;
-    RAMState *rs = &ram_state;
     /* This queue generally should be empty - but in the case of a failed
      * migration might have some droppings in.
      */
@@ -1214,9 +1374,9 @@ void migration_page_queue_free(void)
 int ram_save_queue_pages(const char *rbname, ram_addr_t start, ram_addr_t len)
 {
     RAMBlock *ramblock;
-    RAMState *rs = &ram_state;
+    RAMState *rs = ram_state;
 
-    rs->postcopy_requests++;
+    ram_counters.postcopy_requests++;
     rcu_read_lock();
     if (!rbname) {
         /* Reuse last RAMBlock */
@@ -1404,13 +1564,12 @@ static int ram_find_and_save_block(RAMState *rs, bool last_stage)
 void acct_update_position(QEMUFile *f, size_t size, bool zero)
 {
     uint64_t pages = size / TARGET_PAGE_SIZE;
-    RAMState *rs = &ram_state;
 
     if (zero) {
-        rs->zero_pages += pages;
+        ram_counters.duplicate += pages;
     } else {
-        rs->norm_pages += pages;
-        rs->bytes_transferred += size;
+        ram_counters.normal += pages;
+        ram_counters.transferred += size;
         qemu_update_position(f, size);
     }
 }
@@ -1428,14 +1587,45 @@ uint64_t ram_bytes_total(void)
     return total;
 }
 
-void free_xbzrle_decoded_buf(void)
+static void xbzrle_load_setup(void)
+{
+    XBZRLE.decoded_buf = g_malloc(TARGET_PAGE_SIZE);
+}
+
+static void xbzrle_load_cleanup(void)
 {
-    g_free(xbzrle_decoded_buf);
-    xbzrle_decoded_buf = NULL;
+    g_free(XBZRLE.decoded_buf);
+    XBZRLE.decoded_buf = NULL;
+}
+
+static void ram_state_cleanup(RAMState **rsp)
+{
+    migration_page_queue_free(*rsp);
+    qemu_mutex_destroy(&(*rsp)->bitmap_mutex);
+    qemu_mutex_destroy(&(*rsp)->src_page_req_mutex);
+    g_free(*rsp);
+    *rsp = NULL;
+}
+
+static void xbzrle_cleanup(void)
+{
+    XBZRLE_cache_lock();
+    if (XBZRLE.cache) {
+        cache_fini(XBZRLE.cache);
+        g_free(XBZRLE.encoded_buf);
+        g_free(XBZRLE.current_buf);
+        g_free(XBZRLE.zero_target_page);
+        XBZRLE.cache = NULL;
+        XBZRLE.encoded_buf = NULL;
+        XBZRLE.current_buf = NULL;
+        XBZRLE.zero_target_page = NULL;
+    }
+    XBZRLE_cache_unlock();
 }
 
-static void ram_migration_cleanup(void *opaque)
+static void ram_save_cleanup(void *opaque)
 {
+    RAMState **rsp = opaque;
     RAMBlock *block;
 
     /* The caller must hold the iothread lock or be in a bh, so there is
@@ -1450,17 +1640,9 @@ static void ram_migration_cleanup(void *opaque)
         block->unsentmap = NULL;
     }
 
-    XBZRLE_cache_lock();
-    if (XBZRLE.cache) {
-        cache_fini(XBZRLE.cache);
-        g_free(XBZRLE.encoded_buf);
-        g_free(XBZRLE.current_buf);
-        g_free(ZERO_TARGET_PAGE);
-        XBZRLE.cache = NULL;
-        XBZRLE.encoded_buf = NULL;
-        XBZRLE.current_buf = NULL;
-    }
-    XBZRLE_cache_unlock();
+    xbzrle_cleanup();
+    compress_threads_save_cleanup();
+    ram_state_cleanup(rsp);
 }
 
 static void ram_state_reset(RAMState *rs)
@@ -1631,7 +1813,7 @@ static void postcopy_chunk_hostpages_pass(MigrationState *ms, bool unsent_pass,
                                           RAMBlock *block,
                                           PostcopyDiscardState *pds)
 {
-    RAMState *rs = &ram_state;
+    RAMState *rs = ram_state;
     unsigned long *bitmap = block->bmap;
     unsigned long *unsentmap = block->unsentmap;
     unsigned int host_ratio = block->page_size / TARGET_PAGE_SIZE;
@@ -1786,7 +1968,7 @@ static int postcopy_chunk_hostpages(MigrationState *ms, RAMBlock *block)
  */
 int ram_postcopy_send_discard_bitmap(MigrationState *ms)
 {
-    RAMState *rs = &ram_state;
+    RAMState *rs = ram_state;
     RAMBlock *block;
     int ret;
 
@@ -1861,6 +2043,8 @@ int ram_discard_range(const char *rbname, uint64_t start, size_t length)
         goto err;
     }
 
+    bitmap_clear(rb->receivedmap, start >> qemu_target_page_bits(),
+                 length >> qemu_target_page_bits());
     ret = ram_block_discard_range(rb, start, length);
 
 err:
@@ -1869,56 +2053,96 @@ err:
     return ret;
 }
 
-static int ram_state_init(RAMState *rs)
+/*
+ * For every allocation, we will try not to crash the VM if the
+ * allocation fails.
+ */
+static int xbzrle_init(void)
 {
-    memset(rs, 0, sizeof(*rs));
-    qemu_mutex_init(&rs->bitmap_mutex);
-    qemu_mutex_init(&rs->src_page_req_mutex);
-    QSIMPLEQ_INIT(&rs->src_page_requests);
+    Error *local_err = NULL;
 
-    if (migrate_use_xbzrle()) {
-        XBZRLE_cache_lock();
-        ZERO_TARGET_PAGE = g_malloc0(TARGET_PAGE_SIZE);
-        XBZRLE.cache = cache_init(migrate_xbzrle_cache_size() /
-                                  TARGET_PAGE_SIZE,
-                                  TARGET_PAGE_SIZE);
-        if (!XBZRLE.cache) {
-            XBZRLE_cache_unlock();
-            error_report("Error creating cache");
-            return -1;
-        }
-        XBZRLE_cache_unlock();
+    if (!migrate_use_xbzrle()) {
+        return 0;
+    }
 
-        /* We prefer not to abort if there is no memory */
-        XBZRLE.encoded_buf = g_try_malloc0(TARGET_PAGE_SIZE);
-        if (!XBZRLE.encoded_buf) {
-            error_report("Error allocating encoded_buf");
-            return -1;
-        }
+    XBZRLE_cache_lock();
 
-        XBZRLE.current_buf = g_try_malloc(TARGET_PAGE_SIZE);
-        if (!XBZRLE.current_buf) {
-            error_report("Error allocating current_buf");
-            g_free(XBZRLE.encoded_buf);
-            XBZRLE.encoded_buf = NULL;
-            return -1;
-        }
+    XBZRLE.zero_target_page = g_try_malloc0(TARGET_PAGE_SIZE);
+    if (!XBZRLE.zero_target_page) {
+        error_report("%s: Error allocating zero page", __func__);
+        goto err_out;
     }
 
-    /* For memory_global_dirty_log_start below.  */
-    qemu_mutex_lock_iothread();
+    XBZRLE.cache = cache_init(migrate_xbzrle_cache_size(),
+                              TARGET_PAGE_SIZE, &local_err);
+    if (!XBZRLE.cache) {
+        error_report_err(local_err);
+        goto free_zero_page;
+    }
 
-    qemu_mutex_lock_ramlist();
-    rcu_read_lock();
-    ram_state_reset(rs);
+    XBZRLE.encoded_buf = g_try_malloc0(TARGET_PAGE_SIZE);
+    if (!XBZRLE.encoded_buf) {
+        error_report("%s: Error allocating encoded_buf", __func__);
+        goto free_cache;
+    }
+
+    XBZRLE.current_buf = g_try_malloc(TARGET_PAGE_SIZE);
+    if (!XBZRLE.current_buf) {
+        error_report("%s: Error allocating current_buf", __func__);
+        goto free_encoded_buf;
+    }
+
+    /* We are all good */
+    XBZRLE_cache_unlock();
+    return 0;
+
+free_encoded_buf:
+    g_free(XBZRLE.encoded_buf);
+    XBZRLE.encoded_buf = NULL;
+free_cache:
+    cache_fini(XBZRLE.cache);
+    XBZRLE.cache = NULL;
+free_zero_page:
+    g_free(XBZRLE.zero_target_page);
+    XBZRLE.zero_target_page = NULL;
+err_out:
+    XBZRLE_cache_unlock();
+    return -ENOMEM;
+}
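
xbzrle_init() above uses the classic goto-unwind ladder: each allocation failure jumps to a label that releases everything acquired so far, in reverse order, so there is exactly one success path and no leaks. The bare shape of the idiom (resource names are illustrative):

#include <errno.h>
#include <stdlib.h>

static int init_three_buffers(char **a, char **b, char **c)
{
    *a = malloc(64);
    if (!*a) {
        goto err_out;
    }
    *b = malloc(64);
    if (!*b) {
        goto free_a;
    }
    *c = malloc(64);
    if (!*c) {
        goto free_b;
    }
    return 0;                   /* success: caller owns a, b and c */

free_b:
    free(*b);
    *b = NULL;
free_a:
    free(*a);
    *a = NULL;
err_out:
    return -ENOMEM;
}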
+
+static int ram_state_init(RAMState **rsp)
+{
+    *rsp = g_try_new0(RAMState, 1);
+
+    if (!*rsp) {
+        error_report("%s: Init ramstate fail", __func__);
+        return -1;
+    }
+
+    qemu_mutex_init(&(*rsp)->bitmap_mutex);
+    qemu_mutex_init(&(*rsp)->src_page_req_mutex);
+    QSIMPLEQ_INIT(&(*rsp)->src_page_requests);
+
+    /*
+     * Count the total number of pages used by ram blocks not including any
+     * gaps due to alignment or unplugs.
+     */
+    (*rsp)->migration_dirty_pages = ram_bytes_total() >> TARGET_PAGE_BITS;
+
+    ram_state_reset(*rsp);
+
+    return 0;
+}
+
+static void ram_list_init_bitmaps(void)
+{
+    RAMBlock *block;
+    unsigned long pages;
 
     /* Skip setting bitmap if there is no RAM */
     if (ram_bytes_total()) {
-        RAMBlock *block;
-
         QLIST_FOREACH_RCU(block, &ram_list.blocks, next) {
-            unsigned long pages = block->max_length >> TARGET_PAGE_BITS;
-
+            pages = block->max_length >> TARGET_PAGE_BITS;
             block->bmap = bitmap_new(pages);
             bitmap_set(block->bmap, 0, pages);
             if (migrate_postcopy_ram()) {
@@ -1927,18 +2151,36 @@ static int ram_state_init(RAMState *rs)
             }
         }
     }
+}
 
-    /*
-     * Count the total number of pages used by ram blocks not including any
-     * gaps due to alignment or unplugs.
-     */
-    rs->migration_dirty_pages = ram_bytes_total() >> TARGET_PAGE_BITS;
+static void ram_init_bitmaps(RAMState *rs)
+{
+    /* For memory_global_dirty_log_start below.  */
+    qemu_mutex_lock_iothread();
+    qemu_mutex_lock_ramlist();
+    rcu_read_lock();
 
+    ram_list_init_bitmaps();
     memory_global_dirty_log_start();
     migration_bitmap_sync(rs);
+
+    rcu_read_unlock();
     qemu_mutex_unlock_ramlist();
     qemu_mutex_unlock_iothread();
-    rcu_read_unlock();
+}
+
+static int ram_init_all(RAMState **rsp)
+{
+    if (ram_state_init(rsp)) {
+        return -1;
+    }
+
+    if (xbzrle_init()) {
+        ram_state_cleanup(rsp);
+        return -1;
+    }
+
+    ram_init_bitmaps(*rsp);
 
     return 0;
 }
@@ -1960,16 +2202,16 @@ static int ram_state_init(RAMState *rs)
  */
 static int ram_save_setup(QEMUFile *f, void *opaque)
 {
-    RAMState *rs = opaque;
+    RAMState **rsp = opaque;
     RAMBlock *block;
 
     /* migration has already setup the bitmap, reuse it. */
     if (!migration_in_colo_state()) {
-        if (ram_state_init(rs) < 0) {
+        if (ram_init_all(rsp) != 0) {
             return -1;
-         }
+        }
     }
-    rs->f = f;
+    (*rsp)->f = f;
 
     rcu_read_lock();
 
@@ -1985,6 +2227,7 @@ static int ram_save_setup(QEMUFile *f, void *opaque)
     }
 
     rcu_read_unlock();
+    compress_threads_save_setup();
 
     ram_control_before_iterate(f, RAM_CONTROL_SETUP);
     ram_control_after_iterate(f, RAM_CONTROL_SETUP);
@@ -2004,7 +2247,8 @@ static int ram_save_setup(QEMUFile *f, void *opaque)
  */
 static int ram_save_iterate(QEMUFile *f, void *opaque)
 {
-    RAMState *rs = opaque;
+    RAMState **temp = opaque;
+    RAMState *rs = *temp;
     int ret;
     int i;
     int64_t t0;
@@ -2057,7 +2301,7 @@ static int ram_save_iterate(QEMUFile *f, void *opaque)
     ram_control_after_iterate(f, RAM_CONTROL_ROUND);
 
     qemu_put_be64(f, RAM_SAVE_FLAG_EOS);
-    rs->bytes_transferred += 8;
+    ram_counters.transferred += 8;
 
     ret = qemu_file_get_error(f);
     if (ret < 0) {
@@ -2079,7 +2323,8 @@ static int ram_save_iterate(QEMUFile *f, void *opaque)
  */
 static int ram_save_complete(QEMUFile *f, void *opaque)
 {
-    RAMState *rs = opaque;
+    RAMState **temp = opaque;
+    RAMState *rs = *temp;
 
     rcu_read_lock();
 
@@ -2116,7 +2361,8 @@ static void ram_save_pending(QEMUFile *f, void *opaque, uint64_t max_size,
                              uint64_t *non_postcopiable_pending,
                              uint64_t *postcopiable_pending)
 {
-    RAMState *rs = opaque;
+    RAMState **temp = opaque;
+    RAMState *rs = *temp;
     uint64_t remaining_size;
 
     remaining_size = rs->migration_dirty_pages * TARGET_PAGE_SIZE;
@@ -2131,8 +2377,12 @@ static void ram_save_pending(QEMUFile *f, void *opaque, uint64_t max_size,
         remaining_size = rs->migration_dirty_pages * TARGET_PAGE_SIZE;
     }
 
-    /* We can do postcopy, and all the data is postcopiable */
-    *postcopiable_pending += remaining_size;
+    if (migrate_postcopy_ram()) {
+        /* We can do postcopy, and all the data is postcopiable */
+        *postcopiable_pending += remaining_size;
+    } else {
+        *non_postcopiable_pending += remaining_size;
+    }
 }
 
 static int load_xbzrle(QEMUFile *f, ram_addr_t addr, void *host)
@@ -2141,11 +2391,6 @@ static int load_xbzrle(QEMUFile *f, ram_addr_t addr, void *host)
     int xh_flags;
     uint8_t *loaded_data;
 
-    if (!xbzrle_decoded_buf) {
-        xbzrle_decoded_buf = g_malloc(TARGET_PAGE_SIZE);
-    }
-    loaded_data = xbzrle_decoded_buf;
-
     /* extract RLE header */
     xh_flags = qemu_get_byte(f);
     xh_len = qemu_get_be16(f);
@@ -2159,7 +2404,9 @@ static int load_xbzrle(QEMUFile *f, ram_addr_t addr, void *host)
         error_report("Failed to load XBZRLE page - len overflow!");
         return -1;
     }
+    loaded_data = XBZRLE.decoded_buf;
     /* load data and decode */
+    /* it can change loaded_data to point to an internal buffer */
     qemu_get_buffer_in_place(f, &loaded_data, xh_len);
 
     /* decode RLE */
@@ -2293,10 +2540,13 @@ static void wait_for_decompress_done(void)
     qemu_mutex_unlock(&decomp_done_lock);
 }
 
-void migrate_decompress_threads_create(void)
+static void compress_threads_load_setup(void)
 {
     int i, thread_count;
 
+    if (!migrate_use_compression()) {
+        return;
+    }
     thread_count = migrate_decompress_threads();
     decompress_threads = g_new0(QemuThread, thread_count);
     decomp_param = g_new0(DecompressParam, thread_count);
@@ -2314,10 +2564,13 @@ void migrate_decompress_threads_create(void)
     }
 }
 
-void migrate_decompress_threads_join(void)
+static void compress_threads_load_cleanup(void)
 {
     int i, thread_count;
 
+    if (!migrate_use_compression()) {
+        return;
+    }
     thread_count = migrate_decompress_threads();
     for (i = 0; i < thread_count; i++) {
         qemu_mutex_lock(&decomp_param[i].mutex);
@@ -2366,6 +2619,35 @@ static void decompress_data_with_multi_threads(QEMUFile *f,
     qemu_mutex_unlock(&decomp_done_lock);
 }
 
+/**
+ * ram_load_setup: Setup RAM for migration incoming side
+ *
+ * Returns zero to indicate success and negative for error
+ *
+ * @f: QEMUFile where to receive the data
+ * @opaque: RAMState pointer
+ */
+static int ram_load_setup(QEMUFile *f, void *opaque)
+{
+    xbzrle_load_setup();
+    compress_threads_load_setup();
+    ramblock_recv_map_init();
+    return 0;
+}
+
+static int ram_load_cleanup(void *opaque)
+{
+    RAMBlock *rb;
+    xbzrle_load_cleanup();
+    compress_threads_load_cleanup();
+
+    RAMBLOCK_FOREACH(rb) {
+        g_free(rb->receivedmap);
+        rb->receivedmap = NULL;
+    }
+    return 0;
+}
+
 /**
  * ram_postcopy_incoming_init: allocate postcopy data structures
  *
@@ -2502,10 +2784,10 @@ static int ram_load_postcopy(QEMUFile *f)
 
             if (all_zero) {
                 ret = postcopy_place_page_zero(mis, place_dest,
-                                               block->page_size);
+                                               block);
             } else {
                 ret = postcopy_place_page(mis, place_dest,
-                                          place_source, block->page_size);
+                                          place_source, block);
             }
         }
         if (!ret) {
@@ -2518,7 +2800,7 @@ static int ram_load_postcopy(QEMUFile *f)
 
 static int ram_load(QEMUFile *f, void *opaque, int version_id)
 {
-    int flags = 0, ret = 0;
+    int flags = 0, ret = 0, invalid_flags = 0;
     static uint64_t seq_iter;
     int len = 0;
     /*
@@ -2535,6 +2817,9 @@ static int ram_load(QEMUFile *f, void *opaque, int version_id)
         ret = -EINVAL;
     }
 
+    if (!migrate_use_compression()) {
+        invalid_flags |= RAM_SAVE_FLAG_COMPRESS_PAGE;
+    }
     /* This RCU critical section can be very long running.
      * When the RCU reclaims in this code become numerous,
      * it will be necessary to reduce the granularity of this
@@ -2555,6 +2840,15 @@ static int ram_load(QEMUFile *f, void *opaque, int version_id)
         flags = addr & ~TARGET_PAGE_MASK;
         addr &= TARGET_PAGE_MASK;
 
+        if (flags & invalid_flags) {
+            if (flags & invalid_flags & RAM_SAVE_FLAG_COMPRESS_PAGE) {
+                error_report("Received an unexpected compressed page");
+            }
+
+            ret = -EINVAL;
+            break;
+        }
+
         if (flags & (RAM_SAVE_FLAG_ZERO | RAM_SAVE_FLAG_PAGE |
                      RAM_SAVE_FLAG_COMPRESS_PAGE | RAM_SAVE_FLAG_XBZRLE)) {
             RAMBlock *block = ram_block_from_stream(f, flags);
@@ -2565,6 +2859,7 @@ static int ram_load(QEMUFile *f, void *opaque, int version_id)
                 ret = -EINVAL;
                 break;
             }
+            ramblock_recv_bitmap_set(block, host);
             trace_ram_load_loop(block->idstr, (uint64_t)addr, flags, host);
         }
 
@@ -2667,14 +2962,22 @@ static int ram_load(QEMUFile *f, void *opaque, int version_id)
     return ret;
 }
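
The invalid_flags handling added to ram_load() computes, once per stream, a mask of page flags this destination cannot accept (compressed pages when compression is disabled) and rejects any header carrying one. The pattern in isolation; RAM_SAVE_FLAG_COMPRESS_PAGE's 0x100 comes from this file, the other flag value is a placeholder:

#include <stdint.h>
#include <stdio.h>

#define FLAG_PAGE           0x008   /* placeholder value */
#define FLAG_COMPRESS_PAGE  0x100

/* Returns 0 if the header flags are acceptable, -1 otherwise. */
static int check_flags(uint64_t flags, uint64_t invalid_flags)
{
    if (flags & invalid_flags) {
        if (flags & invalid_flags & FLAG_COMPRESS_PAGE) {
            fprintf(stderr, "Received an unexpected compressed page\n");
        }
        return -1;              /* ram_load() sets -EINVAL and breaks */
    }
    return 0;
}

int main(void)
{
    /* Destination without compression: compressed pages are invalid. */
    uint64_t invalid_flags = FLAG_COMPRESS_PAGE;

    printf("%d\n", check_flags(FLAG_PAGE, invalid_flags));          /* 0 */
    printf("%d\n", check_flags(FLAG_COMPRESS_PAGE, invalid_flags)); /* -1 */
    return 0;
}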
 
+static bool ram_has_postcopy(void *opaque)
+{
+    return migrate_postcopy_ram();
+}
+
 static SaveVMHandlers savevm_ram_handlers = {
-    .save_live_setup = ram_save_setup,
+    .save_setup = ram_save_setup,
     .save_live_iterate = ram_save_iterate,
     .save_live_complete_postcopy = ram_save_complete,
     .save_live_complete_precopy = ram_save_complete,
+    .has_postcopy = ram_has_postcopy,
     .save_live_pending = ram_save_pending,
     .load_state = ram_load,
-    .cleanup = ram_migration_cleanup,
+    .save_cleanup = ram_save_cleanup,
+    .load_setup = ram_load_setup,
+    .load_cleanup = ram_load_cleanup,
 };
 
 void ram_mig_init(void)
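
The blobdiff view ends at the ram_mig_init() declaration. Presumably the body, unchanged by this patch, registers the table above with the savevm core; a sketch of what that registration looks like in this tree (the exact arguments are an assumption, not part of this diff):

void ram_mig_init(void)
{
    qemu_mutex_init(&XBZRLE.lock);
    /* opaque is a RAMState **, matching the *rsp dereferences above */
    register_savevm_live(NULL, "ram", 0, 4, &savevm_ram_handlers, &ram_state);
}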