Merge remote-tracking branch 'remotes/rth/tags/pull-tcg-20190903' into staging

[mirror_qemu.git] / exec.c
diff --git a/exec.c b/exec.c

index 03dd673d36d8ab4fcee56471abfbca81cf289c3e..235d6bc88323432899f4f10b7f292548facc4df0 100644 (file)
--- a/exec.c
+++ b/exec.c
@@ -16,7 +16,9 @@
   * You should have received a copy of the GNU Lesser General Public
   * License along with this library; if not, see <http://www.gnu.org/licenses/>.
   */
+
  #include "qemu/osdep.h"
+#include "qemu-common.h"
  #include "qapi/error.h"
  
  #include "qemu/cutils.h"
@@ -32,17 +34,18 @@
  #endif
  #include "sysemu/kvm.h"
  #include "sysemu/sysemu.h"
+#include "sysemu/tcg.h"
  #include "qemu/timer.h"
  #include "qemu/config-file.h"
  #include "qemu/error-report.h"
+#include "qemu/qemu-print.h"
  #if defined(CONFIG_USER_ONLY)
  #include "qemu.h"
  #else /* !CONFIG_USER_ONLY */
-#include "hw/hw.h"
  #include "exec/memory.h"
  #include "exec/ioport.h"
  #include "sysemu/dma.h"
-#include "sysemu/numa.h"
+#include "sysemu/hostmem.h"
  #include "sysemu/hw_accel.h"
  #include "exec/address-spaces.h"
  #include "sysemu/xen-mapcache.h"
@@ -190,14 +193,12 @@ typedef struct subpage_t {
  #define PHYS_SECTION_UNASSIGNED 0
  #define PHYS_SECTION_NOTDIRTY 1
  #define PHYS_SECTION_ROM 2
-#define PHYS_SECTION_WATCH 3
  
  static void io_mem_init(void);
  static void memory_map_init(void);
+static void tcg_log_global_after_sync(MemoryListener *listener);
  static void tcg_commit(MemoryListener *listener);
  
-static MemoryRegion io_mem_watch;
-
  /**
   * CPUAddressSpace: all the information a CPU needs about an AddressSpace
   * @cpu: the CPU whose AddressSpace this is
@@ -902,6 +903,7 @@ void cpu_address_space_init(CPUState *cpu, int asidx,
      newas->cpu = cpu;
      newas->as = as;
      if (tcg_enabled()) {
+        newas->tcg_as_listener.log_global_after_sync = tcg_log_global_after_sync;
          newas->tcg_as_listener.commit = tcg_commit;
          memory_listener_register(&newas->tcg_as_listener, as);
      }
@@ -934,7 +936,7 @@ void cpu_exec_unrealizefn(CPUState *cpu)
  Property cpu_common_props[] = {
  #ifndef CONFIG_USER_ONLY
      /* Create a memory property for softmmu CPU object,
-     * so users can wire up its memory. (This can't go in qom/cpu.c
+     * so users can wire up its memory. (This can't go in hw/core/cpu.c
       * because that file is compiled only once for both user-mode
       * and system builds.) The default if no link is set up is to use
       * the system address space.
@@ -982,14 +984,18 @@ void cpu_exec_realizefn(CPUState *cpu, Error **errp)
  #endif
  }
  
-const char *parse_cpu_model(const char *cpu_model)
+const char *parse_cpu_option(const char *cpu_option)
  {
      ObjectClass *oc;
      CPUClass *cc;
      gchar **model_pieces;
      const char *cpu_type;
  
-    model_pieces = g_strsplit(cpu_model, ",", 2);
+    model_pieces = g_strsplit(cpu_option, ",", 2);
+    if (!model_pieces[0]) {
+        error_report("-cpu option cannot be empty");
+        exit(1);
+    }
  
      oc = cpu_class_by_name(CPU_RESOLVING_TYPE, model_pieces[0]);
      if (oc == NULL) {
@@ -1053,28 +1059,7 @@ static void breakpoint_invalidate(CPUState *cpu, target_ulong pc)
  }
  #endif
  
-#if defined(CONFIG_USER_ONLY)
-void cpu_watchpoint_remove_all(CPUState *cpu, int mask)
-
-{
-}
-
-int cpu_watchpoint_remove(CPUState *cpu, vaddr addr, vaddr len,
-                          int flags)
-{
-    return -ENOSYS;
-}
-
-void cpu_watchpoint_remove_by_ref(CPUState *cpu, CPUWatchpoint *watchpoint)
-{
-}
-
-int cpu_watchpoint_insert(CPUState *cpu, vaddr addr, vaddr len,
-                          int flags, CPUWatchpoint **watchpoint)
-{
-    return -ENOSYS;
-}
-#else
+#ifndef CONFIG_USER_ONLY
  /* Add a watchpoint.  */
  int cpu_watchpoint_insert(CPUState *cpu, vaddr addr, vaddr len,
                            int flags, CPUWatchpoint **watchpoint)
@@ -1150,9 +1135,8 @@ void cpu_watchpoint_remove_all(CPUState *cpu, int mask)
   * partially or completely with the address range covered by the
   * access).
   */
-static inline bool cpu_watchpoint_address_matches(CPUWatchpoint *wp,
-                                                  vaddr addr,
-                                                  vaddr len)
+static inline bool watchpoint_address_matches(CPUWatchpoint *wp,
+                                              vaddr addr, vaddr len)
  {
      /* We know the lengths are non-zero, but a little caution is
       * required to avoid errors in the case where the range ends
@@ -1165,7 +1149,20 @@ static inline bool cpu_watchpoint_address_matches(CPUWatchpoint *wp,
      return !(addr > wpend || wp->vaddr > addrend);
  }
  
-#endif
+/* Return flags for watchpoints that match addr + prot.  */
+int cpu_watchpoint_address_matches(CPUState *cpu, vaddr addr, vaddr len)
+{
+    CPUWatchpoint *wp;
+    int ret = 0;
+
+    QTAILQ_FOREACH(wp, &cpu->watchpoints, entry) {
+        if (watchpoint_address_matches(wp, addr, TARGET_PAGE_SIZE)) {
+            ret |= wp->flags;
+        }
+    }
+    return ret;
+}
+#endif /* !CONFIG_USER_ONLY */
  
  /* Add a breakpoint.  */
  int cpu_breakpoint_insert(CPUState *cpu, vaddr pc, int flags,
@@ -1255,7 +1252,7 @@ void cpu_abort(CPUState *cpu, const char *fmt, ...)
      fprintf(stderr, "qemu: fatal: ");
      vfprintf(stderr, fmt, ap);
      fprintf(stderr, "\n");
-    cpu_dump_state(cpu, stderr, fprintf, CPU_DUMP_FPU | CPU_DUMP_CCOP);
+    cpu_dump_state(cpu, stderr, CPU_DUMP_FPU | CPU_DUMP_CCOP);
      if (qemu_log_separate()) {
          qemu_log_lock();
          qemu_log("qemu: fatal: ");
@@ -1350,6 +1347,8 @@ bool cpu_physical_memory_test_and_clear_dirty(ram_addr_t start,
      DirtyMemoryBlocks *blocks;
      unsigned long end, page;
      bool dirty = false;
+    RAMBlock *ramblock;
+    uint64_t mr_offset, mr_size;
  
      if (length == 0) {
          return false;
@@ -1361,6 +1360,10 @@ bool cpu_physical_memory_test_and_clear_dirty(ram_addr_t start,
      rcu_read_lock();
  
      blocks = atomic_rcu_read(&ram_list.dirty_memory[client]);
+    ramblock = qemu_get_ram_block(start);
+    /* Range sanity check on the ramblock */
+    assert(start >= ramblock->offset &&
+           start + length <= ramblock->offset + ramblock->used_length);
  
      while (page < end) {
          unsigned long idx = page / DIRTY_MEMORY_BLOCK_SIZE;
@@ -1372,6 +1375,10 @@ bool cpu_physical_memory_test_and_clear_dirty(ram_addr_t start,
          page += num;
      }
  
+    mr_offset = (ram_addr_t)(page << TARGET_PAGE_BITS) - ramblock->offset;
+    mr_size = (end - page) << TARGET_PAGE_BITS;
+    memory_region_clear_dirty_bitmap(ramblock->mr, mr_offset, mr_size);
+
      rcu_read_unlock();
  
      if (dirty && tcg_enabled()) {
@@ -1382,9 +1389,10 @@ bool cpu_physical_memory_test_and_clear_dirty(ram_addr_t start,
  }
  
  DirtyBitmapSnapshot *cpu_physical_memory_snapshot_and_clear_dirty
-     (ram_addr_t start, ram_addr_t length, unsigned client)
+    (MemoryRegion *mr, hwaddr offset, hwaddr length, unsigned client)
  {
      DirtyMemoryBlocks *blocks;
+    ram_addr_t start = memory_region_get_ram_addr(mr) + offset;
      unsigned long align = 1UL << (TARGET_PAGE_BITS + BITS_PER_LEVEL);
      ram_addr_t first = QEMU_ALIGN_DOWN(start, align);
      ram_addr_t last  = QEMU_ALIGN_UP(start + length, align);
@@ -1426,6 +1434,8 @@ DirtyBitmapSnapshot *cpu_physical_memory_snapshot_and_clear_dirty
          tlb_reset_dirty_range_all(start, length);
      }
  
+    memory_region_clear_dirty_bitmap(mr, offset, length);
+
      return snap;
  }
  
@@ -1459,7 +1469,6 @@ hwaddr memory_region_section_get_iotlb(CPUState *cpu,
                                         target_ulong *address)
  {
      hwaddr iotlb;
-    CPUWatchpoint *wp;
  
      if (memory_region_is_ram(section->mr)) {
          /* Normal RAM.  */
@@ -1477,19 +1486,6 @@ hwaddr memory_region_section_get_iotlb(CPUState *cpu,
          iotlb += xlat;
      }
  
-    /* Make accesses to pages with watchpoints go via the
-       watchpoint trap routines.  */
-    QTAILQ_FOREACH(wp, &cpu->watchpoints, entry) {
-        if (cpu_watchpoint_address_matches(wp, vaddr, TARGET_PAGE_SIZE)) {
-            /* Avoid trapping reads of pages with a write breakpoint. */
-            if ((prot & PAGE_WRITE) || (wp->flags & BP_MEM_READ)) {
-                iotlb = PHYS_SECTION_WATCH + paddr;
-                *address |= TLB_MMIO;
-                break;
-            }
-        }
-    }
-
      return iotlb;
  }
  #endif /* defined(CONFIG_USER_ONLY) */
@@ -1599,35 +1595,49 @@ static void register_multipage(FlatView *fv,
      phys_page_set(d, start_addr >> TARGET_PAGE_BITS, num_pages, section_index);
  }
  
+/*
+ * The range in *section* may look like this:
+ *
+ *      |s|PPPPPPP|s|
+ *
+ * where s stands for subpage and P for page.
+ */
  void flatview_add_to_dispatch(FlatView *fv, MemoryRegionSection *section)
  {
-    MemoryRegionSection now = *section, remain = *section;
+    MemoryRegionSection remain = *section;
      Int128 page_size = int128_make64(TARGET_PAGE_SIZE);
  
-    if (now.offset_within_address_space & ~TARGET_PAGE_MASK) {
-        uint64_t left = TARGET_PAGE_ALIGN(now.offset_within_address_space)
-                       - now.offset_within_address_space;
+    /* register first subpage */
+    if (remain.offset_within_address_space & ~TARGET_PAGE_MASK) {
+        uint64_t left = TARGET_PAGE_ALIGN(remain.offset_within_address_space)
+                        - remain.offset_within_address_space;
  
+        MemoryRegionSection now = remain;
          now.size = int128_min(int128_make64(left), now.size);
          register_subpage(fv, &now);
-    } else {
-        now.size = int128_zero();
-    }
-    while (int128_ne(remain.size, now.size)) {
+        if (int128_eq(remain.size, now.size)) {
+            return;
+        }
          remain.size = int128_sub(remain.size, now.size);
          remain.offset_within_address_space += int128_get64(now.size);
          remain.offset_within_region += int128_get64(now.size);
-        now = remain;
-        if (int128_lt(remain.size, page_size)) {
-            register_subpage(fv, &now);
-        } else if (remain.offset_within_address_space & ~TARGET_PAGE_MASK) {
-            now.size = page_size;
-            register_subpage(fv, &now);
-        } else {
-            now.size = int128_and(now.size, int128_neg(page_size));
-            register_multipage(fv, &now);
+    }
+
+    /* register whole pages */
+    if (int128_ge(remain.size, page_size)) {
+        MemoryRegionSection now = remain;
+        now.size = int128_and(now.size, int128_neg(page_size));
+        register_multipage(fv, &now);
+        if (int128_eq(remain.size, now.size)) {
+            return;
          }
+        remain.size = int128_sub(remain.size, now.size);
+        remain.offset_within_address_space += int128_get64(now.size);
+        remain.offset_within_region += int128_get64(now.size);
      }
+
+    /* register last subpage */
+    register_subpage(fv, &remain);
  }
  
  void qemu_flush_coalesced_mmio_buffer(void)
@@ -1673,14 +1683,15 @@ void ram_block_dump(Monitor *mon)
   * when we actually open and map them.  Iterate over the file
   * descriptors instead, and use qemu_fd_getpagesize().
   */
-static int find_max_supported_pagesize(Object *obj, void *opaque)
+static int find_min_backend_pagesize(Object *obj, void *opaque)
  {
      long *hpsize_min = opaque;
  
      if (object_dynamic_cast(obj, TYPE_MEMORY_BACKEND)) {
-        long hpsize = host_memory_backend_pagesize(MEMORY_BACKEND(obj));
+        HostMemoryBackend *backend = MEMORY_BACKEND(obj);
+        long hpsize = host_memory_backend_pagesize(backend);
  
-        if (hpsize < *hpsize_min) {
+        if (host_memory_backend_is_mapped(backend) && (hpsize < *hpsize_min)) {
              *hpsize_min = hpsize;
          }
      }
@@ -1688,11 +1699,32 @@ static int find_max_supported_pagesize(Object *obj, void *opaque)
      return 0;
  }
  
-long qemu_getrampagesize(void)
+static int find_max_backend_pagesize(Object *obj, void *opaque)
+{
+    long *hpsize_max = opaque;
+
+    if (object_dynamic_cast(obj, TYPE_MEMORY_BACKEND)) {
+        HostMemoryBackend *backend = MEMORY_BACKEND(obj);
+        long hpsize = host_memory_backend_pagesize(backend);
+
+        if (host_memory_backend_is_mapped(backend) && (hpsize > *hpsize_max)) {
+            *hpsize_max = hpsize;
+        }
+    }
+
+    return 0;
+}
+
+/*
+ * TODO: We assume right now that all mapped host memory backends are
+ * used as RAM, however some might be used for different purposes.
+ */
+long qemu_minrampagesize(void)
  {
      long hpsize = LONG_MAX;
      long mainrampagesize;
      Object *memdev_root;
+    MachineState *ms = MACHINE(qdev_get_machine());
  
      mainrampagesize = qemu_mempath_getpagesize(mem_path);
  
@@ -1708,7 +1740,7 @@ long qemu_getrampagesize(void)
       */
      memdev_root = object_resolve_path("/objects", NULL);
      if (memdev_root) {
-        object_child_foreach(memdev_root, find_max_supported_pagesize, &hpsize);
+        object_child_foreach(memdev_root, find_min_backend_pagesize, &hpsize);
      }
      if (hpsize == LONG_MAX) {
          /* No additional memory regions found ==> Report main RAM page size */
@@ -1720,7 +1752,9 @@ long qemu_getrampagesize(void)
       * so if its page size is smaller we have got to report that size instead.
       */
      if (hpsize > mainrampagesize &&
-        (nb_numa_nodes == 0 || numa_info[0].node_memdev == NULL)) {
+        (ms->numa_state == NULL ||
+         ms->numa_state->num_nodes == 0 ||
+         ms->numa_state->nodes[0].node_memdev == NULL)) {
          static bool warned;
          if (!warned) {
              error_report("Huge page support disabled (n/a for main memory).");
@@ -1731,8 +1765,24 @@ long qemu_getrampagesize(void)
  
      return hpsize;
  }
+
+long qemu_maxrampagesize(void)
+{
+    long pagesize = qemu_mempath_getpagesize(mem_path);
+    Object *memdev_root = object_resolve_path("/objects", NULL);
+
+    if (memdev_root) {
+        object_child_foreach(memdev_root, find_max_backend_pagesize,
+                             &pagesize);
+    }
+    return pagesize;
+}
  #else
-long qemu_getrampagesize(void)
+long qemu_minrampagesize(void)
+{
+    return getpagesize();
+}
+long qemu_maxrampagesize(void)
  {
      return getpagesize();
  }
@@ -1815,6 +1865,7 @@ static void *file_ram_alloc(RAMBlock *block,
                              bool truncate,
                              Error **errp)
  {
+    MachineState *ms = MACHINE(qdev_get_machine());
      void *area;
  
      block->page_size = qemu_fd_getpagesize(fd);
@@ -1863,7 +1914,7 @@ static void *file_ram_alloc(RAMBlock *block,
      }
  
      area = qemu_ram_mmap(fd, memory, block->mr->align,
-                         block->flags & RAM_SHARED);
+                         block->flags & RAM_SHARED, block->flags & RAM_PMEM);
      if (area == MAP_FAILED) {
          error_setg_errno(errp, errno,
                           "unable to map backing store for guest RAM");
@@ -1871,7 +1922,7 @@ static void *file_ram_alloc(RAMBlock *block,
      }
  
      if (mem_prealloc) {
-        os_mem_prealloc(fd, area, memory, smp_cpus, errp);
+        os_mem_prealloc(fd, area, memory, ms->smp.cpus, errp);
          if (errp && *errp) {
              qemu_ram_munmap(fd, area, memory);
              return NULL;
@@ -1972,6 +2023,21 @@ const char *qemu_ram_get_idstr(RAMBlock *rb)
      return rb->idstr;
  }
  
+void *qemu_ram_get_host_addr(RAMBlock *rb)
+{
+    return rb->host;
+}
+
+ram_addr_t qemu_ram_get_offset(RAMBlock *rb)
+{
+    return rb->offset;
+}
+
+ram_addr_t qemu_ram_get_used_length(RAMBlock *rb)
+{
+    return rb->used_length;
+}
+
  bool qemu_ram_is_shared(RAMBlock *rb)
  {
      return rb->flags & RAM_SHARED;
@@ -2722,32 +2788,35 @@ static const MemoryRegionOps notdirty_mem_ops = {
  };
  
  /* Generate a debug exception if a watchpoint has been hit.  */
-static void check_watchpoint(int offset, int len, MemTxAttrs attrs, int flags)
+void cpu_check_watchpoint(CPUState *cpu, vaddr addr, vaddr len,
+                          MemTxAttrs attrs, int flags, uintptr_t ra)
  {
-    CPUState *cpu = current_cpu;
      CPUClass *cc = CPU_GET_CLASS(cpu);
-    target_ulong vaddr;
      CPUWatchpoint *wp;
  
      assert(tcg_enabled());
      if (cpu->watchpoint_hit) {
-        /* We re-entered the check after replacing the TB. Now raise
-         * the debug interrupt so that is will trigger after the
-         * current instruction. */
+        /*
+         * We re-entered the check after replacing the TB.
+         * Now raise the debug interrupt so that it will
+         * trigger after the current instruction.
+         */
+        qemu_mutex_lock_iothread();
          cpu_interrupt(cpu, CPU_INTERRUPT_DEBUG);
+        qemu_mutex_unlock_iothread();
          return;
      }
-    vaddr = (cpu->mem_io_vaddr & TARGET_PAGE_MASK) + offset;
-    vaddr = cc->adjust_watchpoint_address(cpu, vaddr, len);
+
+    addr = cc->adjust_watchpoint_address(cpu, addr, len);
      QTAILQ_FOREACH(wp, &cpu->watchpoints, entry) {
-        if (cpu_watchpoint_address_matches(wp, vaddr, len)
+        if (watchpoint_address_matches(wp, addr, len)
              && (wp->flags & flags)) {
              if (flags == BP_MEM_READ) {
                  wp->flags |= BP_WATCHPOINT_HIT_READ;
              } else {
                  wp->flags |= BP_WATCHPOINT_HIT_WRITE;
              }
-            wp->hitaddr = vaddr;
+            wp->hitaddr = MAX(addr, wp->vaddr);
              wp->hitattrs = attrs;
              if (!cpu->watchpoint_hit) {
                  if (wp->flags & BP_CPU &&
@@ -2762,11 +2831,14 @@ static void check_watchpoint(int offset, int len, MemTxAttrs attrs, int flags)
                  if (wp->flags & BP_STOP_BEFORE_ACCESS) {
                      cpu->exception_index = EXCP_DEBUG;
                      mmap_unlock();
-                    cpu_loop_exit(cpu);
+                    cpu_loop_exit_restore(cpu, ra);
                  } else {
                      /* Force execution of one insn next time.  */
                      cpu->cflags_next_tb = 1 | curr_cflags();
                      mmap_unlock();
+                    if (ra) {
+                        cpu_restore_state(cpu, ra, true);
+                    }
                      cpu_loop_exit_noexc(cpu);
                  }
              }
@@ -2776,85 +2848,11 @@ static void check_watchpoint(int offset, int len, MemTxAttrs attrs, int flags)
      }
  }
  
-/* Watchpoint access routines.  Watchpoints are inserted using TLB tricks,
-   so these check for a hit then pass through to the normal out-of-line
-   phys routines.  */
-static MemTxResult watch_mem_read(void *opaque, hwaddr addr, uint64_t *pdata,
-                                  unsigned size, MemTxAttrs attrs)
-{
-    MemTxResult res;
-    uint64_t data;
-    int asidx = cpu_asidx_from_attrs(current_cpu, attrs);
-    AddressSpace *as = current_cpu->cpu_ases[asidx].as;
-
-    check_watchpoint(addr & ~TARGET_PAGE_MASK, size, attrs, BP_MEM_READ);
-    switch (size) {
-    case 1:
-        data = address_space_ldub(as, addr, attrs, &res);
-        break;
-    case 2:
-        data = address_space_lduw(as, addr, attrs, &res);
-        break;
-    case 4:
-        data = address_space_ldl(as, addr, attrs, &res);
-        break;
-    case 8:
-        data = address_space_ldq(as, addr, attrs, &res);
-        break;
-    default: abort();
-    }
-    *pdata = data;
-    return res;
-}
-
-static MemTxResult watch_mem_write(void *opaque, hwaddr addr,
-                                   uint64_t val, unsigned size,
-                                   MemTxAttrs attrs)
-{
-    MemTxResult res;
-    int asidx = cpu_asidx_from_attrs(current_cpu, attrs);
-    AddressSpace *as = current_cpu->cpu_ases[asidx].as;
-
-    check_watchpoint(addr & ~TARGET_PAGE_MASK, size, attrs, BP_MEM_WRITE);
-    switch (size) {
-    case 1:
-        address_space_stb(as, addr, val, attrs, &res);
-        break;
-    case 2:
-        address_space_stw(as, addr, val, attrs, &res);
-        break;
-    case 4:
-        address_space_stl(as, addr, val, attrs, &res);
-        break;
-    case 8:
-        address_space_stq(as, addr, val, attrs, &res);
-        break;
-    default: abort();
-    }
-    return res;
-}
-
-static const MemoryRegionOps watch_mem_ops = {
-    .read_with_attrs = watch_mem_read,
-    .write_with_attrs = watch_mem_write,
-    .endianness = DEVICE_NATIVE_ENDIAN,
-    .valid = {
-        .min_access_size = 1,
-        .max_access_size = 8,
-        .unaligned = false,
-    },
-    .impl = {
-        .min_access_size = 1,
-        .max_access_size = 8,
-        .unaligned = false,
-    },
-};
-
  static MemTxResult flatview_read(FlatView *fv, hwaddr addr,
-                                      MemTxAttrs attrs, uint8_t *buf, int len);
+                                 MemTxAttrs attrs, uint8_t *buf, hwaddr len);
  static MemTxResult flatview_write(FlatView *fv, hwaddr addr, MemTxAttrs attrs,
-                                  const uint8_t *buf, int len);
-static bool flatview_access_valid(FlatView *fv, hwaddr addr, int len,
+                                  const uint8_t *buf, hwaddr len);
+static bool flatview_access_valid(FlatView *fv, hwaddr addr, hwaddr len,
                                    bool is_write, MemTxAttrs attrs);
  
  static MemTxResult subpage_read(void *opaque, hwaddr addr, uint64_t *data,
@@ -3025,9 +3023,6 @@ static void io_mem_init(void)
      memory_region_init_io(&io_mem_notdirty, NULL, &notdirty_mem_ops, NULL,
                            NULL, UINT64_MAX);
      memory_region_clear_global_locking(&io_mem_notdirty);
-
-    memory_region_init_io(&io_mem_watch, NULL, &watch_mem_ops, NULL,
-                          NULL, UINT64_MAX);
  }
  
  AddressSpaceDispatch *address_space_dispatch_new(FlatView *fv)
@@ -3041,8 +3036,6 @@ AddressSpaceDispatch *address_space_dispatch_new(FlatView *fv)
      assert(n == PHYS_SECTION_NOTDIRTY);
      n = dummy_section(&d->map, fv, &io_mem_rom);
      assert(n == PHYS_SECTION_ROM);
-    n = dummy_section(&d->map, fv, &io_mem_watch);
-    assert(n == PHYS_SECTION_WATCH);
  
      d->phys_map  = (PhysPageEntry) { .ptr = PHYS_MAP_NODE_NIL, .skip = 1 };
  
@@ -3055,6 +3048,35 @@ void address_space_dispatch_free(AddressSpaceDispatch *d)
      g_free(d);
  }
  
+static void do_nothing(CPUState *cpu, run_on_cpu_data d)
+{
+}
+
+static void tcg_log_global_after_sync(MemoryListener *listener)
+{
+    CPUAddressSpace *cpuas;
+
+    /* Wait for the CPU to end the current TB.  This avoids the following
+     * incorrect race:
+     *
+     *      vCPU                         migration
+     *      ----------------------       -------------------------
+     *      TLB check -> slow path
+     *        notdirty_mem_write
+     *          write to RAM
+     *          mark dirty
+     *                                   clear dirty flag
+     *      TLB check -> fast path
+     *                                   read memory
+     *        write to RAM
+     *
+     * by pushing the migration thread's memory read after the vCPU thread has
+     * written the memory.
+     */
+    cpuas = container_of(listener, CPUAddressSpace, tcg_as_listener);
+    run_on_cpu(cpuas->cpu, do_nothing, RUN_ON_CPU_NULL);
+}
+
  static void tcg_commit(MemoryListener *listener)
  {
      CPUAddressSpace *cpuas;
@@ -3102,10 +3124,10 @@ MemoryRegion *get_system_io(void)
  /* physical memory access (slow version, mainly for debug) */
  #if defined(CONFIG_USER_ONLY)
  int cpu_memory_rw_debug(CPUState *cpu, target_ulong addr,
-                        uint8_t *buf, int len, int is_write)
+                        uint8_t *buf, target_ulong len, int is_write)
  {
-    int l, flags;
-    target_ulong page;
+    int flags;
+    target_ulong l, page;
      void * p;
  
      while (len > 0) {
@@ -3231,7 +3253,7 @@ static bool prepare_mmio_access(MemoryRegion *mr)
  static MemTxResult flatview_write_continue(FlatView *fv, hwaddr addr,
                                             MemTxAttrs attrs,
                                             const uint8_t *buf,
-                                           int len, hwaddr addr1,
+                                           hwaddr len, hwaddr addr1,
                                             hwaddr l, MemoryRegion *mr)
  {
      uint8_t *ptr;
@@ -3245,8 +3267,9 @@ static MemTxResult flatview_write_continue(FlatView *fv, hwaddr addr,
              l = memory_access_size(mr, l, addr1);
              /* XXX: could force current_cpu to NULL to avoid
                 potential bugs */
-            val = ldn_p(buf, l);
-            result |= memory_region_dispatch_write(mr, addr1, val, l, attrs);
+            val = ldn_he_p(buf, l);
+            result |= memory_region_dispatch_write(mr, addr1, val,
+                                                   size_memop(l), attrs);
          } else {
              /* RAM case */
              ptr = qemu_ram_ptr_length(mr->ram_block, addr1, &l, false);
@@ -3276,7 +3299,7 @@ static MemTxResult flatview_write_continue(FlatView *fv, hwaddr addr,
  
  /* Called from RCU critical section.  */
  static MemTxResult flatview_write(FlatView *fv, hwaddr addr, MemTxAttrs attrs,
-                                  const uint8_t *buf, int len)
+                                  const uint8_t *buf, hwaddr len)
  {
      hwaddr l;
      hwaddr addr1;
@@ -3294,7 +3317,7 @@ static MemTxResult flatview_write(FlatView *fv, hwaddr addr, MemTxAttrs attrs,
  /* Called within RCU critical section.  */
  MemTxResult flatview_read_continue(FlatView *fv, hwaddr addr,
                                     MemTxAttrs attrs, uint8_t *buf,
-                                   int len, hwaddr addr1, hwaddr l,
+                                   hwaddr len, hwaddr addr1, hwaddr l,
                                     MemoryRegion *mr)
  {
      uint8_t *ptr;
@@ -3307,8 +3330,9 @@ MemTxResult flatview_read_continue(FlatView *fv, hwaddr addr,
              /* I/O case */
              release_lock |= prepare_mmio_access(mr);
              l = memory_access_size(mr, l, addr1);
-            result |= memory_region_dispatch_read(mr, addr1, &val, l, attrs);
-            stn_p(buf, l, val);
+            result |= memory_region_dispatch_read(mr, addr1, &val,
+                                                  size_memop(l), attrs);
+            stn_he_p(buf, l, val);
          } else {
              /* RAM case */
              ptr = qemu_ram_ptr_length(mr->ram_block, addr1, &l, false);
@@ -3337,7 +3361,7 @@ MemTxResult flatview_read_continue(FlatView *fv, hwaddr addr,
  
  /* Called from RCU critical section.  */
  static MemTxResult flatview_read(FlatView *fv, hwaddr addr,
-                                 MemTxAttrs attrs, uint8_t *buf, int len)
+                                 MemTxAttrs attrs, uint8_t *buf, hwaddr len)
  {
      hwaddr l;
      hwaddr addr1;
@@ -3350,7 +3374,7 @@ static MemTxResult flatview_read(FlatView *fv, hwaddr addr,
  }
  
  MemTxResult address_space_read_full(AddressSpace *as, hwaddr addr,
-                                    MemTxAttrs attrs, uint8_t *buf, int len)
+                                    MemTxAttrs attrs, uint8_t *buf, hwaddr len)
  {
      MemTxResult result = MEMTX_OK;
      FlatView *fv;
@@ -3367,7 +3391,7 @@ MemTxResult address_space_read_full(AddressSpace *as, hwaddr addr,
  
  MemTxResult address_space_write(AddressSpace *as, hwaddr addr,
                                  MemTxAttrs attrs,
-                                const uint8_t *buf, int len)
+                                const uint8_t *buf, hwaddr len)
  {
      MemTxResult result = MEMTX_OK;
      FlatView *fv;
@@ -3383,7 +3407,7 @@ MemTxResult address_space_write(AddressSpace *as, hwaddr addr,
  }
  
  MemTxResult address_space_rw(AddressSpace *as, hwaddr addr, MemTxAttrs attrs,
-                             uint8_t *buf, int len, bool is_write)
+                             uint8_t *buf, hwaddr len, bool is_write)
  {
      if (is_write) {
          return address_space_write(as, addr, attrs, buf, len);
@@ -3393,7 +3417,7 @@ MemTxResult address_space_rw(AddressSpace *as, hwaddr addr, MemTxAttrs attrs,
  }
  
  void cpu_physical_memory_rw(hwaddr addr, uint8_t *buf,
-                            int len, int is_write)
+                            hwaddr len, int is_write)
  {
      address_space_rw(&address_space_memory, addr, MEMTXATTRS_UNSPECIFIED,
                       buf, len, is_write);
@@ -3408,7 +3432,7 @@ static inline MemTxResult address_space_write_rom_internal(AddressSpace *as,
                                                             hwaddr addr,
                                                             MemTxAttrs attrs,
                                                             const uint8_t *buf,
-                                                           int len,
+                                                           hwaddr len,
                                                             enum write_rom_type type)
  {
      hwaddr l;
@@ -3448,13 +3472,13 @@ static inline MemTxResult address_space_write_rom_internal(AddressSpace *as,
  /* used for ROM loading : can write in RAM and ROM */
  MemTxResult address_space_write_rom(AddressSpace *as, hwaddr addr,
                                      MemTxAttrs attrs,
-                                    const uint8_t *buf, int len)
+                                    const uint8_t *buf, hwaddr len)
  {
      return address_space_write_rom_internal(as, addr, attrs,
                                              buf, len, WRITE_DATA);
  }
  
-void cpu_flush_icache_range(hwaddr start, int len)
+void cpu_flush_icache_range(hwaddr start, hwaddr len)
  {
      /*
       * This function should do the same thing as an icache flush that was
@@ -3557,7 +3581,7 @@ static void cpu_notify_map_clients(void)
      qemu_mutex_unlock(&map_client_list_lock);
  }
  
-static bool flatview_access_valid(FlatView *fv, hwaddr addr, int len,
+static bool flatview_access_valid(FlatView *fv, hwaddr addr, hwaddr len,
                                    bool is_write, MemTxAttrs attrs)
  {
      MemoryRegion *mr;
@@ -3580,7 +3604,7 @@ static bool flatview_access_valid(FlatView *fv, hwaddr addr, int len,
  }
  
  bool address_space_access_valid(AddressSpace *as, hwaddr addr,
-                                int len, bool is_write,
+                                hwaddr len, bool is_write,
                                  MemTxAttrs attrs)
  {
      FlatView *fv;
@@ -3833,7 +3857,7 @@ static inline MemoryRegion *address_space_translate_cached(
   */
  void
  address_space_read_cached_slow(MemoryRegionCache *cache, hwaddr addr,
-                                   void *buf, int len)
+                                   void *buf, hwaddr len)
  {
      hwaddr addr1, l;
      MemoryRegion *mr;
@@ -3851,7 +3875,7 @@ address_space_read_cached_slow(MemoryRegionCache *cache, hwaddr addr,
   */
  void
  address_space_write_cached_slow(MemoryRegionCache *cache, hwaddr addr,
-                                    const void *buf, int len)
+                                    const void *buf, hwaddr len)
  {
      hwaddr addr1, l;
      MemoryRegion *mr;
@@ -3874,11 +3898,10 @@ address_space_write_cached_slow(MemoryRegionCache *cache, hwaddr addr,
  
  /* virtual memory access for debug (includes writing to ROM) */
  int cpu_memory_rw_debug(CPUState *cpu, target_ulong addr,
-                        uint8_t *buf, int len, int is_write)
+                        uint8_t *buf, target_ulong len, int is_write)
  {
-    int l;
      hwaddr phys_addr;
-    target_ulong page;
+    target_ulong l, page;
  
      cpu_synchronize_state(cpu);
      while (len > 0) {
@@ -3962,28 +3985,7 @@ int qemu_ram_foreach_block(RAMBlockIterFunc func, void *opaque)
  
      rcu_read_lock();
      RAMBLOCK_FOREACH(block) {
-        ret = func(block->idstr, block->host, block->offset,
-                   block->used_length, opaque);
-        if (ret) {
-            break;
-        }
-    }
-    rcu_read_unlock();
-    return ret;
-}
-
-int qemu_ram_foreach_migratable_block(RAMBlockIterFunc func, void *opaque)
-{
-    RAMBlock *block;
-    int ret = 0;
-
-    rcu_read_lock();
-    RAMBLOCK_FOREACH(block) {
-        if (!qemu_ram_is_migratable(block)) {
-            continue;
-        }
-        ret = func(block->idstr, block->host, block->offset,
-                   block->used_length, opaque);
+        ret = func(block, opaque);
          if (ret) {
              break;
          }
@@ -4109,42 +4111,41 @@ void page_size_init(void)
  
  #if !defined(CONFIG_USER_ONLY)
  
-static void mtree_print_phys_entries(fprintf_function mon, void *f,
-                                     int start, int end, int skip, int ptr)
+static void mtree_print_phys_entries(int start, int end, int skip, int ptr)
  {
      if (start == end - 1) {
-        mon(f, "\t%3d      ", start);
+        qemu_printf("\t%3d      ", start);
      } else {
-        mon(f, "\t%3d..%-3d ", start, end - 1);
+        qemu_printf("\t%3d..%-3d ", start, end - 1);
      }
-    mon(f, " skip=%d ", skip);
+    qemu_printf(" skip=%d ", skip);
      if (ptr == PHYS_MAP_NODE_NIL) {
-        mon(f, " ptr=NIL");
+        qemu_printf(" ptr=NIL");
      } else if (!skip) {
-        mon(f, " ptr=#%d", ptr);
+        qemu_printf(" ptr=#%d", ptr);
      } else {
-        mon(f, " ptr=[%d]", ptr);
+        qemu_printf(" ptr=[%d]", ptr);
      }
-    mon(f, "\n");
+    qemu_printf("\n");
  }
  
  #define MR_SIZE(size) (int128_nz(size) ? (hwaddr)int128_get64( \
                             int128_sub((size), int128_one())) : 0)
  
-void mtree_print_dispatch(fprintf_function mon, void *f,
-                          AddressSpaceDispatch *d, MemoryRegion *root)
+void mtree_print_dispatch(AddressSpaceDispatch *d, MemoryRegion *root)
  {
      int i;
  
-    mon(f, "  Dispatch\n");
-    mon(f, "    Physical sections\n");
+    qemu_printf("  Dispatch\n");
+    qemu_printf("    Physical sections\n");
  
      for (i = 0; i < d->map.sections_nb; ++i) {
          MemoryRegionSection *s = d->map.sections + i;
          const char *names[] = { " [unassigned]", " [not dirty]",
                                  " [ROM]", " [watch]" };
  
-        mon(f, "      #%d @" TARGET_FMT_plx ".." TARGET_FMT_plx " %s%s%s%s%s",
+        qemu_printf("      #%d @" TARGET_FMT_plx ".." TARGET_FMT_plx
+                    " %s%s%s%s%s",
              i,
              s->offset_within_address_space,
              s->offset_within_address_space + MR_SIZE(s->mr->size),
@@ -4155,20 +4156,20 @@ void mtree_print_dispatch(fprintf_function mon, void *f,
              s->mr->is_iommu ? " [iommu]" : "");
  
          if (s->mr->alias) {
-            mon(f, " alias=%s", s->mr->alias->name ?
+            qemu_printf(" alias=%s", s->mr->alias->name ?
                      s->mr->alias->name : "noname");
          }
-        mon(f, "\n");
+        qemu_printf("\n");
      }
  
-    mon(f, "    Nodes (%d bits per level, %d levels) ptr=[%d] skip=%d\n",
+    qemu_printf("    Nodes (%d bits per level, %d levels) ptr=[%d] skip=%d\n",
                 P_L2_BITS, P_L2_LEVELS, d->phys_map.ptr, d->phys_map.skip);
      for (i = 0; i < d->map.nodes_nb; ++i) {
          int j, jprev;
          PhysPageEntry prev;
          Node *n = d->map.nodes + i;
  
-        mon(f, "      [%d]\n", i);
+        qemu_printf("      [%d]\n", i);
  
          for (j = 0, jprev = 0, prev = *n[0]; j < ARRAY_SIZE(*n); ++j) {
              PhysPageEntry *pe = *n + j;
@@ -4177,14 +4178,14 @@ void mtree_print_dispatch(fprintf_function mon, void *f,
                  continue;
              }
  
-            mtree_print_phys_entries(mon, f, jprev, j, prev.skip, prev.ptr);
+            mtree_print_phys_entries(jprev, j, prev.skip, prev.ptr);
  
              jprev = j;
              prev = *pe;
          }
  
          if (jprev != ARRAY_SIZE(*n)) {
-            mtree_print_phys_entries(mon, f, jprev, j, prev.skip, prev.ptr);
+            mtree_print_phys_entries(jprev, j, prev.skip, prev.ptr);
          }
      }
  }