Merge remote-tracking branch 'remotes/pmaydell/tags/pull-target-arm-20190903' into...

[qemu.git] / include / exec / ram_addr.h
diff --git a/include/exec/ram_addr.h b/include/exec/ram_addr.h

index 9ecd911c3e78ec93d4a4ce33044ee15689257f28..a327a80cfe1387a900b6989dc06694d31a30b719 100644 (file)
--- a/include/exec/ram_addr.h
+++ b/include/exec/ram_addr.h
@@ -20,7 +20,9 @@
  #define RAM_ADDR_H
  
  #ifndef CONFIG_USER_ONLY
+#include "cpu.h"
  #include "hw/xen/xen.h"
+#include "sysemu/tcg.h"
  #include "exec/ramlist.h"
  
  struct RAMBlock {
@@ -50,8 +52,70 @@ struct RAMBlock {
      unsigned long *unsentmap;
      /* bitmap of already received pages in postcopy */
      unsigned long *receivedmap;
+
+    /*
+     * bitmap to track pending clears of the dirty bitmap.  When a bit
+     * is set, the corresponding memory chunk still needs a log-clear.
+     * Set this up to non-NULL to enable the capability to postpone
+     * and split clearing of dirty bitmap on the remote node (e.g.,
+     * KVM).  The bitmap will be set only when doing global sync.
+     *
+     * NOTE: this bitmap differs from the other bitmaps in that one
+     * bit can represent multiple guest pages (the number is decided
+     * by the `clear_bmap_shift' field below).  On the destination
+     * side, this should always be NULL, and the field
+     * `clear_bmap_shift' is meaningless.
+     */
+    unsigned long *clear_bmap;
+    uint8_t clear_bmap_shift;
  };
  
+/**
+ * clear_bmap_size: calculate clear bitmap size
+ *
+ * @pages: number of guest pages
+ * @shift: guest page number shift; one bit covers (1UL << @shift) pages
+ *
+ * Returns: number of bits for the clear bitmap, i.e. @pages divided by
+ * (1UL << @shift) via DIV_ROUND_UP
+ */
+static inline long clear_bmap_size(uint64_t pages, uint8_t shift)
+{
+    return DIV_ROUND_UP(pages, 1UL << shift);
+}
+
+/**
+ * clear_bmap_set: set clear bitmap for the page range
+ *
+ * @rb: the ramblock to operate on
+ * @start: the start page number
+ * @npages: number of pages to set in the bitmap
+ *
+ * Sets clear_bmap_size(@npages, shift) bits starting at bit
+ * (@start >> shift), where shift is @rb->clear_bmap_shift.
+ *
+ * NOTE(review): the bit count is computed from @npages alone, so a
+ * @start that is not a multiple of (1 << shift) pages may leave the
+ * last touched chunk unmarked -- confirm callers pass aligned ranges.
+ *
+ * Returns: None
+ */
+static inline void clear_bmap_set(RAMBlock *rb, uint64_t start,
+                                  uint64_t npages)
+{
+    uint8_t shift = rb->clear_bmap_shift;
+
+    bitmap_set_atomic(rb->clear_bmap, start >> shift,
+                      clear_bmap_size(npages, shift));
+}
+
+/**
+ * clear_bmap_test_and_clear: test clear bitmap for the page, clear if set
+ *
+ * @rb: the ramblock to operate on
+ * @page: the page number to check
+ *
+ * The bit examined is (@page >> @rb->clear_bmap_shift), so it may be
+ * shared with other pages of the same chunk.
+ *
+ * Returns: true if the bit was set, false otherwise
+ */
+static inline bool clear_bmap_test_and_clear(RAMBlock *rb, uint64_t page)
+{
+    uint8_t shift = rb->clear_bmap_shift;
+
+    return bitmap_test_and_clear_atomic(rb->clear_bmap, page >> shift, 1);
+}
+
  static inline bool offset_in_ramblock(RAMBlock *b, ram_addr_t offset)
  {
      return (b && b->host && offset < b->used_length) ? true : false;
@@ -73,7 +137,8 @@ static inline unsigned long int ramblock_recv_bitmap_offset(void *host_addr,
  
  bool ramblock_is_pmem(RAMBlock *rb);
  
-long qemu_getrampagesize(void);
+long qemu_minrampagesize(void);
+long qemu_maxrampagesize(void);
  
  /**
   * qemu_ram_alloc_from_file,
@@ -347,8 +412,13 @@ static inline void cpu_physical_memory_set_dirty_lebitmap(unsigned long *bitmap,
              if (bitmap[k]) {
                  unsigned long temp = leul_to_cpu(bitmap[k]);
  
-                atomic_or(&blocks[DIRTY_MEMORY_MIGRATION][idx][offset], temp);
                  atomic_or(&blocks[DIRTY_MEMORY_VGA][idx][offset], temp);
+
+                if (global_dirty_log) {
+                    atomic_or(&blocks[DIRTY_MEMORY_MIGRATION][idx][offset],
+                              temp);
+                }
+
                  if (tcg_enabled()) {
                      atomic_or(&blocks[DIRTY_MEMORY_CODE][idx][offset], temp);
                  }
@@ -365,6 +435,11 @@ static inline void cpu_physical_memory_set_dirty_lebitmap(unsigned long *bitmap,
          xen_hvm_modified_memory(start, pages << TARGET_PAGE_BITS);
      } else {
          uint8_t clients = tcg_enabled() ? DIRTY_CLIENTS_ALL : DIRTY_CLIENTS_NOCODE;
+
+        if (!global_dirty_log) {
+            clients &= ~(1 << DIRTY_MEMORY_MIGRATION);
+        }
+
          /*
           * bitmap-traveling is faster than memory-traveling (for addr...)
           * especially when most of the memory is not dirty.
@@ -392,7 +467,7 @@ bool cpu_physical_memory_test_and_clear_dirty(ram_addr_t start,
                                                unsigned client);
  
  DirtyBitmapSnapshot *cpu_physical_memory_snapshot_and_clear_dirty
-    (ram_addr_t start, ram_addr_t length, unsigned client);
+    (MemoryRegion *mr, hwaddr offset, hwaddr length, unsigned client);
  
  bool cpu_physical_memory_snapshot_get_dirty(DirtyBitmapSnapshot *snap,
                                              ram_addr_t start,
@@ -407,6 +482,7 @@ static inline void cpu_physical_memory_clear_dirty_range(ram_addr_t start,
  }
  
  
+/* Called within an RCU read-side critical section */
  static inline
  uint64_t cpu_physical_memory_sync_dirty_bitmap(RAMBlock *rb,
                                                 ram_addr_t start,
@@ -430,8 +506,6 @@ uint64_t cpu_physical_memory_sync_dirty_bitmap(RAMBlock *rb,
                                          DIRTY_MEMORY_BLOCK_SIZE);
          unsigned long page = BIT_WORD(start >> TARGET_PAGE_BITS);
  
-        rcu_read_lock();
-
          src = atomic_rcu_read(
                  &ram_list.dirty_memory[DIRTY_MEMORY_MIGRATION])->blocks;
  
@@ -452,7 +526,18 @@ uint64_t cpu_physical_memory_sync_dirty_bitmap(RAMBlock *rb,
              }
          }
  
-        rcu_read_unlock();
+        if (rb->clear_bmap) {
+            /*
+             * Postpone the dirty bitmap clear to the point just before
+             * we really send the pages; the clear will also be split
+             * into smaller chunks.
+             */
+            clear_bmap_set(rb, start >> TARGET_PAGE_BITS,
+                           length >> TARGET_PAGE_BITS);
+        } else {
+            /* Slow path - still clear the dirty bitmap in one huge chunk */
+            memory_region_clear_dirty_bitmap(rb->mr, start, length);
+        }
      } else {
          ram_addr_t offset = rb->offset;