qcow2: add option to clean unused cache entries after some time

[qemu.git] / block / qed.h
diff --git a/block/qed.h b/block/qed.h

index 6d49a4de5593e17d13efada9902b6e16dda9847e..615e676fc87a967a851f9c06019e696873bbfe5d 100644 (file)
--- a/block/qed.h
+++ b/block/qed.h
@@ -15,7 +15,7 @@
  #ifndef BLOCK_QED_H
  #define BLOCK_QED_H
  
-#include "block_int.h"
+#include "block/block_int.h"
  
  /* The layout of a QED file is as follows:
   *
@@ -43,18 +43,22 @@
   *
   * All fields are little-endian on disk.
   */
-
+#define  QED_DEFAULT_CLUSTER_SIZE  65536
  enum {
      QED_MAGIC = 'Q' | 'E' << 8 | 'D' << 16 | '\0' << 24,
  
      /* The image supports a backing file */
      QED_F_BACKING_FILE = 0x01,
  
+    /* The image needs a consistency check before use */
+    QED_F_NEED_CHECK = 0x02,
+
      /* The backing file format must not be probed, treat as raw image */
      QED_F_BACKING_FORMAT_NO_PROBE = 0x04,
  
      /* Feature bits must be used when the on-disk format changes */
      QED_FEATURE_MASK = QED_F_BACKING_FILE | /* supported feature bits */
+                       QED_F_NEED_CHECK |
                         QED_F_BACKING_FORMAT_NO_PROBE,
      QED_COMPAT_FEATURE_MASK = 0,            /* supported compat feature bits */
      QED_AUTOCLEAR_FEATURE_MASK = 0,         /* supported autoclear feature bits */
@@ -65,7 +69,6 @@ enum {
       */
      QED_MIN_CLUSTER_SIZE = 4 * 1024, /* in bytes */
      QED_MAX_CLUSTER_SIZE = 64 * 1024 * 1024,
-    QED_DEFAULT_CLUSTER_SIZE = 64 * 1024,
  
      /* Allocated clusters are tracked using a 2-level pagetable.  Table size is
       * a multiple of clusters so large maximum image sizes can be supported
@@ -74,6 +77,9 @@ enum {
      QED_MIN_TABLE_SIZE = 1,        /* in clusters */
      QED_MAX_TABLE_SIZE = 16,
      QED_DEFAULT_TABLE_SIZE = 4,
+
+    /* Delay to flush and clean image after last allocating write completes */
+    QED_NEED_CHECK_TIMEOUT = 5,    /* in seconds */
  };
  
  typedef struct {
@@ -93,7 +99,7 @@ typedef struct {
      /* if (features & QED_F_BACKING_FILE) */
      uint32_t backing_filename_offset; /* in bytes from start of header */
      uint32_t backing_filename_size;   /* in bytes */
-} QEDHeader;
+} QEMU_PACKED QEDHeader;
  
  typedef struct {
      uint64_t offsets[0];            /* in bytes */
@@ -116,6 +122,34 @@ typedef struct QEDRequest {
      CachedL2Table *l2_table;
  } QEDRequest;
  
+enum {
+    QED_AIOCB_WRITE = 0x0001,       /* read or write? */
+    QED_AIOCB_ZERO  = 0x0002,       /* zero write, used with QED_AIOCB_WRITE */
+};
+
+typedef struct QEDAIOCB {
+    BlockAIOCB common;
+    QEMUBH *bh;
+    int bh_ret;                     /* final return status for completion bh */
+    QSIMPLEQ_ENTRY(QEDAIOCB) next;  /* next request */
+    int flags;                      /* QED_AIOCB_* bits ORed together */
+    uint64_t end_pos;               /* request end on block device, in bytes */
+
+    /* User scatter-gather list */
+    QEMUIOVector *qiov;
+    size_t qiov_offset;             /* byte count already processed */
+
+    /* Current cluster scatter-gather list */
+    QEMUIOVector cur_qiov;
+    QEMUIOVector *backing_qiov;
+    uint64_t cur_pos;               /* position on block device, in bytes */
+    uint64_t cur_cluster;           /* cluster offset in image file */
+    unsigned int cur_nclusters;     /* number of clusters being accessed */
+    int find_cluster_ret;           /* used for L1/L2 update */
+
+    QEDRequest request;
+} QEDAIOCB;
+
  typedef struct {
      BlockDriverState *bs;           /* device */
      uint64_t file_size;             /* length of image file, in bytes */
@@ -127,10 +161,18 @@ typedef struct {
      uint32_t l1_shift;
      uint32_t l2_shift;
      uint32_t l2_mask;
+
+    /* Allocating write request queue */
+    QSIMPLEQ_HEAD(, QEDAIOCB) allocating_write_reqs;
+    bool allocating_write_reqs_plugged;
+
+    /* Periodic flush and clear need check flag */
+    QEMUTimer *need_check_timer;
  } BDRVQEDState;
  
  enum {
      QED_CLUSTER_FOUND,         /* cluster found */
+    QED_CLUSTER_ZERO,          /* zero cluster found */
      QED_CLUSTER_L2,            /* cluster missing in L2 */
      QED_CLUSTER_L1,            /* cluster missing in L1 */
  };
@@ -160,13 +202,18 @@ typedef void QEDFindClusterFunc(void *opaque, int ret, uint64_t offset, size_t l
   * Generic callback for chaining async callbacks
   */
  typedef struct {
-    BlockDriverCompletionFunc *cb;
+    BlockCompletionFunc *cb;
      void *opaque;
  } GenericCB;
  
-void *gencb_alloc(size_t len, BlockDriverCompletionFunc *cb, void *opaque);
+void *gencb_alloc(size_t len, BlockCompletionFunc *cb, void *opaque);
  void gencb_complete(void *opaque, int ret);
  
+/**
+ * Header functions
+ */
+int qed_write_header_sync(BDRVQEDState *s);
+
  /**
   * L2 cache functions
   */
@@ -182,16 +229,16 @@ void qed_commit_l2_cache_entry(L2TableCache *l2_cache, CachedL2Table *l2_table);
   */
  int qed_read_l1_table_sync(BDRVQEDState *s);
  void qed_write_l1_table(BDRVQEDState *s, unsigned int index, unsigned int n,
-                        BlockDriverCompletionFunc *cb, void *opaque);
+                        BlockCompletionFunc *cb, void *opaque);
  int qed_write_l1_table_sync(BDRVQEDState *s, unsigned int index,
                              unsigned int n);
  int qed_read_l2_table_sync(BDRVQEDState *s, QEDRequest *request,
                             uint64_t offset);
  void qed_read_l2_table(BDRVQEDState *s, QEDRequest *request, uint64_t offset,
-                       BlockDriverCompletionFunc *cb, void *opaque);
+                       BlockCompletionFunc *cb, void *opaque);
  void qed_write_l2_table(BDRVQEDState *s, QEDRequest *request,
                          unsigned int index, unsigned int n, bool flush,
-                        BlockDriverCompletionFunc *cb, void *opaque);
+                        BlockCompletionFunc *cb, void *opaque);
  int qed_write_l2_table_sync(BDRVQEDState *s, QEDRequest *request,
                              unsigned int index, unsigned int n, bool flush);
  
@@ -221,7 +268,7 @@ static inline uint64_t qed_offset_into_cluster(BDRVQEDState *s, uint64_t offset)
      return offset & (s->header.cluster_size - 1);
  }
  
-static inline unsigned int qed_bytes_to_clusters(BDRVQEDState *s, size_t bytes)
+static inline uint64_t qed_bytes_to_clusters(BDRVQEDState *s, uint64_t bytes)
  {
      return qed_start_of_cluster(s, bytes + (s->header.cluster_size - 1)) /
             (s->header.cluster_size - 1);
@@ -268,4 +315,29 @@ static inline bool qed_check_table_offset(BDRVQEDState *s, uint64_t offset)
             qed_check_cluster_offset(s, end_offset);
  }
  
+static inline bool qed_offset_is_cluster_aligned(BDRVQEDState *s,
+                                                 uint64_t offset)
+{
+    if (qed_offset_into_cluster(s, offset)) {
+        return false;
+    }
+    return true;
+}
+
+static inline bool qed_offset_is_unalloc_cluster(uint64_t offset)
+{
+    if (offset == 0) {
+        return true;
+    }
+    return false;
+}
+
+static inline bool qed_offset_is_zero_cluster(uint64_t offset)
+{
+    if (offset == 1) {
+        return true;
+    }
+    return false;
+}
+
  #endif /* BLOCK_QED_H */