| /* |
| * Block driver for Hyper-V VHDX Images |
| * |
| * Copyright (c) 2013 Red Hat, Inc., |
| * |
| * Authors: |
| * Jeff Cody <jcody@redhat.com> |
| * |
| * This is based on the "VHDX Format Specification v1.00", published 8/25/2012 |
| * by Microsoft: |
| * https://www.microsoft.com/en-us/download/details.aspx?id=34750 |
| * |
| * This work is licensed under the terms of the GNU LGPL, version 2 or later. |
| * See the COPYING.LIB file in the top-level directory. |
| * |
| */ |
| |
| #ifndef BLOCK_VHDX_H |
| #define BLOCK_VHDX_H |
| |
/* Binary size units; every unit is 1024 times the one before it. */
#define KiB              1024
#define MiB              (1024 * KiB)
#define GiB              (1024 * MiB)
/* Widened to 64 bits before the last multiply, since 2^40 overflows an int */
#define TiB              (1024 * (uint64_t) GiB)

#define DEFAULT_LOG_SIZE (1024 * 1024) /* 1MiB */
| /* Structures and fields present in the VHDX file */ |
| |
| /* The header section has the following blocks, |
| * each block is 64KB: |
| * |
| * _____________________________________________________________________________ |
| * | File Id. | Header 1 | Header 2 | Region Table | Reserved (768KB) | |
| * |----------|---------------|------------|--------------|--------------------| |
| * | | | | | | |
| * 0.........64KB...........128KB........192KB..........256KB................1MB |
| */ |
| |
/* Every block of the header section is 64KB in size */
#define VHDX_HEADER_BLOCK_SIZE      (64 * 1024)

/* Byte offsets into the file, expressed as a count of 64KB header blocks */
#define VHDX_FILE_ID_OFFSET         0
#define VHDX_HEADER1_OFFSET         (1 * VHDX_HEADER_BLOCK_SIZE)
#define VHDX_HEADER2_OFFSET         (2 * VHDX_HEADER_BLOCK_SIZE)
#define VHDX_REGION_TABLE_OFFSET    (3 * VHDX_HEADER_BLOCK_SIZE)
#define VHDX_REGION_TABLE2_OFFSET   (4 * VHDX_HEADER_BLOCK_SIZE)

/* Offset at which the header section ends (1MB into the file) */
#define VHDX_HEADER_SECTION_END     (MiB * 1)
| /* |
| * A note on the use of MS-GUID fields. For more details on the GUID, |
| * please see: https://en.wikipedia.org/wiki/Globally_unique_identifier. |
| * |
| * The VHDX specification only states that these are MS GUIDs, and which |
| * bytes are data1-data4. It makes no mention of what algorithm should be used |
| * to generate the GUID, nor what standard. However, looking at the specified |
| * known GUID fields, it appears the GUIDs are: |
| * Standard/DCE GUID type (noted by 10b in the MSB of byte 0 of .data4) |
| * Random algorithm (noted by 0x4XXX for .data3) |
| */ |
| |
| /* ---- HEADER SECTION STRUCTURES ---- */ |
| |
| /* These structures are ones that are defined in the VHDX specification |
| * document */ |
| |
/* "vhdxfile" in ASCII */
#define VHDX_FILE_SIGNATURE 0x656C696678646876ULL

/* File identifier block found at the very start of a VHDX file */
typedef struct VHDXFileIdentifier {
    /* "vhdxfile" in ASCII */
    uint64_t    signature;
    /*
     * Optional; UTF-16 string that identifies the creator of the vhdx
     * file. Diagnostic only.
     */
    uint16_t    creator[256];
} VHDXFileIdentifier;
| |
| |
| /* the guid is a 16 byte unique ID - the definition for this used by |
| * Microsoft is not just 16 bytes though - it is a structure that is defined, |
| * so we need to follow it here so that endianness does not trip us up */ |
| |
| typedef struct QEMU_PACKED MSGUID { |
| uint32_t data1; |
| uint16_t data2; |
| uint16_t data3; |
| uint8_t data4[8]; |
| } MSGUID; |
| |
| #define guid_eq(a, b) \ |
| (memcmp(&(a), &(b), sizeof(MSGUID)) == 0) |
| |
| #define VHDX_HEADER_SIZE (4 * 1024) /* although the vhdx_header struct in disk |
| is only 582 bytes, for purposes of crc |
| the header is the first 4KB of the 64KB |
| block */ |
| |
| /* The full header is 4KB, although the actual header data is much smaller. |
| * But for the checksum calculation, it is over the entire 4KB structure, |
| * not just the defined portion of it */ |
| #define VHDX_HEADER_SIGNATURE 0x64616568 |
| typedef struct QEMU_PACKED VHDXHeader { |
| uint32_t signature; /* "head" in ASCII */ |
| uint32_t checksum; /* CRC-32C hash of the whole header */ |
| uint64_t sequence_number; /* Seq number of this header. Each |
| VHDX file has 2 of these headers, |
| and only the header with the highest |
| sequence number is valid */ |
| MSGUID file_write_guid; /* 128 bit unique identifier. Must be |
| updated to new, unique value before |
| the first modification is made to |
| file */ |
| MSGUID data_write_guid; /* 128 bit unique identifier. Must be |
| updated to new, unique value before |
| the first modification is made to |
| visible data. Visbile data is |
| defined as: |
| - system & user metadata |
| - raw block data |
| - disk size |
| - any change that will |
| cause the virtual disk |
| sector read to differ |
| |
| This does not need to change if |
| blocks are re-arranged */ |
| MSGUID log_guid; /* 128 bit unique identifier. If zero, |
| there is no valid log. If non-zero, |
| log entries with this guid are |
| valid. */ |
| uint16_t log_version; /* version of the log format. Must be |
| set to zero */ |
| uint16_t version; /* version of the vhdx file. Currently, |
| only supported version is "1" */ |
| uint32_t log_length; /* length of the log. Must be multiple |
| of 1MB */ |
| uint64_t log_offset; /* byte offset in the file of the log. |
| Must also be a multiple of 1MB */ |
| } VHDXHeader; |
| |
| /* Header for the region table block */ |
| #define VHDX_REGION_SIGNATURE 0x69676572 /* "regi" in ASCII */ |
| typedef struct QEMU_PACKED VHDXRegionTableHeader { |
| uint32_t signature; /* "regi" in ASCII */ |
| uint32_t checksum; /* CRC-32C hash of the 64KB table */ |
| uint32_t entry_count; /* number of valid entries */ |
| uint32_t reserved; |
| } VHDXRegionTableHeader; |
| |
| /* Individual region table entry. There may be a maximum of 2047 of these |
| * |
| * There are two known region table properties. Both are required. |
| * BAT (block allocation table): 2DC27766F62342009D64115E9BFD4A08 |
| * Metadata: 8B7CA20647904B9AB8FE575F050F886E |
| */ |
| #define VHDX_REGION_ENTRY_REQUIRED 0x01 /* if set, parser must understand |
| this entry in order to open |
| file */ |
| typedef struct QEMU_PACKED VHDXRegionTableEntry { |
| MSGUID guid; /* 128-bit unique identifier */ |
| uint64_t file_offset; /* offset of the object in the file. |
| Must be multiple of 1MB */ |
| uint32_t length; /* length, in bytes, of the object */ |
| uint32_t data_bits; |
| } VHDXRegionTableEntry; |
| |
| |
| /* ---- LOG ENTRY STRUCTURES ---- */ |
| #define VHDX_LOG_MIN_SIZE (1024 * 1024) |
| #define VHDX_LOG_SECTOR_SIZE 4096 |
| #define VHDX_LOG_HDR_SIZE 64 |
| #define VHDX_LOG_SIGNATURE 0x65676f6c |
| typedef struct QEMU_PACKED VHDXLogEntryHeader { |
| uint32_t signature; /* "loge" in ASCII */ |
| uint32_t checksum; /* CRC-32C hash of the 64KB table */ |
| uint32_t entry_length; /* length in bytes, multiple of 1MB */ |
| uint32_t tail; /* byte offset of first log entry of a |
| seq, where this entry is the last |
| entry */ |
| uint64_t sequence_number; /* incremented with each log entry. |
| May not be zero. */ |
| uint32_t descriptor_count; /* number of descriptors in this log |
| entry, must be >= 0 */ |
| uint32_t reserved; |
| MSGUID log_guid; /* value of the log_guid from |
| vhdx_header. If not found in |
| vhdx_header, it is invalid */ |
| uint64_t flushed_file_offset; /* see spec for full details - this |
| should be vhdx file size in bytes */ |
| uint64_t last_file_offset; /* size in bytes that all allocated |
| file structures fit into */ |
| } VHDXLogEntryHeader; |
| |
| #define VHDX_LOG_DESC_SIZE 32 |
| #define VHDX_LOG_DESC_SIGNATURE 0x63736564 |
| #define VHDX_LOG_ZERO_SIGNATURE 0x6f72657a |
| typedef struct QEMU_PACKED VHDXLogDescriptor { |
| uint32_t signature; /* "zero" or "desc" in ASCII */ |
| union { |
| uint32_t reserved; /* zero desc */ |
| uint32_t trailing_bytes; /* data desc: bytes 4092-4096 of the |
| data sector */ |
| }; |
| union { |
| uint64_t zero_length; /* zero desc: length of the section to |
| zero */ |
| uint64_t leading_bytes; /* data desc: bytes 0-7 of the data |
| sector */ |
| }; |
| uint64_t file_offset; /* file offset to write zeros - multiple |
| of 4kB */ |
| uint64_t sequence_number; /* must match same field in |
| vhdx_log_entry_header */ |
| } VHDXLogDescriptor; |
| |
| #define VHDX_LOG_DATA_SIGNATURE 0x61746164 |
| typedef struct QEMU_PACKED VHDXLogDataSector { |
| uint32_t data_signature; /* "data" in ASCII */ |
| uint32_t sequence_high; /* 4 MSB of 8 byte sequence_number */ |
| uint8_t data[4084]; /* raw data, bytes 8-4091 (inclusive). |
| see the data descriptor field for the |
| other mising bytes */ |
| uint32_t sequence_low; /* 4 LSB of 8 byte sequence_number */ |
| } VHDXLogDataSector; |
| |
| |
| |
/*
 * Block states. The set of valid state values differs depending on whether
 * the block is a payload block or a sector block.
 */

/* States of a payload block */
#define PAYLOAD_BLOCK_NOT_PRESENT           0
#define PAYLOAD_BLOCK_UNDEFINED             1
#define PAYLOAD_BLOCK_ZERO                  2
#define PAYLOAD_BLOCK_UNMAPPED              3
#define PAYLOAD_BLOCK_UNMAPPED_v095         5
#define PAYLOAD_BLOCK_FULLY_PRESENT         6
#define PAYLOAD_BLOCK_PARTIALLY_PRESENT     7

/* States of a sector block */
#define SB_BLOCK_NOT_PRESENT                0
#define SB_BLOCK_PRESENT                    6

/* per the spec */
#define VHDX_MAX_SECTORS_PER_BLOCK          (1 << 23)

/*
 * Layout of a BAT entry: the upper 44 bits are the file offset in 1MB
 * units, the lower 3 bits are the state, and the other bits are reserved.
 */
#define VHDX_BAT_STATE_BIT_MASK             0x07
#define VHDX_BAT_FILE_OFF_MASK              0xFFFFFFFFFFF00000ULL /* upper 44 bits */
typedef uint64_t VHDXBatEntry;
| |
| /* ---- METADATA REGION STRUCTURES ---- */ |
| |
| #define VHDX_METADATA_ENTRY_SIZE 32 |
| #define VHDX_METADATA_MAX_ENTRIES 2047 /* not including the header */ |
| #define VHDX_METADATA_TABLE_MAX_SIZE \ |
| (VHDX_METADATA_ENTRY_SIZE * (VHDX_METADATA_MAX_ENTRIES+1)) |
| #define VHDX_METADATA_SIGNATURE 0x617461646174656DULL /* "metadata" in ASCII */ |
| typedef struct QEMU_PACKED VHDXMetadataTableHeader { |
| uint64_t signature; /* "metadata" in ASCII */ |
| uint16_t reserved; |
| uint16_t entry_count; /* number table entries. <= 2047 */ |
| uint32_t reserved2[5]; |
| } VHDXMetadataTableHeader; |
| |
| #define VHDX_META_FLAGS_IS_USER 0x01 /* max 1024 entries */ |
| #define VHDX_META_FLAGS_IS_VIRTUAL_DISK 0x02 /* virtual disk metadata if set, |
| otherwise file metdata */ |
| #define VHDX_META_FLAGS_IS_REQUIRED 0x04 /* parse must understand this |
| entry to open the file */ |
| typedef struct QEMU_PACKED VHDXMetadataTableEntry { |
| MSGUID item_id; /* 128-bit identifier for metadata */ |
| uint32_t offset; /* byte offset of the metadata. At |
| least 64kB. Relative to start of |
| metadata region */ |
| /* note: if length = 0, so is offset */ |
| uint32_t length; /* length of metadata. <= 1MB. */ |
| uint32_t data_bits; /* least-significant 3 bits are flags, |
| the rest are reserved (see above) */ |
| uint32_t reserved2; |
| } VHDXMetadataTableEntry; |
| |
| #define VHDX_PARAMS_LEAVE_BLOCKS_ALLOCED 0x01 /* Do not change any blocks to |
| be BLOCK_NOT_PRESENT. |
| If set indicates a fixed |
| size VHDX file */ |
| #define VHDX_PARAMS_HAS_PARENT 0x02 /* has parent / backing file */ |
| #define VHDX_BLOCK_SIZE_MIN (1 * MiB) |
| #define VHDX_BLOCK_SIZE_MAX (256 * MiB) |
| typedef struct QEMU_PACKED VHDXFileParameters { |
| uint32_t block_size; /* size of each payload block, always |
| power of 2, <= 256MB and >= 1MB. */ |
| uint32_t data_bits; /* least-significant 2 bits are flags, |
| the rest are reserved (see above) */ |
| } VHDXFileParameters; |
| |
| #define VHDX_MAX_IMAGE_SIZE ((uint64_t) 64 * TiB) |
| typedef struct QEMU_PACKED VHDXVirtualDiskSize { |
| uint64_t virtual_disk_size; /* Size of the virtual disk, in bytes. |
| Must be multiple of the sector size, |
| max of 64TB */ |
| } VHDXVirtualDiskSize; |
| |
| typedef struct QEMU_PACKED VHDXPage83Data { |
| MSGUID page_83_data; /* unique id for scsi devices that |
| support page 0x83 */ |
| } VHDXPage83Data; |
| |
| typedef struct QEMU_PACKED VHDXVirtualDiskLogicalSectorSize { |
| uint32_t logical_sector_size; /* virtual disk sector size (in bytes). |
| Can only be 512 or 4096 bytes */ |
| } VHDXVirtualDiskLogicalSectorSize; |
| |
| typedef struct QEMU_PACKED VHDXVirtualDiskPhysicalSectorSize { |
| uint32_t physical_sector_size; /* physical sector size (in bytes). |
| Can only be 512 or 4096 bytes */ |
| } VHDXVirtualDiskPhysicalSectorSize; |
| |
| typedef struct QEMU_PACKED VHDXParentLocatorHeader { |
| MSGUID locator_type; /* type of the parent virtual disk. */ |
| uint16_t reserved; |
| uint16_t key_value_count; /* number of key/value pairs for this |
| locator */ |
| } VHDXParentLocatorHeader; |
| |
| /* key and value strings are UNICODE strings, UTF-16 LE encoding, no NULs */ |
| typedef struct QEMU_PACKED VHDXParentLocatorEntry { |
| uint32_t key_offset; /* offset in metadata for key, > 0 */ |
| uint32_t value_offset; /* offset in metadata for value, >0 */ |
| uint16_t key_length; /* length of entry key, > 0 */ |
| uint16_t value_length; /* length of entry value, > 0 */ |
| } VHDXParentLocatorEntry; |
| |
| |
| /* ----- END VHDX SPECIFICATION STRUCTURES ---- */ |
| |
| typedef struct VHDXMetadataEntries { |
| VHDXMetadataTableEntry file_parameters_entry; |
| VHDXMetadataTableEntry virtual_disk_size_entry; |
| VHDXMetadataTableEntry page83_data_entry; |
| VHDXMetadataTableEntry logical_sector_size_entry; |
| VHDXMetadataTableEntry phys_sector_size_entry; |
| VHDXMetadataTableEntry parent_locator_entry; |
| uint16_t present; |
| } VHDXMetadataEntries; |
| |
| typedef struct VHDXLogEntries { |
| uint64_t offset; |
| uint64_t length; |
| uint32_t write; |
| uint32_t read; |
| VHDXLogEntryHeader *hdr; |
| void *desc_buffer; |
| uint64_t sequence; |
| uint32_t tail; |
| } VHDXLogEntries; |
| |
| typedef struct VHDXRegionEntry { |
| uint64_t start; |
| uint64_t end; |
| QLIST_ENTRY(VHDXRegionEntry) entries; |
| } VHDXRegionEntry; |
| |
| typedef struct BDRVVHDXState { |
| CoMutex lock; |
| |
| int curr_header; |
| VHDXHeader *headers[2]; |
| |
| VHDXRegionTableHeader rt; |
| VHDXRegionTableEntry bat_rt; /* region table for the BAT */ |
| VHDXRegionTableEntry metadata_rt; /* region table for the metadata */ |
| |
| VHDXMetadataTableHeader metadata_hdr; |
| VHDXMetadataEntries metadata_entries; |
| |
| VHDXFileParameters params; |
| uint32_t block_size; |
| uint32_t block_size_bits; |
| uint32_t sectors_per_block; |
| uint32_t sectors_per_block_bits; |
| |
| uint64_t virtual_disk_size; |
| uint32_t logical_sector_size; |
| uint32_t physical_sector_size; |
| |
| uint64_t chunk_ratio; |
| uint32_t chunk_ratio_bits; |
| uint32_t logical_sector_size_bits; |
| |
| uint32_t bat_entries; |
| VHDXBatEntry *bat; |
| uint64_t bat_offset; |
| |
| bool first_visible_write; |
| MSGUID session_guid; |
| |
| VHDXLogEntries log; |
| |
| VHDXParentLocatorHeader parent_header; |
| VHDXParentLocatorEntry *parent_entries; |
| |
| Error *migration_blocker; |
| |
| bool log_replayed_on_open; |
| |
| QLIST_HEAD(VHDXRegionHead, VHDXRegionEntry) regions; |
| } BDRVVHDXState; |
| |
| void vhdx_guid_generate(MSGUID *guid); |
| |
| int vhdx_update_headers(BlockDriverState *bs, BDRVVHDXState *s, bool rw, |
| MSGUID *log_guid); |
| |
| uint32_t vhdx_update_checksum(uint8_t *buf, size_t size, int crc_offset); |
| uint32_t vhdx_checksum_calc(uint32_t crc, uint8_t *buf, size_t size, |
| int crc_offset); |
| |
| bool vhdx_checksum_is_valid(uint8_t *buf, size_t size, int crc_offset); |
| |
| int vhdx_parse_log(BlockDriverState *bs, BDRVVHDXState *s, bool *flushed, |
| Error **errp); |
| |
| int vhdx_log_write_and_flush(BlockDriverState *bs, BDRVVHDXState *s, |
| void *data, uint32_t length, uint64_t offset); |
| |
| static inline void leguid_to_cpus(MSGUID *guid) |
| { |
| le32_to_cpus(&guid->data1); |
| le16_to_cpus(&guid->data2); |
| le16_to_cpus(&guid->data3); |
| } |
| |
| static inline void cpu_to_leguids(MSGUID *guid) |
| { |
| cpu_to_le32s(&guid->data1); |
| cpu_to_le16s(&guid->data2); |
| cpu_to_le16s(&guid->data3); |
| } |
| |
| void vhdx_header_le_import(VHDXHeader *h); |
| void vhdx_header_le_export(VHDXHeader *orig_h, VHDXHeader *new_h); |
| void vhdx_log_desc_le_import(VHDXLogDescriptor *d); |
| void vhdx_log_desc_le_export(VHDXLogDescriptor *d); |
| void vhdx_log_data_le_import(VHDXLogDataSector *d); |
| void vhdx_log_data_le_export(VHDXLogDataSector *d); |
| void vhdx_log_entry_hdr_le_import(VHDXLogEntryHeader *hdr); |
| void vhdx_log_entry_hdr_le_export(VHDXLogEntryHeader *hdr); |
| void vhdx_region_header_le_import(VHDXRegionTableHeader *hdr); |
| void vhdx_region_header_le_export(VHDXRegionTableHeader *hdr); |
| void vhdx_region_entry_le_import(VHDXRegionTableEntry *e); |
| void vhdx_region_entry_le_export(VHDXRegionTableEntry *e); |
| void vhdx_metadata_header_le_import(VHDXMetadataTableHeader *hdr); |
| void vhdx_metadata_header_le_export(VHDXMetadataTableHeader *hdr); |
| void vhdx_metadata_entry_le_import(VHDXMetadataTableEntry *e); |
| void vhdx_metadata_entry_le_export(VHDXMetadataTableEntry *e); |
| int vhdx_user_visible_write(BlockDriverState *bs, BDRVVHDXState *s); |
| |
| #endif |