2 * Block driver for Hyper-V VHDX Images
4 * Copyright (c) 2013 Red Hat, Inc.,
7 * Jeff Cody <jcody@redhat.com>
9 * This is based on the "VHDX Format Specification v1.00", published 8/25/2012
11 * https://www.microsoft.com/en-us/download/details.aspx?id=34750
13 * This file covers the functionality of the metadata log writing, parsing, and
16 * This work is licensed under the terms of the GNU LGPL, version 2 or later.
17 * See the COPYING.LIB file in the top-level directory.
21 #include "qemu/osdep.h"
22 #include "qapi/error.h"
23 #include "block/block_int.h"
24 #include "qemu/error-report.h"
25 #include "qemu/bswap.h"
29 typedef struct VHDXLogSequence
{
33 VHDXLogEntryHeader hdr
;
36 typedef struct VHDXLogDescEntries
{
37 VHDXLogEntryHeader hdr
;
38 VHDXLogDescriptor desc
[];
41 static const MSGUID zero_guid
= { 0 };
43 /* The log located on the disk is a circular buffer containing
44 * sectors of 4096 bytes each.
46 * It is assumed for the read/write functions below that the
47 * circular buffer scheme uses a 'one sector open' to indicate
48 * the buffer is full. Given the validation methods used for each
49 * sector, this method should be compatible with other methods that
50 * do not waste a sector.
54 /* Allow peeking at the hdr entry at the beginning of the current
55 * read index, without advancing the read index */
56 static int vhdx_log_peek_hdr(BlockDriverState
*bs
, VHDXLogEntries
*log
,
57 VHDXLogEntryHeader
*hdr
)
65 /* peek is only supported on sector boundaries */
66 if (log
->read
% VHDX_LOG_SECTOR_SIZE
) {
72 /* we are guaranteed that a) log sectors are 4096 bytes,
73 * and b) the log length is a multiple of 1MB. So, there
74 * is always a round number of sectors in the buffer */
75 if ((read
+ sizeof(VHDXLogEntryHeader
)) > log
->length
) {
79 if (read
== log
->write
) {
84 offset
= log
->offset
+ read
;
86 ret
= bdrv_pread(bs
->file
, offset
, hdr
, sizeof(VHDXLogEntryHeader
));
90 vhdx_log_entry_hdr_le_import(hdr
);
96 /* Index increment for log, based on sector boundaries */
97 static int vhdx_log_inc_idx(uint32_t idx
, uint64_t length
)
99 idx
+= VHDX_LOG_SECTOR_SIZE
;
100 /* we are guaranteed that a) log sectors are 4096 bytes,
101 * and b) the log length is a multiple of 1MB. So, there
102 * is always a round number of sectors in the buffer */
103 return idx
>= length
? 0 : idx
;
107 /* Reset the log to empty */
108 static void vhdx_log_reset(BlockDriverState
*bs
, BDRVVHDXState
*s
)
111 s
->log
.read
= s
->log
.write
= 0;
112 /* a log guid of 0 indicates an empty log to any parser of v0
114 vhdx_update_headers(bs
, s
, false, &guid
);
117 /* Reads num_sectors from the log (all log sectors are 4096 bytes),
118 * into buffer 'buffer'. Upon return, *sectors_read will contain
119 * the number of sectors successfully read.
121 * It is assumed that 'buffer' is already allocated, and of sufficient
122 * size (i.e. >= 4096*num_sectors).
124 * If 'peek' is true, then the tail (read) pointer for the circular buffer is
127 * 0 is returned on success, -errno otherwise. */
128 static int vhdx_log_read_sectors(BlockDriverState
*bs
, VHDXLogEntries
*log
,
129 uint32_t *sectors_read
, void *buffer
,
130 uint32_t num_sectors
, bool peek
)
139 while (num_sectors
) {
140 if (read
== log
->write
) {
144 offset
= log
->offset
+ read
;
146 ret
= bdrv_pread(bs
->file
, offset
, buffer
, VHDX_LOG_SECTOR_SIZE
);
150 read
= vhdx_log_inc_idx(read
, log
->length
);
152 *sectors_read
= *sectors_read
+ 1;
163 /* Writes num_sectors to the log (all log sectors are 4096 bytes),
164 * from buffer 'buffer'. Upon return, *sectors_written will contain
165 * the number of sectors successfully written.
167 * It is assumed that 'buffer' is at least 4096*num_sectors large.
169 * 0 is returned on success, -errno otherwise */
170 static int vhdx_log_write_sectors(BlockDriverState
*bs
, VHDXLogEntries
*log
,
171 uint32_t *sectors_written
, void *buffer
,
172 uint32_t num_sectors
)
178 BDRVVHDXState
*s
= bs
->opaque
;
180 ret
= vhdx_user_visible_write(bs
, s
);
188 while (num_sectors
) {
190 offset
= log
->offset
+ write
;
191 write
= vhdx_log_inc_idx(write
, log
->length
);
192 if (write
== log
->read
) {
196 ret
= bdrv_pwrite(bs
->file
, offset
, buffer_tmp
,
197 VHDX_LOG_SECTOR_SIZE
);
201 buffer_tmp
+= VHDX_LOG_SECTOR_SIZE
;
204 *sectors_written
= *sectors_written
+ 1;
213 /* Validates a log entry header */
214 static bool vhdx_log_hdr_is_valid(VHDXLogEntries
*log
, VHDXLogEntryHeader
*hdr
,
219 if (hdr
->signature
!= VHDX_LOG_SIGNATURE
) {
223 /* if the individual entry length is larger than the whole log
224 * buffer, that is obviously invalid */
225 if (log
->length
< hdr
->entry_length
) {
229 /* length of entire entry must be in units of 4KB (log sector size) */
230 if (hdr
->entry_length
% (VHDX_LOG_SECTOR_SIZE
)) {
234 /* per spec, sequence # must be > 0 */
235 if (hdr
->sequence_number
== 0) {
239 /* log entries are only valid if they match the file-wide log guid
240 * found in the active header */
241 if (!guid_eq(hdr
->log_guid
, s
->headers
[s
->curr_header
]->log_guid
)) {
245 if (hdr
->descriptor_count
* sizeof(VHDXLogDescriptor
) > hdr
->entry_length
) {
256 * Given a log header, this will validate the descriptors and the
257 * corresponding data sectors (if applicable)
259 * Validation consists of:
260 * 1. Making sure the sequence number matches the entry header
261 * 2. Verifying a valid signature ('zero' or 'desc' for descriptors)
262 * 3. File offset field is a multiple of 4KB
263 * 4. If a data descriptor, the corresponding data sector
264 * has its signature ('data') and matching sequence number
266 * @desc: the data buffer containing the descriptor
267 * @hdr: the log entry header
269 * Returns true if valid
271 static bool vhdx_log_desc_is_valid(VHDXLogDescriptor
*desc
,
272 VHDXLogEntryHeader
*hdr
)
276 if (desc
->sequence_number
!= hdr
->sequence_number
) {
279 if (desc
->file_offset
% VHDX_LOG_SECTOR_SIZE
) {
283 if (desc
->signature
== VHDX_LOG_ZERO_SIGNATURE
) {
284 if (desc
->zero_length
% VHDX_LOG_SECTOR_SIZE
== 0) {
288 } else if (desc
->signature
== VHDX_LOG_DESC_SIGNATURE
) {
298 /* Prior to sector data for a log entry, there is the header
299 * and the descriptors referenced in the header:
303 * [ hdr, desc ][ desc ][ ... ][ data ][ ... ]
305 * The first sector in a log entry has a 64 byte header, and
306 * up to 126 32-byte descriptors. If more descriptors than
307 * 126 are required, then subsequent sectors can have up to 128
308 * descriptors. Each sector is 4KB. Data follows the descriptor
311 * This will return the number of sectors needed to encompass
312 * the passed number of descriptors in desc_cnt.
314 * This will never return 0, even if desc_cnt is 0.
316 static int vhdx_compute_desc_sectors(uint32_t desc_cnt
)
318 uint32_t desc_sectors
;
320 desc_cnt
+= 2; /* account for header in first sector */
321 desc_sectors
= desc_cnt
/ 128;
322 if (desc_cnt
% 128) {
330 /* Reads the log header, and subsequent descriptors (if any). This
331 * will allocate all the space for buffer, which must be NULL when
332 * passed into this function. Each descriptor will also be validated,
333 * and error returned if any are invalid. */
334 static int vhdx_log_read_desc(BlockDriverState
*bs
, BDRVVHDXState
*s
,
335 VHDXLogEntries
*log
, VHDXLogDescEntries
**buffer
,
339 uint32_t desc_sectors
;
340 uint32_t sectors_read
;
341 VHDXLogEntryHeader hdr
;
342 VHDXLogDescEntries
*desc_entries
= NULL
;
343 VHDXLogDescriptor desc
;
346 assert(*buffer
== NULL
);
348 ret
= vhdx_log_peek_hdr(bs
, log
, &hdr
);
353 if (vhdx_log_hdr_is_valid(log
, &hdr
, s
) == false) {
358 desc_sectors
= vhdx_compute_desc_sectors(hdr
.descriptor_count
);
359 desc_entries
= qemu_try_blockalign(bs
->file
->bs
,
360 desc_sectors
* VHDX_LOG_SECTOR_SIZE
);
361 if (desc_entries
== NULL
) {
366 ret
= vhdx_log_read_sectors(bs
, log
, §ors_read
, desc_entries
,
367 desc_sectors
, false);
371 if (sectors_read
!= desc_sectors
) {
376 /* put in proper endianness, and validate each desc */
377 for (i
= 0; i
< hdr
.descriptor_count
; i
++) {
378 desc
= desc_entries
->desc
[i
];
379 vhdx_log_desc_le_import(&desc
);
380 if (convert_endian
) {
381 desc_entries
->desc
[i
] = desc
;
383 if (vhdx_log_desc_is_valid(&desc
, &hdr
) == false) {
388 if (convert_endian
) {
389 desc_entries
->hdr
= hdr
;
392 *buffer
= desc_entries
;
396 qemu_vfree(desc_entries
);
402 /* Flushes the descriptor described by desc to the VHDX image file.
403 * If the descriptor is a data descriptor, then 'data' must be non-NULL,
404 * and >= 4096 bytes (VHDX_LOG_SECTOR_SIZE), containing the data to be
407 * Verification is performed to make sure the sequence numbers of a data
408 * descriptor match the sequence number in the desc.
410 * For a zero descriptor, it may describe multiple sectors to fill with zeroes.
411 * In this case, it should be noted that zeroes are written to disk, and the
412 * image file is not extended as a sparse file. */
413 static int vhdx_log_flush_desc(BlockDriverState
*bs
, VHDXLogDescriptor
*desc
,
414 VHDXLogDataSector
*data
)
417 uint64_t seq
, file_offset
;
423 buffer
= qemu_blockalign(bs
, VHDX_LOG_SECTOR_SIZE
);
425 if (desc
->signature
== VHDX_LOG_DESC_SIGNATURE
) {
432 /* The sequence number of the data sector must match that
433 * in the descriptor */
434 seq
= data
->sequence_high
;
436 seq
|= data
->sequence_low
& 0xffffffff;
438 if (seq
!= desc
->sequence_number
) {
443 /* Each data sector is in total 4096 bytes, however the first
444 * 8 bytes, and last 4 bytes, are located in the descriptor */
445 memcpy(buffer
, &desc
->leading_bytes
, 8);
448 memcpy(buffer
+offset
, data
->data
, 4084);
451 memcpy(buffer
+offset
, &desc
->trailing_bytes
, 4);
453 } else if (desc
->signature
== VHDX_LOG_ZERO_SIGNATURE
) {
454 /* write 'count' sectors of zeroes */
455 memset(buffer
, 0, VHDX_LOG_SECTOR_SIZE
);
456 count
= desc
->zero_length
/ VHDX_LOG_SECTOR_SIZE
;
458 error_report("Invalid VHDX log descriptor entry signature 0x%" PRIx32
,
464 file_offset
= desc
->file_offset
;
466 /* count is only > 1 if we are writing zeroes */
467 for (i
= 0; i
< count
; i
++) {
468 ret
= bdrv_pwrite_sync(bs
->file
, file_offset
, buffer
,
469 VHDX_LOG_SECTOR_SIZE
);
473 file_offset
+= VHDX_LOG_SECTOR_SIZE
;
481 /* Flush the entire log (as described by 'logs') to the VHDX image
482 * file, and then set the log to 'empty' status once complete.
484 * The log entries should be validated prior to flushing */
485 static int vhdx_log_flush(BlockDriverState
*bs
, BDRVVHDXState
*s
,
486 VHDXLogSequence
*logs
)
490 uint32_t cnt
, sectors_read
;
491 uint64_t new_file_size
;
494 VHDXLogDescEntries
*desc_entries
= NULL
;
495 VHDXLogEntryHeader hdr_tmp
= { 0 };
499 data
= qemu_blockalign(bs
, VHDX_LOG_SECTOR_SIZE
);
501 ret
= vhdx_user_visible_write(bs
, s
);
506 /* each iteration represents one log sequence, which may span multiple
509 ret
= vhdx_log_peek_hdr(bs
, &logs
->log
, &hdr_tmp
);
513 file_length
= bdrv_getlength(bs
->file
->bs
);
514 if (file_length
< 0) {
518 /* if the log shows a FlushedFileOffset larger than our current file
519 * size, then that means the file has been truncated / corrupted, and
520 * we must refuse to open it / use it */
521 if (hdr_tmp
.flushed_file_offset
> file_length
) {
526 ret
= vhdx_log_read_desc(bs
, s
, &logs
->log
, &desc_entries
, true);
531 for (i
= 0; i
< desc_entries
->hdr
.descriptor_count
; i
++) {
532 if (desc_entries
->desc
[i
].signature
== VHDX_LOG_DESC_SIGNATURE
) {
533 /* data sector, so read a sector to flush */
534 ret
= vhdx_log_read_sectors(bs
, &logs
->log
, §ors_read
,
539 if (sectors_read
!= 1) {
543 vhdx_log_data_le_import(data
);
546 ret
= vhdx_log_flush_desc(bs
, &desc_entries
->desc
[i
], data
);
551 if (file_length
< desc_entries
->hdr
.last_file_offset
) {
552 new_file_size
= desc_entries
->hdr
.last_file_offset
;
553 if (new_file_size
% (1 * MiB
)) {
554 /* round up to nearest 1MB boundary */
555 new_file_size
= QEMU_ALIGN_UP(new_file_size
, MiB
);
556 if (new_file_size
> INT64_MAX
) {
560 ret
= bdrv_truncate(bs
->file
, new_file_size
, false,
561 PREALLOC_MODE_OFF
, 0, NULL
);
567 qemu_vfree(desc_entries
);
571 ret
= bdrv_flush(bs
);
575 /* once the log is fully flushed, indicate that we have an empty log
576 * now. This also sets the log guid to 0, to indicate an empty log */
577 vhdx_log_reset(bs
, s
);
581 qemu_vfree(desc_entries
);
585 static int vhdx_validate_log_entry(BlockDriverState
*bs
, BDRVVHDXState
*s
,
586 VHDXLogEntries
*log
, uint64_t seq
,
587 bool *valid
, VHDXLogEntryHeader
*entry
)
590 VHDXLogEntryHeader hdr
;
592 uint32_t i
, desc_sectors
, total_sectors
, crc
;
593 uint32_t sectors_read
= 0;
594 VHDXLogDescEntries
*desc_buffer
= NULL
;
598 ret
= vhdx_log_peek_hdr(bs
, log
, &hdr
);
603 if (vhdx_log_hdr_is_valid(log
, &hdr
, s
) == false) {
608 if (hdr
.sequence_number
!= seq
+ 1) {
613 desc_sectors
= vhdx_compute_desc_sectors(hdr
.descriptor_count
);
615 /* Read all log sectors, and calculate log checksum */
617 total_sectors
= hdr
.entry_length
/ VHDX_LOG_SECTOR_SIZE
;
620 /* read_desc() will increment the read idx */
621 ret
= vhdx_log_read_desc(bs
, s
, log
, &desc_buffer
, false);
626 crc
= vhdx_checksum_calc(0xffffffff, (void *)desc_buffer
,
627 desc_sectors
* VHDX_LOG_SECTOR_SIZE
, 4);
630 buffer
= qemu_blockalign(bs
, VHDX_LOG_SECTOR_SIZE
);
631 if (total_sectors
> desc_sectors
) {
632 for (i
= 0; i
< total_sectors
- desc_sectors
; i
++) {
634 ret
= vhdx_log_read_sectors(bs
, log
, §ors_read
, buffer
,
636 if (ret
< 0 || sectors_read
!= 1) {
639 crc
= vhdx_checksum_calc(crc
, buffer
, VHDX_LOG_SECTOR_SIZE
, -1);
644 if (crc
!= hdr
.checksum
) {
653 log
->read
= vhdx_log_inc_idx(log
->read
, log
->length
);
657 qemu_vfree(desc_buffer
);
661 /* Search through the log circular buffer, and find the valid, active
662 * log sequence, if any exists
664 static int vhdx_log_search(BlockDriverState
*bs
, BDRVVHDXState
*s
,
665 VHDXLogSequence
*logs
)
669 bool seq_valid
= false;
670 VHDXLogSequence candidate
= { 0 };
671 VHDXLogEntryHeader hdr
= { 0 };
672 VHDXLogEntries curr_log
;
674 memcpy(&curr_log
, &s
->log
, sizeof(VHDXLogEntries
));
675 curr_log
.write
= curr_log
.length
; /* assume log is full */
679 /* now we will go through the whole log sector by sector, until
680 * we find a valid, active log sequence, or reach the end of the
683 uint64_t curr_seq
= 0;
684 VHDXLogSequence current
= { 0 };
686 tail
= curr_log
.read
;
688 ret
= vhdx_validate_log_entry(bs
, s
, &curr_log
, curr_seq
,
695 current
.valid
= true;
696 current
.log
= curr_log
;
697 current
.log
.read
= tail
;
698 current
.log
.write
= curr_log
.read
;
704 ret
= vhdx_validate_log_entry(bs
, s
, &curr_log
, curr_seq
,
709 if (seq_valid
== false) {
712 current
.log
.write
= curr_log
.read
;
715 curr_seq
= hdr
.sequence_number
;
720 if (candidate
.valid
== false ||
721 current
.hdr
.sequence_number
> candidate
.hdr
.sequence_number
) {
726 if (curr_log
.read
< tail
) {
733 if (candidate
.valid
) {
734 /* this is the next sequence number, for writes */
735 s
->log
.sequence
= candidate
.hdr
.sequence_number
+ 1;
743 /* Parse the replay log. Per the VHDX spec, if the log is present
744 * it must be replayed prior to opening the file, even read-only.
746 * If read-only, we must replay the log in RAM (or refuse to open
747 * a dirty VHDX file read-only) */
748 int vhdx_parse_log(BlockDriverState
*bs
, BDRVVHDXState
*s
, bool *flushed
,
753 VHDXLogSequence logs
= { 0 };
755 hdr
= s
->headers
[s
->curr_header
];
759 /* s->log.hdr is freed in vhdx_close() */
760 if (s
->log
.hdr
== NULL
) {
761 s
->log
.hdr
= qemu_blockalign(bs
, sizeof(VHDXLogEntryHeader
));
764 s
->log
.offset
= hdr
->log_offset
;
765 s
->log
.length
= hdr
->log_length
;
767 if (s
->log
.offset
< VHDX_LOG_MIN_SIZE
||
768 s
->log
.offset
% VHDX_LOG_MIN_SIZE
) {
773 /* per spec, only log version of 0 is supported */
774 if (hdr
->log_version
!= 0) {
779 /* If either the log guid, or log length is zero,
780 * then a replay log is not present */
781 if (guid_eq(hdr
->log_guid
, zero_guid
)) {
785 if (hdr
->log_length
== 0) {
789 if (hdr
->log_length
% VHDX_LOG_MIN_SIZE
) {
795 /* The log is present, we need to find if and where there is an active
796 * sequence of valid entries present in the log. */
798 ret
= vhdx_log_search(bs
, s
, &logs
);
804 if (bdrv_is_read_only(bs
)) {
805 bdrv_refresh_filename(bs
);
808 "VHDX image file '%s' opened read-only, but "
809 "contains a log that needs to be replayed",
811 error_append_hint(errp
, "To replay the log, run:\n"
812 "qemu-img check -r all '%s'\n",
816 /* now flush the log */
817 ret
= vhdx_log_flush(bs
, s
, &logs
);
831 static void vhdx_log_raw_to_le_sector(VHDXLogDescriptor
*desc
,
832 VHDXLogDataSector
*sector
, void *data
,
835 /* 8 + 4084 + 4 = 4096, 1 log sector */
836 memcpy(&desc
->leading_bytes
, data
, 8);
838 desc
->leading_bytes
= cpu_to_le64(desc
->leading_bytes
);
839 memcpy(sector
->data
, data
, 4084);
841 memcpy(&desc
->trailing_bytes
, data
, 4);
842 desc
->trailing_bytes
= cpu_to_le32(desc
->trailing_bytes
);
845 sector
->sequence_high
= (uint32_t) (seq
>> 32);
846 sector
->sequence_low
= (uint32_t) (seq
& 0xffffffff);
847 sector
->data_signature
= VHDX_LOG_DATA_SIGNATURE
;
849 vhdx_log_desc_le_export(desc
);
850 vhdx_log_data_le_export(sector
);
854 static int vhdx_log_write(BlockDriverState
*bs
, BDRVVHDXState
*s
,
855 void *data
, uint32_t length
, uint64_t offset
)
859 void *merged_sector
= NULL
;
860 void *data_tmp
, *sector_write
;
863 uint32_t desc_sectors
, sectors
, total_length
;
864 uint32_t sectors_written
= 0;
865 uint32_t aligned_length
;
866 uint32_t leading_length
= 0;
867 uint32_t trailing_length
= 0;
868 uint32_t partial_sectors
= 0;
869 uint32_t bytes_written
= 0;
870 uint64_t file_offset
;
873 VHDXLogEntryHeader new_hdr
;
874 VHDXLogDescriptor
*new_desc
= NULL
;
875 VHDXLogDataSector
*data_sector
= NULL
;
876 MSGUID new_guid
= { 0 };
878 header
= s
->headers
[s
->curr_header
];
880 /* need to have offset read data, and be on 4096 byte boundary */
882 if (length
> header
->log_length
) {
883 /* no log present. we could create a log here instead of failing */
888 if (guid_eq(header
->log_guid
, zero_guid
)) {
889 vhdx_guid_generate(&new_guid
);
890 vhdx_update_headers(bs
, s
, false, &new_guid
);
892 /* currently, we require that the log be flushed after
898 /* 0 is an invalid sequence number, but may also represent the first
899 * log write (or a wrapped seq) */
900 if (s
->log
.sequence
== 0) {
904 sector_offset
= offset
% VHDX_LOG_SECTOR_SIZE
;
905 file_offset
= QEMU_ALIGN_DOWN(offset
, VHDX_LOG_SECTOR_SIZE
);
907 aligned_length
= length
;
909 /* add in the unaligned head and tail bytes */
911 leading_length
= (VHDX_LOG_SECTOR_SIZE
- sector_offset
);
912 leading_length
= leading_length
> length
? length
: leading_length
;
913 aligned_length
-= leading_length
;
917 sectors
= aligned_length
/ VHDX_LOG_SECTOR_SIZE
;
918 trailing_length
= aligned_length
- (sectors
* VHDX_LOG_SECTOR_SIZE
);
919 if (trailing_length
) {
923 sectors
+= partial_sectors
;
925 file_length
= bdrv_getlength(bs
->file
->bs
);
926 if (file_length
< 0) {
931 /* sectors is now how many sectors the data itself takes, not
932 * including the header and descriptor metadata */
934 new_hdr
= (VHDXLogEntryHeader
) {
935 .signature
= VHDX_LOG_SIGNATURE
,
937 .sequence_number
= s
->log
.sequence
,
938 .descriptor_count
= sectors
,
940 .flushed_file_offset
= file_length
,
941 .last_file_offset
= file_length
,
942 .log_guid
= header
->log_guid
,
946 desc_sectors
= vhdx_compute_desc_sectors(new_hdr
.descriptor_count
);
948 total_length
= (desc_sectors
+ sectors
) * VHDX_LOG_SECTOR_SIZE
;
949 new_hdr
.entry_length
= total_length
;
951 vhdx_log_entry_hdr_le_export(&new_hdr
);
953 buffer
= qemu_blockalign(bs
, total_length
);
954 memcpy(buffer
, &new_hdr
, sizeof(new_hdr
));
956 new_desc
= buffer
+ sizeof(new_hdr
);
957 data_sector
= buffer
+ (desc_sectors
* VHDX_LOG_SECTOR_SIZE
);
960 /* All log sectors are 4KB, so for any partial sectors we must
961 * merge the data with preexisting data from the final file
963 merged_sector
= qemu_blockalign(bs
, VHDX_LOG_SECTOR_SIZE
);
965 for (i
= 0; i
< sectors
; i
++) {
966 new_desc
->signature
= VHDX_LOG_DESC_SIGNATURE
;
967 new_desc
->sequence_number
= s
->log
.sequence
;
968 new_desc
->file_offset
= file_offset
;
970 if (i
== 0 && leading_length
) {
971 /* partial sector at the front of the buffer */
972 ret
= bdrv_pread(bs
->file
, file_offset
, merged_sector
,
973 VHDX_LOG_SECTOR_SIZE
);
977 memcpy(merged_sector
+ sector_offset
, data_tmp
, leading_length
);
978 bytes_written
= leading_length
;
979 sector_write
= merged_sector
;
980 } else if (i
== sectors
- 1 && trailing_length
) {
981 /* partial sector at the end of the buffer */
982 ret
= bdrv_pread(bs
->file
,
984 merged_sector
+ trailing_length
,
985 VHDX_LOG_SECTOR_SIZE
- trailing_length
);
989 memcpy(merged_sector
, data_tmp
, trailing_length
);
990 bytes_written
= trailing_length
;
991 sector_write
= merged_sector
;
993 bytes_written
= VHDX_LOG_SECTOR_SIZE
;
994 sector_write
= data_tmp
;
997 /* populate the raw sector data into the proper structures,
998 * as well as update the descriptor, and convert to proper
1000 vhdx_log_raw_to_le_sector(new_desc
, data_sector
, sector_write
,
1003 data_tmp
+= bytes_written
;
1006 file_offset
+= VHDX_LOG_SECTOR_SIZE
;
1009 /* checksum covers entire entry, from the log header through the
1010 * last data sector */
1011 vhdx_update_checksum(buffer
, total_length
,
1012 offsetof(VHDXLogEntryHeader
, checksum
));
1014 /* now write to the log */
1015 ret
= vhdx_log_write_sectors(bs
, &s
->log
, §ors_written
, buffer
,
1016 desc_sectors
+ sectors
);
1021 if (sectors_written
!= desc_sectors
+ sectors
) {
1022 /* instead of failing, we could flush the log here */
1028 /* write new tail */
1029 s
->log
.tail
= s
->log
.write
;
1033 qemu_vfree(merged_sector
);
1037 /* Perform a log write, and then immediately flush the entire log */
1038 int vhdx_log_write_and_flush(BlockDriverState
*bs
, BDRVVHDXState
*s
,
1039 void *data
, uint32_t length
, uint64_t offset
)
1042 VHDXLogSequence logs
= { .valid
= true,
1047 /* Make sure data written (new and/or changed blocks) is stable
1048 * on disk, before creating log entry */
1049 ret
= bdrv_flush(bs
);
1054 ret
= vhdx_log_write(bs
, s
, data
, length
, offset
);
1060 /* Make sure log is stable on disk */
1061 ret
= bdrv_flush(bs
);
1066 ret
= vhdx_log_flush(bs
, s
, &logs
);