2 * Block driver for RAW files (win32)
4 * Copyright (c) 2006 Fabrice Bellard
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
25 #include "qemu/osdep.h"
26 #include "qapi/error.h"
27 #include "qemu/cutils.h"
28 #include "block/block_int.h"
29 #include "qemu/module.h"
30 #include "qemu/option.h"
31 #include "block/raw-aio.h"
33 #include "block/thread-pool.h"
35 #include "qapi/qmp/qdict.h"
36 #include "qapi/qmp/qstring.h"
42 #define FTYPE_HARDDISK 2
/*
 * Per-request state handed to the thread-pool worker (aio_worker).
 *
 * Only the aio_iov member (the struct iovec array of the request) is
 * visible here. The functions in this file also access hfile, aio_niov,
 * aio_nbytes, aio_offset and aio_type through this type, so those members
 * are presumably declared here as well -- TODO confirm against the full
 * definition.
 */
44 typedef struct RawWin32AIOData
{
47 struct iovec
*aio_iov
;
/*
 * Driver state stored in bs->opaque for both the file and host_device
 * drivers in this file.
 *
 * drive_path holds a drive root path; aio is the state object passed to the
 * win32_aio_* calls. The code in this file also uses s->hfile and s->type,
 * which are presumably declared in the part of the struct not visible here
 * -- TODO confirm.
 */
54 typedef struct BDRVRawState
{
57 char drive_path
[16]; /* format: "d:\" */
58 QEMUWin32AIOState
*aio
;
/*
 * Reads/writes the data to/from a given linear buffer.
 *
 * Returns the number of bytes handled or -errno in case of an error. Short
 * reads are only returned if the end of the file is reached.
 */
/*
 * Walks the I/O vector of the request and issues one ReadFile or WriteFile
 * call per element, choosing the direction from the QEMU_AIO_WRITE bit of
 * aio_type.
 *
 * NOTE(review): the declared return type is size_t, which cannot carry a
 * negative errno value. The statements that accumulate and return the byte
 * count are not visible in this excerpt -- verify how failures are reported.
 */
67 static size_t handle_aiocb_rw(RawWin32AIOData
*aiocb
)
72 for (i
= 0; i
< aiocb
->aio_niov
; i
++) {
74 DWORD ret
, ret_count
, len
;
/*
 * The file position is passed explicitly through the OVERLAPPED structure:
 * the low 32 bits go in Offset and the bits above 32 go in OffsetHigh.
 */
76 memset(&ov
, 0, sizeof(ov
));
77 ov
.Offset
= (aiocb
->aio_offset
+ offset
);
78 ov
.OffsetHigh
= (aiocb
->aio_offset
+ offset
) >> 32;
/* NOTE(review): len is a DWORD while iov_len is wider on 64-bit hosts. */
79 len
= aiocb
->aio_iov
[i
].iov_len
;
80 if (aiocb
->aio_type
& QEMU_AIO_WRITE
) {
81 ret
= WriteFile(aiocb
->hfile
, aiocb
->aio_iov
[i
].iov_base
,
82 len
, &ret_count
, &ov
);
84 ret
= ReadFile(aiocb
->hfile
, aiocb
->aio_iov
[i
].iov_base
,
85 len
, &ret_count
, &ov
);
/* Fewer bytes were transferred than this element asked for. */
90 if (ret_count
!= len
) {
/*
 * Thread-pool entry point for a request built by paio_submit. arg is the
 * RawWin32AIOData describing the request; the request kind is selected by
 * aio_type masked with QEMU_AIO_TYPE_MASK.
 *
 * The case labels, the assignments to the result and the release of the
 * request object are not visible in this excerpt. NOTE(review): when
 * checking the full body, make sure every exit path (including the failing
 * FlushFileBuffers branch) releases the request allocated with g_new in
 * paio_submit.
 */
100 static int aio_worker(void *arg
)
102 RawWin32AIOData
*aiocb
= arg
;
106 switch (aiocb
->aio_type
& QEMU_AIO_TYPE_MASK
) {
/* First transfer branch: a short count is zero-padded up to aio_nbytes. */
108 count
= handle_aiocb_rw(aiocb
);
109 if (count
< aiocb
->aio_nbytes
) {
110 /* A short read means that we have reached EOF. Pad the buffer
111 * with zeros for bytes after EOF. */
112 iov_memset(aiocb
->aio_iov
, aiocb
->aio_niov
, count
,
113 0, aiocb
->aio_nbytes
- count
);
115 count
= aiocb
->aio_nbytes
;
117 if (count
== aiocb
->aio_nbytes
) {
/* Second transfer branch: no padding, the count must match exactly. */
124 count
= handle_aiocb_rw(aiocb
);
125 if (count
== aiocb
->aio_nbytes
) {
/* Flush branch: asks the OS to write out buffered data for the handle. */
132 if (!FlushFileBuffers(aiocb
->hfile
)) {
/* Unknown request type: report it on stderr. */
137 fprintf(stderr
, "invalid aio request (0x%x)\n", aiocb
->aio_type
);
/*
 * Builds a RawWin32AIOData for the request and queues aio_worker on the
 * thread pool of the AioContext that bs belongs to.
 *
 * bs/hfile: node and Win32 handle the request operates on.
 * offset/count: byte offset and length of the request.
 * qiov: I/O vector of the request.
 * cb/opaque: completion callback and its argument, forwarded to
 *            thread_pool_submit_aio.
 * type: request kind stored in aio_type.
 *
 * Returns whatever thread_pool_submit_aio returns.
 *
 * NOTE(review): raw_aio_flush calls this with qiov == NULL, while the
 * visible statements dereference qiov. A NULL guard is expected around
 * them but is not visible in this excerpt -- confirm.
 * NOTE(review): count is an int although the read/write callers pass a
 * uint64_t byte count.
 */
146 static BlockAIOCB
*paio_submit(BlockDriverState
*bs
, HANDLE hfile
,
147 int64_t offset
, QEMUIOVector
*qiov
, int count
,
148 BlockCompletionFunc
*cb
, void *opaque
, int type
)
150 RawWin32AIOData
*acb
= g_new(RawWin32AIOData
, 1);
155 acb
->aio_type
= type
;
158 acb
->aio_iov
= qiov
->iov
;
159 acb
->aio_niov
= qiov
->niov
;
/* The vector must describe exactly count bytes. */
160 assert(qiov
->size
== count
);
162 acb
->aio_nbytes
= count
;
163 acb
->aio_offset
= offset
;
165 trace_file_paio_submit(acb
, opaque
, offset
, count
, type
);
166 pool
= aio_get_thread_pool(bdrv_get_aio_context(bs
));
167 return thread_pool_submit_aio(pool
, aio_worker
, acb
, cb
, opaque
);
/*
 * Sets the size of the file behind the C runtime descriptor fd to length
 * bytes using Win32 calls: remember the current file pointer, move the
 * pointer to length, call SetEndOfFile, then move the pointer back.
 *
 * The return statements are not visible in this excerpt, so the exact
 * success and failure values are not documented here.
 */
170 int qemu_ftruncate64(int fd
, int64_t length
)
/*
 * NOTE(review): presumably rejects lengths needing more than 32 bits on
 * Windows versions that report the high bit in GetVersion -- TODO confirm.
 */
178 if ((GetVersion() & 0x80000000UL
) && (length
>> 32) != 0)
181 h
= (HANDLE
)_get_osfhandle(fd
);
183 /* get the current position; ftruncate does not change the position */
185 li
.LowPart
= SetFilePointer (h
, 0, &li
.HighPart
, FILE_CURRENT
);
/*
 * INVALID_SET_FILE_POINTER can also be a valid low word, so it only counts
 * as a failure when GetLastError reports an error as well.
 */
186 if (li
.LowPart
== INVALID_SET_FILE_POINTER
&& GetLastError() != NO_ERROR
) {
191 dw
= SetFilePointer(h
, (DWORD
) length
, &high
, FILE_BEGIN
);
192 if (dw
== INVALID_SET_FILE_POINTER
&& GetLastError() != NO_ERROR
) {
195 res
= SetEndOfFile(h
);
197 /* back to old position */
198 SetFilePointer(h
, li
.LowPart
, &li
.HighPart
, FILE_BEGIN
);
202 static int set_sparse(int fd
)
205 return (int) DeviceIoControl((HANDLE
)_get_osfhandle(fd
), FSCTL_SET_SPARSE
,
206 NULL
, 0, NULL
, 0, &returned
, NULL
);
/*
 * Detaches the driver AIO state (s->aio) from the AioContext that bs is
 * currently bound to.
 *
 * NOTE(review): one statement between the declaration and the call is not
 * visible in this excerpt, presumably a check that s->aio is set -- confirm.
 */
209 static void raw_detach_aio_context(BlockDriverState
*bs
)
211 BDRVRawState
*s
= bs
->opaque
;
214 win32_aio_detach_aio_context(s
->aio
, bdrv_get_aio_context(bs
));
/*
 * Attaches the driver AIO state (s->aio) to new_context.
 *
 * NOTE(review): one statement between the declaration and the call is not
 * visible in this excerpt, presumably a check that s->aio is set -- confirm.
 */
218 static void raw_attach_aio_context(BlockDriverState
*bs
,
219 AioContext
*new_context
)
221 BDRVRawState
*s
= bs
->opaque
;
224 win32_aio_attach_aio_context(s
->aio
, new_context
);
228 static void raw_probe_alignment(BlockDriverState
*bs
, Error
**errp
)
230 BDRVRawState
*s
= bs
->opaque
;
231 DWORD sectorsPerCluster
, freeClusters
, totalClusters
, count
;
235 if (s
->type
== FTYPE_CD
) {
236 bs
->bl
.request_alignment
= 2048;
239 if (s
->type
== FTYPE_HARDDISK
) {
240 status
= DeviceIoControl(s
->hfile
, IOCTL_DISK_GET_DRIVE_GEOMETRY_EX
,
241 NULL
, 0, &dg
, sizeof(dg
), &count
, NULL
);
243 bs
->bl
.request_alignment
= dg
.Geometry
.BytesPerSector
;
246 /* try GetDiskFreeSpace too */
249 if (s
->drive_path
[0]) {
250 GetDiskFreeSpace(s
->drive_path
, §orsPerCluster
,
251 &dg
.Geometry
.BytesPerSector
,
252 &freeClusters
, &totalClusters
);
253 bs
->bl
.request_alignment
= dg
.Geometry
.BytesPerSector
;
257 /* XXX Does Windows support AIO on less than 512-byte alignment? */
258 bs
->bl
.request_alignment
= 512;
/*
 * Translates block-layer open flags into the values later passed to
 * CreateFile.
 *
 * flags: BDRV_O_* open flags.
 * use_aio: presumably selects FILE_FLAG_OVERLAPPED; the condition guarding
 *          that assignment is not visible in this excerpt -- confirm.
 * access_flags: out, GENERIC_READ plus GENERIC_WRITE when BDRV_O_RDWR is set.
 * overlapped: out, file attribute and flag bits. This parameter is used by
 *             the body; its declaration is on a signature line that is not
 *             visible in this excerpt.
 *
 * Both output pointers must be non-NULL (asserted).
 */
261 static void raw_parse_flags(int flags
, bool use_aio
, int *access_flags
,
264 assert(access_flags
!= NULL
);
265 assert(overlapped
!= NULL
);
267 if (flags
& BDRV_O_RDWR
) {
268 *access_flags
= GENERIC_READ
| GENERIC_WRITE
;
270 *access_flags
= GENERIC_READ
;
273 *overlapped
= FILE_ATTRIBUTE_NORMAL
;
275 *overlapped
|= FILE_FLAG_OVERLAPPED
;
/* BDRV_O_NOCACHE maps to unbuffered I/O on the handle. */
277 if (flags
& BDRV_O_NOCACHE
) {
278 *overlapped
|= FILE_FLAG_NO_BUFFERING
;
/*
 * Filename parser for the file driver: hands filename and options to
 * bdrv_parse_filename_strip_prefix together with the protocol prefix.
 * The remainder of the parameter list is not visible in this excerpt.
 */
282 static void raw_parse_filename(const char *filename
, QDict
*options
,
285 bdrv_parse_filename_strip_prefix(filename
, "file:", options
);
/*
 * Runtime options accepted when opening a node with the drivers in this
 * file. Two string options are described here; their names are not visible
 * in this excerpt but are presumably the ones looked up elsewhere in this
 * file with qemu_opt_get, namely filename and aio -- TODO confirm.
 */
288 static QemuOptsList raw_runtime_opts
= {
290 .head
= QTAILQ_HEAD_INITIALIZER(raw_runtime_opts
.head
),
294 .type
= QEMU_OPT_STRING
,
295 .help
= "File name of the image",
299 .type
= QEMU_OPT_STRING
,
300 .help
= "host AIO implementation (threads, native)",
302 { /* end of list */ }
/*
 * Reads the aio runtime option from opts and parses it as a
 * BlockdevAioOptions value. When the option is absent the default is
 * native if BDRV_O_NATIVE_AIO is set in flags and threads otherwise.
 *
 * Sets errp to an error for any value other than native or threads. The
 * returned values for the individual cases are not visible in this excerpt;
 * callers in this file treat the result as the use_aio flag.
 */
306 static bool get_aio_option(QemuOpts
*opts
, int flags
, Error
**errp
)
308 BlockdevAioOptions aio
, aio_default
;
310 aio_default
= (flags
& BDRV_O_NATIVE_AIO
) ? BLOCKDEV_AIO_OPTIONS_NATIVE
311 : BLOCKDEV_AIO_OPTIONS_THREADS
;
312 aio
= qapi_enum_parse(&BlockdevAioOptions_lookup
, qemu_opt_get(opts
, "aio"),
316 case BLOCKDEV_AIO_OPTIONS_NATIVE
:
318 case BLOCKDEV_AIO_OPTIONS_THREADS
:
321 error_setg(errp
, "Invalid AIO option");
/*
 * Open callback of the file driver.
 *
 * Visible steps: mark the node as a regular file, absorb the runtime
 * options, reject locking=on, read the filename and aio options, derive the
 * CreateFile flags, work out the drive root path, open the file with
 * CreateFile, set up native AIO and attach it to the node AioContext, and
 * advertise BDRV_REQ_ZERO_WRITE for truncation.
 *
 * The error exits, the condition under which native AIO is set up and the
 * return values are not visible in this excerpt.
 */
326 static int raw_open(BlockDriverState
*bs
, QDict
*options
, int flags
,
329 BDRVRawState
*s
= bs
->opaque
;
333 Error
*local_err
= NULL
;
334 const char *filename
;
338 s
->type
= FTYPE_FILE
;
340 opts
= qemu_opts_create(&raw_runtime_opts
, NULL
, 0, &error_abort
);
341 if (!qemu_opts_absorb_qdict(opts
, options
, errp
)) {
/* File locking is not implemented by this driver. */
346 if (qdict_get_try_bool(options
, "locking", false)) {
347 error_setg(errp
, "locking=on is not supported on Windows");
/*
 * NOTE(review): filename is indexed below without a visible NULL check;
 * presumably guaranteed by bdrv_needs_filename in the driver table -- confirm.
 */
352 filename
= qemu_opt_get(opts
, "filename");
354 use_aio
= get_aio_option(opts
, flags
, &local_err
);
356 error_propagate(errp
, local_err
);
361 raw_parse_flags(flags
, use_aio
, &access_flags
, &overlapped
);
/*
 * Derive the drive root used later for volume queries: a leading drive
 * letter is used directly, paths starting with two backslashes get no drive
 * path, and anything else takes the drive of the current directory.
 */
363 if (filename
[0] && filename
[1] == ':') {
364 snprintf(s
->drive_path
, sizeof(s
->drive_path
), "%c:\\", filename
[0]);
365 } else if (filename
[0] == '\\' && filename
[1] == '\\') {
366 s
->drive_path
[0] = 0;
/* NOTE(review): the result of GetCurrentDirectory is not checked here. */
370 GetCurrentDirectory(MAX_PATH
, buf
);
371 snprintf(s
->drive_path
, sizeof(s
->drive_path
), "%c:\\", buf
[0]);
/* The file must already exist; other openers may only read it. */
374 s
->hfile
= CreateFile(filename
, access_flags
,
375 FILE_SHARE_READ
, NULL
,
376 OPEN_EXISTING
, overlapped
, NULL
);
377 if (s
->hfile
== INVALID_HANDLE_VALUE
) {
378 int err
= GetLastError();
380 error_setg_win32(errp
, err
, "Could not open '%s'", filename
);
381 if (err
== ERROR_ACCESS_DENIED
) {
/* Native AIO setup; the handle is closed again when a step fails. */
390 s
->aio
= win32_aio_init();
391 if (s
->aio
== NULL
) {
392 CloseHandle(s
->hfile
);
393 error_setg(errp
, "Could not initialize AIO");
398 ret
= win32_aio_attach(s
->aio
, s
->hfile
);
400 win32_aio_cleanup(s
->aio
);
401 CloseHandle(s
->hfile
);
402 error_setg_errno(errp
, -ret
, "Could not enable AIO");
406 win32_aio_attach_aio_context(s
->aio
, bdrv_get_aio_context(bs
));
409 /* When extending regular files, we get zeros from the OS */
410 bs
->supported_truncate_flags
= BDRV_REQ_ZERO_WRITE
;
/*
 * Read callback: submits a QEMU_AIO_READ request for bytes bytes at offset
 * into qiov, completing through cb(opaque).
 *
 * Two submission paths exist: win32_aio_submit using s->aio, and
 * paio_submit using the thread pool. The condition that selects between
 * them is not visible in this excerpt (presumably whether s->aio is set --
 * confirm). flags is not used by the visible code.
 */
418 static BlockAIOCB
*raw_aio_preadv(BlockDriverState
*bs
,
419 uint64_t offset
, uint64_t bytes
,
420 QEMUIOVector
*qiov
, int flags
,
421 BlockCompletionFunc
*cb
, void *opaque
)
423 BDRVRawState
*s
= bs
->opaque
;
425 return win32_aio_submit(bs
, s
->aio
, s
->hfile
, offset
, bytes
, qiov
,
426 cb
, opaque
, QEMU_AIO_READ
);
428 return paio_submit(bs
, s
->hfile
, offset
, qiov
, bytes
,
429 cb
, opaque
, QEMU_AIO_READ
);
/*
 * Write callback: submits a QEMU_AIO_WRITE request for bytes bytes at
 * offset from qiov, completing through cb(opaque).
 *
 * Two submission paths exist: win32_aio_submit using s->aio, and
 * paio_submit using the thread pool. The condition that selects between
 * them is not visible in this excerpt (presumably whether s->aio is set --
 * confirm). flags is not used by the visible code.
 */
433 static BlockAIOCB
*raw_aio_pwritev(BlockDriverState
*bs
,
434 uint64_t offset
, uint64_t bytes
,
435 QEMUIOVector
*qiov
, int flags
,
436 BlockCompletionFunc
*cb
, void *opaque
)
438 BDRVRawState
*s
= bs
->opaque
;
440 return win32_aio_submit(bs
, s
->aio
, s
->hfile
, offset
, bytes
, qiov
,
441 cb
, opaque
, QEMU_AIO_WRITE
);
443 return paio_submit(bs
, s
->hfile
, offset
, qiov
, bytes
,
444 cb
, opaque
, QEMU_AIO_WRITE
);
448 static BlockAIOCB
*raw_aio_flush(BlockDriverState
*bs
,
449 BlockCompletionFunc
*cb
, void *opaque
)
451 BDRVRawState
*s
= bs
->opaque
;
452 return paio_submit(bs
, s
->hfile
, 0, NULL
, 0, cb
, opaque
, QEMU_AIO_FLUSH
);
/*
 * Close callback: detaches and releases the AIO state, closes the Win32
 * file handle and, for nodes opened with BDRV_O_TEMPORARY, removes the
 * file named by bs->filename.
 *
 * NOTE(review): the statement guarding the AIO teardown is not visible in
 * this excerpt, presumably a check that s->aio is set -- confirm.
 */
455 static void raw_close(BlockDriverState
*bs
)
457 BDRVRawState
*s
= bs
->opaque
;
460 win32_aio_detach_aio_context(s
->aio
, bdrv_get_aio_context(bs
));
461 win32_aio_cleanup(s
->aio
);
465 CloseHandle(s
->hfile
);
466 if (bs
->open_flags
& BDRV_O_TEMPORARY
) {
467 unlink(bs
->filename
);
/*
 * Truncate callback: resizes the file to offset bytes by moving the file
 * pointer of s->hfile to offset and calling SetEndOfFile.
 *
 * Only PREALLOC_MODE_OFF is accepted; any other mode sets errp. Failures of
 * SetFilePointer and SetEndOfFile are reported through errp with the Win32
 * error code. SetFilePointer only counts as failed when it returns
 * INVALID_SET_FILE_POINTER and GetLastError also reports an error.
 *
 * exact and flags are not used by the visible code. The computation of the
 * low and high words and the return values are not visible in this excerpt.
 */
471 static int coroutine_fn
raw_co_truncate(BlockDriverState
*bs
, int64_t offset
,
472 bool exact
, PreallocMode prealloc
,
473 BdrvRequestFlags flags
, Error
**errp
)
475 BDRVRawState
*s
= bs
->opaque
;
479 if (prealloc
!= PREALLOC_MODE_OFF
) {
480 error_setg(errp
, "Unsupported preallocation mode '%s'",
481 PreallocMode_str(prealloc
));
489 * An error has occurred if the return value is INVALID_SET_FILE_POINTER
490 * and GetLastError doesn't return NO_ERROR.
492 dwPtrLow
= SetFilePointer(s
->hfile
, low
, &high
, FILE_BEGIN
);
493 if (dwPtrLow
== INVALID_SET_FILE_POINTER
&& GetLastError() != NO_ERROR
) {
494 error_setg_win32(errp
, GetLastError(), "SetFilePointer error");
497 if (SetEndOfFile(s
->hfile
) == 0) {
498 error_setg_win32(errp
, GetLastError(), "SetEndOfFile error");
/*
 * Length callback. Three ways of obtaining the size are visible:
 * GetFileSize on the handle, the total size reported by GetDiskFreeSpaceEx
 * for the drive path, and the disk geometry ioctl. The selection between
 * them (presumably by s->type) and the return statements are not visible in
 * this excerpt -- confirm.
 *
 * NOTE(review): when reviewing the full body, check that the size variable
 * is always assigned before it is returned, including when the geometry
 * ioctl fails.
 */
504 static int64_t raw_getlength(BlockDriverState
*bs
)
506 BDRVRawState
*s
= bs
->opaque
;
508 ULARGE_INTEGER available
, total
, total_free
;
/*
 * A low word of 0xffffffff is only a failure when GetLastError reports an
 * error too, since it can also be a valid size.
 */
515 l
.LowPart
= GetFileSize(s
->hfile
, (PDWORD
)&l
.HighPart
);
516 if (l
.LowPart
== 0xffffffffUL
&& GetLastError() != NO_ERROR
)
520 if (!GetDiskFreeSpaceEx(s
->drive_path
, &available
, &total
, &total_free
))
522 l
.QuadPart
= total
.QuadPart
;
525 status
= DeviceIoControl(s
->hfile
, IOCTL_DISK_GET_DRIVE_GEOMETRY_EX
,
526 NULL
, 0, &dg
, sizeof(dg
), &count
, NULL
);
/*
 * Reports the allocated size of the file named by bs->filename.
 *
 * GetCompressedFileSizeA is looked up in kernel32 at run time. When it is
 * available and succeeds, the 64-bit value built from its high and low
 * words is returned. Otherwise the code falls back to _stati64; what is
 * returned on that path is not visible in this excerpt.
 */
537 static int64_t raw_get_allocated_file_size(BlockDriverState
*bs
)
539 typedef DWORD (WINAPI
* get_compressed_t
)(const char *filename
,
541 get_compressed_t get_compressed
;
543 const char *filename
= bs
->filename
;
544 /* WinNT supports GetCompressedFileSize to determine the allocated size */
546 (get_compressed_t
) GetProcAddress(GetModuleHandle("kernel32"),
547 "GetCompressedFileSizeA");
548 if (get_compressed
) {
550 low
= get_compressed(filename
, &high
);
/*
 * A low word of 0xFFFFFFFF is only an error when GetLastError reports one;
 * otherwise it is a legitimate part of the size.
 */
551 if (low
!= 0xFFFFFFFFlu
|| GetLastError() == NO_ERROR
) {
552 return (((int64_t) high
) << 32) + low
;
556 if (_stati64(filename
, &st
) < 0) {
562 static int raw_co_create(BlockdevCreateOptions
*options
, Error
**errp
)
564 BlockdevCreateOptionsFile
*file_opts
;
567 assert(options
->driver
== BLOCKDEV_DRIVER_FILE
);
568 file_opts
= &options
->u
.file
;
570 if (file_opts
->has_preallocation
) {
571 error_setg(errp
, "Preallocation is not supported on Windows");
574 if (file_opts
->has_nocow
) {
575 error_setg(errp
, "nocow is not supported on Windows");
579 fd
= qemu_open(file_opts
->filename
, O_WRONLY
| O_CREAT
| O_TRUNC
| O_BINARY
,
582 error_setg_errno(errp
, errno
, "Could not create file");
586 ftruncate(fd
, file_opts
->size
);
/*
 * Legacy create entry point: converts option-list based creation parameters
 * into a BlockdevCreateOptions value and delegates to raw_co_create.
 *
 * A leading protocol prefix is skipped in filename, the size option is read
 * (and removed) from opts and rounded up, and preallocation is explicitly
 * marked as not specified. The rounding granularity and the remaining
 * parameters of the signature are not visible in this excerpt.
 */
592 static int coroutine_fn
raw_co_create_opts(BlockDriver
*drv
,
593 const char *filename
,
597 BlockdevCreateOptions options
;
598 int64_t total_size
= 0;
/* filename is advanced past the prefix when it is present. */
600 strstart(filename
, "file:", &filename
);
602 /* Read out options */
603 total_size
= ROUND_UP(qemu_opt_get_size_del(opts
, BLOCK_OPT_SIZE
, 0),
606 options
= (BlockdevCreateOptions
) {
607 .driver
= BLOCKDEV_DRIVER_FILE
,
609 .filename
= (char *) filename
,
611 .has_preallocation
= false,
615 return raw_co_create(&options
, errp
);
/*
 * Creation options of the file driver: a single size-typed option named by
 * BLOCK_OPT_SIZE that gives the virtual disk size.
 */
618 static QemuOptsList raw_create_opts
= {
619 .name
= "raw-create-opts",
620 .head
= QTAILQ_HEAD_INITIALIZER(raw_create_opts
.head
),
623 .name
= BLOCK_OPT_SIZE
,
624 .type
= QEMU_OPT_SIZE
,
625 .help
= "Virtual disk size"
627 { /* end of list */ }
631 BlockDriver bdrv_file
= {
632 .format_name
= "file",
633 .protocol_name
= "file",
634 .instance_size
= sizeof(BDRVRawState
),
635 .bdrv_needs_filename
= true,
636 .bdrv_parse_filename
= raw_parse_filename
,
637 .bdrv_file_open
= raw_open
,
638 .bdrv_refresh_limits
= raw_probe_alignment
,
639 .bdrv_close
= raw_close
,
640 .bdrv_co_create_opts
= raw_co_create_opts
,
641 .bdrv_has_zero_init
= bdrv_has_zero_init_1
,
643 .bdrv_aio_preadv
= raw_aio_preadv
,
644 .bdrv_aio_pwritev
= raw_aio_pwritev
,
645 .bdrv_aio_flush
= raw_aio_flush
,
647 .bdrv_co_truncate
= raw_co_truncate
,
648 .bdrv_getlength
= raw_getlength
,
649 .bdrv_get_allocated_file_size
650 = raw_get_allocated_file_size
,
652 .create_opts
= &raw_create_opts
,
655 /***********************************************/
/*
 * Scans the logical drive strings of the system and writes a device name of
 * the form \\.\X: for a drive into cdrom_name (at most cdrom_name_size
 * bytes, via snprintf).
 *
 * The test applied to the drive type and the return values are not visible
 * in this excerpt; the caller in this file treats a negative result as
 * no drive found.
 */
658 static int find_cdrom(char *cdrom_name
, int cdrom_name_size
)
660 char drives
[256], *pdrv
= drives
;
/* Zero the buffer first so the scan below always finds a terminator. */
663 memset(drives
, 0, sizeof(drives
));
664 GetLogicalDriveStrings(sizeof(drives
), drives
);
/* The buffer holds consecutive NUL-terminated strings; empty string ends it. */
665 while(pdrv
[0] != '\0') {
666 type
= GetDriveType(pdrv
);
669 snprintf(cdrom_name
, cdrom_name_size
, "\\\\.\\%c:", pdrv
[0]);
/* Advance to the next drive string. */
673 pdrv
+= lstrlen(pdrv
) + 1;
/*
 * Classifies filename as one of the FTYPE_* device kinds.
 *
 * For names starting with the device prefix (with backslashes or forward
 * slashes), a PhysicalDrive name is a hard disk. Otherwise the character
 * after the prefix is taken as a drive letter, stored as the drive root in
 * s->drive_path, and classified through GetDriveType.
 *
 * Only part of the drive-type mapping and of the return statements is
 * visible in this excerpt.
 */
678 static int find_device_type(BlockDriverState
*bs
, const char *filename
)
680 BDRVRawState
*s
= bs
->opaque
;
684 if (strstart(filename
, "\\\\.\\", &p
) ||
685 strstart(filename
, "//./", &p
)) {
/* Case-insensitive match on the raw disk device name. */
686 if (stristart(p
, "PhysicalDrive", NULL
))
687 return FTYPE_HARDDISK
;
688 snprintf(s
->drive_path
, sizeof(s
->drive_path
), "%c:\\", p
[0]);
689 type
= GetDriveType(s
->drive_path
);
691 case DRIVE_REMOVABLE
:
693 return FTYPE_HARDDISK
;
/*
 * Probe callback of the host_device driver: recognises names that start
 * with /dev/cdrom and names accepted by is_windows_drive. The scores
 * returned for each case are not visible in this excerpt.
 */
704 static int hdev_probe_device(const char *filename
)
706 if (strstart(filename
, "/dev/cdrom", NULL
))
708 if (is_windows_drive(filename
))
/*
 * Filename parser for the host_device driver: hands filename and options to
 * bdrv_parse_filename_strip_prefix together with the protocol prefix.
 * The remainder of the parameter list is not visible in this excerpt.
 */
713 static void hdev_parse_filename(const char *filename
, QDict
*options
,
716 bdrv_parse_filename_strip_prefix(filename
, "host_device:", options
);
719 static void hdev_refresh_limits(BlockDriverState
*bs
, Error
**errp
)
721 /* XXX Does Windows support AIO on less than 512-byte alignment? */
722 bs
->bl
.request_alignment
= 512;
/*
 * Open callback of the host_device driver.
 *
 * Visible steps: absorb the runtime options, read the filename and aio
 * options (native AIO is rejected for host devices), map /dev/cdrom to a
 * drive found by find_cdrom, turn a bare drive letter into a device name,
 * classify the device, derive the CreateFile flags and open the device.
 *
 * The cleanup path and the return values are not visible in this excerpt.
 */
725 static int hdev_open(BlockDriverState
*bs
, QDict
*options
, int flags
,
728 BDRVRawState
*s
= bs
->opaque
;
729 int access_flags
, create_flags
;
732 char device_name
[64];
734 Error
*local_err
= NULL
;
735 const char *filename
;
738 QemuOpts
*opts
= qemu_opts_create(&raw_runtime_opts
, NULL
, 0,
740 if (!qemu_opts_absorb_qdict(opts
, options
, errp
)) {
745 filename
= qemu_opt_get(opts
, "filename");
/* A successfully parsed request for native AIO is turned into an error. */
747 use_aio
= get_aio_option(opts
, flags
, &local_err
);
748 if (!local_err
&& use_aio
) {
749 error_setg(&local_err
, "AIO is not supported on Windows host devices");
752 error_propagate(errp
, local_err
);
/* device_name receives the substituted name and must outlive filename. */
757 if (strstart(filename
, "/dev/cdrom", NULL
)) {
758 if (find_cdrom(device_name
, sizeof(device_name
)) < 0) {
759 error_setg(errp
, "Could not open CD-ROM drive");
763 filename
= device_name
;
765 /* transform drive letters into device name */
766 if (((filename
[0] >= 'a' && filename
[0] <= 'z') ||
767 (filename
[0] >= 'A' && filename
[0] <= 'Z')) &&
768 filename
[1] == ':' && filename
[2] == '\0') {
769 snprintf(device_name
, sizeof(device_name
), "\\\\.\\%c:", filename
[0]);
770 filename
= device_name
;
773 s
->type
= find_device_type(bs
, filename
);
775 raw_parse_flags(flags
, use_aio
, &access_flags
, &overlapped
);
/* Devices are never created; only an existing one can be opened. */
777 create_flags
= OPEN_EXISTING
;
779 s
->hfile
= CreateFile(filename
, access_flags
,
780 FILE_SHARE_READ
, NULL
,
781 create_flags
, overlapped
, NULL
);
782 if (s
->hfile
== INVALID_HANDLE_VALUE
) {
783 int err
= GetLastError();
785 if (err
== ERROR_ACCESS_DENIED
) {
790 error_setg_errno(errp
, -ret
, "Could not open device");
799 static BlockDriver bdrv_host_device
= {
800 .format_name
= "host_device",
801 .protocol_name
= "host_device",
802 .instance_size
= sizeof(BDRVRawState
),
803 .bdrv_needs_filename
= true,
804 .bdrv_parse_filename
= hdev_parse_filename
,
805 .bdrv_probe_device
= hdev_probe_device
,
806 .bdrv_file_open
= hdev_open
,
807 .bdrv_close
= raw_close
,
808 .bdrv_refresh_limits
= hdev_refresh_limits
,
810 .bdrv_aio_preadv
= raw_aio_preadv
,
811 .bdrv_aio_pwritev
= raw_aio_pwritev
,
812 .bdrv_aio_flush
= raw_aio_flush
,
814 .bdrv_detach_aio_context
= raw_detach_aio_context
,
815 .bdrv_attach_aio_context
= raw_attach_aio_context
,
817 .bdrv_getlength
= raw_getlength
,
818 .has_variable_length
= true,
820 .bdrv_get_allocated_file_size
821 = raw_get_allocated_file_size
,
824 static void bdrv_file_init(void)
826 bdrv_register(&bdrv_file
);
827 bdrv_register(&bdrv_host_device
);
830 block_init(bdrv_file_init
);