/*
 *  xen paravirt block device backend
 *
 *  (c) Gerd Hoffmann <kraxel@redhat.com>
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; under version 2 of the License.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License along
 *  with this program; if not, see <http://www.gnu.org/licenses/>.
 */
29 #include <sys/ioctl.h>
30 #include <sys/types.h>
37 #include <xen/io/xenbus.h>
40 #include "block_int.h"
41 #include "qemu-char.h"
42 #include "xen_blkif.h"
43 #include "xen_backend.h"
/* ------------------------------------------------------------- */

/*
 * File-scope tunables.  Only max_requests is read in the visible part of
 * this file (as the upper bound for requests_total and requests_inflight);
 * the other three are declared here with their initial values.
 */
static int syncwrite    = 0;
static int batch_maps   = 0;
static int max_requests = 32;
static int use_aio      = 1;

/* ------------------------------------------------------------- */

/* Sector size in bytes; byte offsets are divided by it to obtain sectors. */
#define BLOCK_SIZE  512
#define IOCB_COUNT  (BLKIF_MAX_SEGMENTS_PER_REQUEST + 2)
70 uint32_t domids
[BLKIF_MAX_SEGMENTS_PER_REQUEST
];
71 uint32_t refs
[BLKIF_MAX_SEGMENTS_PER_REQUEST
];
73 void *page
[BLKIF_MAX_SEGMENTS_PER_REQUEST
];
80 struct XenBlkDev
*blkdev
;
81 QLIST_ENTRY(ioreq
) list
;
86 struct XenDevice xendev
; /* must be first */
92 const char *fileproto
;
99 blkif_back_rings_t rings
;
104 QLIST_HEAD(inflight_head
, ioreq
) inflight
;
105 QLIST_HEAD(finished_head
, ioreq
) finished
;
106 QLIST_HEAD(freelist_head
, ioreq
) freelist
;
108 int requests_inflight
;
109 int requests_finished
;
111 /* qemu block driver */
113 BlockDriverState
*bs
;
117 /* ------------------------------------------------------------- */
119 static struct ioreq
*ioreq_start(struct XenBlkDev
*blkdev
)
121 struct ioreq
*ioreq
= NULL
;
123 if (QLIST_EMPTY(&blkdev
->freelist
)) {
124 if (blkdev
->requests_total
>= max_requests
) {
127 /* allocate new struct */
128 ioreq
= g_malloc0(sizeof(*ioreq
));
129 ioreq
->blkdev
= blkdev
;
130 blkdev
->requests_total
++;
131 qemu_iovec_init(&ioreq
->v
, BLKIF_MAX_SEGMENTS_PER_REQUEST
);
133 /* get one from freelist */
134 ioreq
= QLIST_FIRST(&blkdev
->freelist
);
135 QLIST_REMOVE(ioreq
, list
);
136 qemu_iovec_reset(&ioreq
->v
);
138 QLIST_INSERT_HEAD(&blkdev
->inflight
, ioreq
, list
);
139 blkdev
->requests_inflight
++;
145 static void ioreq_finish(struct ioreq
*ioreq
)
147 struct XenBlkDev
*blkdev
= ioreq
->blkdev
;
149 QLIST_REMOVE(ioreq
, list
);
150 QLIST_INSERT_HEAD(&blkdev
->finished
, ioreq
, list
);
151 blkdev
->requests_inflight
--;
152 blkdev
->requests_finished
++;
155 static void ioreq_release(struct ioreq
*ioreq
)
157 struct XenBlkDev
*blkdev
= ioreq
->blkdev
;
159 QLIST_REMOVE(ioreq
, list
);
160 memset(ioreq
, 0, sizeof(*ioreq
));
161 ioreq
->blkdev
= blkdev
;
162 QLIST_INSERT_HEAD(&blkdev
->freelist
, ioreq
, list
);
163 blkdev
->requests_finished
--;
/*
 * translate request into iovec + start offset
 * do sanity checks along the way
 */
170 static int ioreq_parse(struct ioreq
*ioreq
)
172 struct XenBlkDev
*blkdev
= ioreq
->blkdev
;
177 xen_be_printf(&blkdev
->xendev
, 3,
178 "op %d, nr %d, handle %d, id %" PRId64
", sector %" PRId64
"\n",
179 ioreq
->req
.operation
, ioreq
->req
.nr_segments
,
180 ioreq
->req
.handle
, ioreq
->req
.id
, ioreq
->req
.sector_number
);
181 switch (ioreq
->req
.operation
) {
183 ioreq
->prot
= PROT_WRITE
; /* to memory */
185 case BLKIF_OP_WRITE_BARRIER
:
186 if (!ioreq
->req
.nr_segments
) {
191 ioreq
->presync
= ioreq
->postsync
= 1;
195 ioreq
->prot
= PROT_READ
; /* from memory */
201 xen_be_printf(&blkdev
->xendev
, 0, "error: unknown operation (%d)\n",
202 ioreq
->req
.operation
);
206 if (ioreq
->req
.operation
!= BLKIF_OP_READ
&& blkdev
->mode
[0] != 'w') {
207 xen_be_printf(&blkdev
->xendev
, 0, "error: write req for ro device\n");
211 ioreq
->start
= ioreq
->req
.sector_number
* blkdev
->file_blk
;
212 for (i
= 0; i
< ioreq
->req
.nr_segments
; i
++) {
213 if (i
== BLKIF_MAX_SEGMENTS_PER_REQUEST
) {
214 xen_be_printf(&blkdev
->xendev
, 0, "error: nr_segments too big\n");
217 if (ioreq
->req
.seg
[i
].first_sect
> ioreq
->req
.seg
[i
].last_sect
) {
218 xen_be_printf(&blkdev
->xendev
, 0, "error: first > last sector\n");
221 if (ioreq
->req
.seg
[i
].last_sect
* BLOCK_SIZE
>= XC_PAGE_SIZE
) {
222 xen_be_printf(&blkdev
->xendev
, 0, "error: page crossing\n");
226 ioreq
->domids
[i
] = blkdev
->xendev
.dom
;
227 ioreq
->refs
[i
] = ioreq
->req
.seg
[i
].gref
;
229 mem
= ioreq
->req
.seg
[i
].first_sect
* blkdev
->file_blk
;
230 len
= (ioreq
->req
.seg
[i
].last_sect
- ioreq
->req
.seg
[i
].first_sect
+ 1) * blkdev
->file_blk
;
231 qemu_iovec_add(&ioreq
->v
, (void*)mem
, len
);
233 if (ioreq
->start
+ ioreq
->v
.size
> blkdev
->file_size
) {
234 xen_be_printf(&blkdev
->xendev
, 0, "error: access beyond end of file\n");
240 ioreq
->status
= BLKIF_RSP_ERROR
;
244 static void ioreq_unmap(struct ioreq
*ioreq
)
246 XenGnttab gnt
= ioreq
->blkdev
->xendev
.gnttabdev
;
249 if (ioreq
->v
.niov
== 0) {
256 if (xc_gnttab_munmap(gnt
, ioreq
->pages
, ioreq
->v
.niov
) != 0) {
257 xen_be_printf(&ioreq
->blkdev
->xendev
, 0, "xc_gnttab_munmap failed: %s\n",
260 ioreq
->blkdev
->cnt_map
-= ioreq
->v
.niov
;
263 for (i
= 0; i
< ioreq
->v
.niov
; i
++) {
264 if (!ioreq
->page
[i
]) {
267 if (xc_gnttab_munmap(gnt
, ioreq
->page
[i
], 1) != 0) {
268 xen_be_printf(&ioreq
->blkdev
->xendev
, 0, "xc_gnttab_munmap failed: %s\n",
271 ioreq
->blkdev
->cnt_map
--;
272 ioreq
->page
[i
] = NULL
;
277 static int ioreq_map(struct ioreq
*ioreq
)
279 XenGnttab gnt
= ioreq
->blkdev
->xendev
.gnttabdev
;
282 if (ioreq
->v
.niov
== 0) {
286 ioreq
->pages
= xc_gnttab_map_grant_refs
287 (gnt
, ioreq
->v
.niov
, ioreq
->domids
, ioreq
->refs
, ioreq
->prot
);
288 if (ioreq
->pages
== NULL
) {
289 xen_be_printf(&ioreq
->blkdev
->xendev
, 0,
290 "can't map %d grant refs (%s, %d maps)\n",
291 ioreq
->v
.niov
, strerror(errno
), ioreq
->blkdev
->cnt_map
);
294 for (i
= 0; i
< ioreq
->v
.niov
; i
++) {
295 ioreq
->v
.iov
[i
].iov_base
= ioreq
->pages
+ i
* XC_PAGE_SIZE
+
296 (uintptr_t)ioreq
->v
.iov
[i
].iov_base
;
298 ioreq
->blkdev
->cnt_map
+= ioreq
->v
.niov
;
300 for (i
= 0; i
< ioreq
->v
.niov
; i
++) {
301 ioreq
->page
[i
] = xc_gnttab_map_grant_ref
302 (gnt
, ioreq
->domids
[i
], ioreq
->refs
[i
], ioreq
->prot
);
303 if (ioreq
->page
[i
] == NULL
) {
304 xen_be_printf(&ioreq
->blkdev
->xendev
, 0,
305 "can't map grant ref %d (%s, %d maps)\n",
306 ioreq
->refs
[i
], strerror(errno
), ioreq
->blkdev
->cnt_map
);
310 ioreq
->v
.iov
[i
].iov_base
= ioreq
->page
[i
] + (uintptr_t)ioreq
->v
.iov
[i
].iov_base
;
311 ioreq
->blkdev
->cnt_map
++;
317 static int ioreq_runio_qemu_sync(struct ioreq
*ioreq
)
319 struct XenBlkDev
*blkdev
= ioreq
->blkdev
;
323 if (ioreq
->req
.nr_segments
&& ioreq_map(ioreq
) == -1) {
326 if (ioreq
->presync
) {
327 bdrv_flush(blkdev
->bs
);
330 switch (ioreq
->req
.operation
) {
333 for (i
= 0; i
< ioreq
->v
.niov
; i
++) {
334 rc
= bdrv_read(blkdev
->bs
, pos
/ BLOCK_SIZE
,
335 ioreq
->v
.iov
[i
].iov_base
,
336 ioreq
->v
.iov
[i
].iov_len
/ BLOCK_SIZE
);
338 xen_be_printf(&blkdev
->xendev
, 0, "rd I/O error (%p, len %zd)\n",
339 ioreq
->v
.iov
[i
].iov_base
,
340 ioreq
->v
.iov
[i
].iov_len
);
343 pos
+= ioreq
->v
.iov
[i
].iov_len
;
347 case BLKIF_OP_WRITE_BARRIER
:
348 if (!ioreq
->req
.nr_segments
) {
352 for (i
= 0; i
< ioreq
->v
.niov
; i
++) {
353 rc
= bdrv_write(blkdev
->bs
, pos
/ BLOCK_SIZE
,
354 ioreq
->v
.iov
[i
].iov_base
,
355 ioreq
->v
.iov
[i
].iov_len
/ BLOCK_SIZE
);
357 xen_be_printf(&blkdev
->xendev
, 0, "wr I/O error (%p, len %zd)\n",
358 ioreq
->v
.iov
[i
].iov_base
,
359 ioreq
->v
.iov
[i
].iov_len
);
362 pos
+= ioreq
->v
.iov
[i
].iov_len
;
366 /* unknown operation (shouldn't happen -- parse catches this) */
370 if (ioreq
->postsync
) {
371 bdrv_flush(blkdev
->bs
);
373 ioreq
->status
= BLKIF_RSP_OKAY
;
383 ioreq
->status
= BLKIF_RSP_ERROR
;
387 static void qemu_aio_complete(void *opaque
, int ret
)
389 struct ioreq
*ioreq
= opaque
;
392 xen_be_printf(&ioreq
->blkdev
->xendev
, 0, "%s I/O error\n",
393 ioreq
->req
.operation
== BLKIF_OP_READ
? "read" : "write");
397 ioreq
->aio_inflight
--;
398 if (ioreq
->aio_inflight
> 0) {
402 ioreq
->status
= ioreq
->aio_errors
? BLKIF_RSP_ERROR
: BLKIF_RSP_OKAY
;
405 bdrv_acct_done(ioreq
->blkdev
->bs
, &ioreq
->acct
);
406 qemu_bh_schedule(ioreq
->blkdev
->bh
);
409 static int ioreq_runio_qemu_aio(struct ioreq
*ioreq
)
411 struct XenBlkDev
*blkdev
= ioreq
->blkdev
;
413 if (ioreq
->req
.nr_segments
&& ioreq_map(ioreq
) == -1) {
417 ioreq
->aio_inflight
++;
418 if (ioreq
->presync
) {
419 bdrv_flush(blkdev
->bs
); /* FIXME: aio_flush() ??? */
422 switch (ioreq
->req
.operation
) {
424 bdrv_acct_start(blkdev
->bs
, &ioreq
->acct
, ioreq
->v
.size
, BDRV_ACCT_READ
);
425 ioreq
->aio_inflight
++;
426 bdrv_aio_readv(blkdev
->bs
, ioreq
->start
/ BLOCK_SIZE
,
427 &ioreq
->v
, ioreq
->v
.size
/ BLOCK_SIZE
,
428 qemu_aio_complete
, ioreq
);
431 case BLKIF_OP_WRITE_BARRIER
:
432 if (!ioreq
->req
.nr_segments
) {
436 bdrv_acct_start(blkdev
->bs
, &ioreq
->acct
, ioreq
->v
.size
, BDRV_ACCT_WRITE
);
437 ioreq
->aio_inflight
++;
438 bdrv_aio_writev(blkdev
->bs
, ioreq
->start
/ BLOCK_SIZE
,
439 &ioreq
->v
, ioreq
->v
.size
/ BLOCK_SIZE
,
440 qemu_aio_complete
, ioreq
);
443 /* unknown operation (shouldn't happen -- parse catches this) */
447 if (ioreq
->postsync
) {
448 bdrv_flush(blkdev
->bs
); /* FIXME: aio_flush() ??? */
450 qemu_aio_complete(ioreq
, 0);
458 ioreq
->status
= BLKIF_RSP_ERROR
;
462 static int blk_send_response_one(struct ioreq
*ioreq
)
464 struct XenBlkDev
*blkdev
= ioreq
->blkdev
;
466 int have_requests
= 0;
467 blkif_response_t resp
;
470 resp
.id
= ioreq
->req
.id
;
471 resp
.operation
= ioreq
->req
.operation
;
472 resp
.status
= ioreq
->status
;
474 /* Place on the response ring for the relevant domain. */
475 switch (blkdev
->protocol
) {
476 case BLKIF_PROTOCOL_NATIVE
:
477 dst
= RING_GET_RESPONSE(&blkdev
->rings
.native
, blkdev
->rings
.native
.rsp_prod_pvt
);
479 case BLKIF_PROTOCOL_X86_32
:
480 dst
= RING_GET_RESPONSE(&blkdev
->rings
.x86_32_part
,
481 blkdev
->rings
.x86_32_part
.rsp_prod_pvt
);
483 case BLKIF_PROTOCOL_X86_64
:
484 dst
= RING_GET_RESPONSE(&blkdev
->rings
.x86_64_part
,
485 blkdev
->rings
.x86_64_part
.rsp_prod_pvt
);
490 memcpy(dst
, &resp
, sizeof(resp
));
491 blkdev
->rings
.common
.rsp_prod_pvt
++;
493 RING_PUSH_RESPONSES_AND_CHECK_NOTIFY(&blkdev
->rings
.common
, send_notify
);
494 if (blkdev
->rings
.common
.rsp_prod_pvt
== blkdev
->rings
.common
.req_cons
) {
496 * Tail check for pending requests. Allows frontend to avoid
497 * notifications if requests are already in flight (lower
498 * overheads and promotes batching).
500 RING_FINAL_CHECK_FOR_REQUESTS(&blkdev
->rings
.common
, have_requests
);
501 } else if (RING_HAS_UNCONSUMED_REQUESTS(&blkdev
->rings
.common
)) {
511 /* walk finished list, send outstanding responses, free requests */
512 static void blk_send_response_all(struct XenBlkDev
*blkdev
)
517 while (!QLIST_EMPTY(&blkdev
->finished
)) {
518 ioreq
= QLIST_FIRST(&blkdev
->finished
);
519 send_notify
+= blk_send_response_one(ioreq
);
520 ioreq_release(ioreq
);
523 xen_be_send_notify(&blkdev
->xendev
);
527 static int blk_get_request(struct XenBlkDev
*blkdev
, struct ioreq
*ioreq
, RING_IDX rc
)
529 switch (blkdev
->protocol
) {
530 case BLKIF_PROTOCOL_NATIVE
:
531 memcpy(&ioreq
->req
, RING_GET_REQUEST(&blkdev
->rings
.native
, rc
),
534 case BLKIF_PROTOCOL_X86_32
:
535 blkif_get_x86_32_req(&ioreq
->req
,
536 RING_GET_REQUEST(&blkdev
->rings
.x86_32_part
, rc
));
538 case BLKIF_PROTOCOL_X86_64
:
539 blkif_get_x86_64_req(&ioreq
->req
,
540 RING_GET_REQUEST(&blkdev
->rings
.x86_64_part
, rc
));
546 static void blk_handle_requests(struct XenBlkDev
*blkdev
)
551 blkdev
->more_work
= 0;
553 rc
= blkdev
->rings
.common
.req_cons
;
554 rp
= blkdev
->rings
.common
.sring
->req_prod
;
555 xen_rmb(); /* Ensure we see queued requests up to 'rp'. */
558 blk_send_response_all(blkdev
);
561 /* pull request from ring */
562 if (RING_REQUEST_CONS_OVERFLOW(&blkdev
->rings
.common
, rc
)) {
565 ioreq
= ioreq_start(blkdev
);
570 blk_get_request(blkdev
, ioreq
, rc
);
571 blkdev
->rings
.common
.req_cons
= ++rc
;
574 if (ioreq_parse(ioreq
) != 0) {
575 if (blk_send_response_one(ioreq
)) {
576 xen_be_send_notify(&blkdev
->xendev
);
578 ioreq_release(ioreq
);
583 /* run i/o in aio mode */
584 ioreq_runio_qemu_aio(ioreq
);
586 /* run i/o in sync mode */
587 ioreq_runio_qemu_sync(ioreq
);
591 blk_send_response_all(blkdev
);
594 if (blkdev
->more_work
&& blkdev
->requests_inflight
< max_requests
) {
595 qemu_bh_schedule(blkdev
->bh
);
599 /* ------------------------------------------------------------- */
/*
 * Bottom-half callback (installed by blk_alloc() via qemu_bh_new()).
 * @opaque is the struct XenBlkDev the bottom half was created for; all
 * work is delegated to blk_handle_requests().
 */
static void blk_bh(void *opaque)
{
    struct XenBlkDev *blkdev = opaque;

    blk_handle_requests(blkdev);
}
607 static void blk_alloc(struct XenDevice
*xendev
)
609 struct XenBlkDev
*blkdev
= container_of(xendev
, struct XenBlkDev
, xendev
);
611 QLIST_INIT(&blkdev
->inflight
);
612 QLIST_INIT(&blkdev
->finished
);
613 QLIST_INIT(&blkdev
->freelist
);
614 blkdev
->bh
= qemu_bh_new(blk_bh
, blkdev
);
615 if (xen_mode
!= XEN_EMULATE
) {
620 static int blk_init(struct XenDevice
*xendev
)
622 struct XenBlkDev
*blkdev
= container_of(xendev
, struct XenBlkDev
, xendev
);
623 int index
, qflags
, info
= 0;
625 /* read xenstore entries */
626 if (blkdev
->params
== NULL
) {
628 blkdev
->params
= xenstore_read_be_str(&blkdev
->xendev
, "params");
629 if (blkdev
->params
!= NULL
) {
630 h
= strchr(blkdev
->params
, ':');
633 blkdev
->fileproto
= blkdev
->params
;
634 blkdev
->filename
= h
+1;
637 blkdev
->fileproto
= "<unset>";
638 blkdev
->filename
= blkdev
->params
;
641 if (!strcmp("aio", blkdev
->fileproto
)) {
642 blkdev
->fileproto
= "raw";
644 if (blkdev
->mode
== NULL
) {
645 blkdev
->mode
= xenstore_read_be_str(&blkdev
->xendev
, "mode");
647 if (blkdev
->type
== NULL
) {
648 blkdev
->type
= xenstore_read_be_str(&blkdev
->xendev
, "type");
650 if (blkdev
->dev
== NULL
) {
651 blkdev
->dev
= xenstore_read_be_str(&blkdev
->xendev
, "dev");
653 if (blkdev
->devtype
== NULL
) {
654 blkdev
->devtype
= xenstore_read_be_str(&blkdev
->xendev
, "device-type");
657 /* do we have all we need? */
658 if (blkdev
->params
== NULL
||
659 blkdev
->mode
== NULL
||
660 blkdev
->type
== NULL
||
661 blkdev
->dev
== NULL
) {
666 if (strcmp(blkdev
->mode
, "w") == 0) {
667 qflags
= BDRV_O_RDWR
;
670 info
|= VDISK_READONLY
;
674 if (blkdev
->devtype
&& !strcmp(blkdev
->devtype
, "cdrom")) {
678 /* init qemu block driver */
679 index
= (blkdev
->xendev
.dev
- 202 * 256) / 16;
680 blkdev
->dinfo
= drive_get(IF_XEN
, 0, index
);
681 if (!blkdev
->dinfo
) {
682 /* setup via xenbus -> create new block driver instance */
683 xen_be_printf(&blkdev
->xendev
, 2, "create new bdrv (xenbus setup)\n");
684 blkdev
->bs
= bdrv_new(blkdev
->dev
);
686 if (bdrv_open(blkdev
->bs
, blkdev
->filename
, qflags
,
687 bdrv_find_whitelisted_format(blkdev
->fileproto
)) != 0) {
688 bdrv_delete(blkdev
->bs
);
696 /* setup via qemu cmdline -> already setup for us */
697 xen_be_printf(&blkdev
->xendev
, 2, "get configured bdrv (cmdline setup)\n");
698 blkdev
->bs
= blkdev
->dinfo
->bdrv
;
700 bdrv_attach_dev_nofail(blkdev
->bs
, blkdev
);
701 blkdev
->file_blk
= BLOCK_SIZE
;
702 blkdev
->file_size
= bdrv_getlength(blkdev
->bs
);
703 if (blkdev
->file_size
< 0) {
704 xen_be_printf(&blkdev
->xendev
, 1, "bdrv_getlength: %d (%s) | drv %s\n",
705 (int)blkdev
->file_size
, strerror(-blkdev
->file_size
),
706 blkdev
->bs
->drv
? blkdev
->bs
->drv
->format_name
: "-");
707 blkdev
->file_size
= 0;
710 xen_be_printf(xendev
, 1, "type \"%s\", fileproto \"%s\", filename \"%s\","
711 " size %" PRId64
" (%" PRId64
" MB)\n",
712 blkdev
->type
, blkdev
->fileproto
, blkdev
->filename
,
713 blkdev
->file_size
, blkdev
->file_size
>> 20);
716 xenstore_write_be_int(&blkdev
->xendev
, "feature-barrier", 1);
717 xenstore_write_be_int(&blkdev
->xendev
, "info", info
);
718 xenstore_write_be_int(&blkdev
->xendev
, "sector-size", blkdev
->file_blk
);
719 xenstore_write_be_int(&blkdev
->xendev
, "sectors",
720 blkdev
->file_size
/ blkdev
->file_blk
);
724 g_free(blkdev
->params
);
725 blkdev
->params
= NULL
;
726 g_free(blkdev
->mode
);
728 g_free(blkdev
->type
);
732 g_free(blkdev
->devtype
);
733 blkdev
->devtype
= NULL
;
737 static int blk_connect(struct XenDevice
*xendev
)
739 struct XenBlkDev
*blkdev
= container_of(xendev
, struct XenBlkDev
, xendev
);
741 if (xenstore_read_fe_int(&blkdev
->xendev
, "ring-ref", &blkdev
->ring_ref
) == -1) {
744 if (xenstore_read_fe_int(&blkdev
->xendev
, "event-channel",
745 &blkdev
->xendev
.remote_port
) == -1) {
749 blkdev
->protocol
= BLKIF_PROTOCOL_NATIVE
;
750 if (blkdev
->xendev
.protocol
) {
751 if (strcmp(blkdev
->xendev
.protocol
, XEN_IO_PROTO_ABI_X86_32
) == 0) {
752 blkdev
->protocol
= BLKIF_PROTOCOL_X86_32
;
754 if (strcmp(blkdev
->xendev
.protocol
, XEN_IO_PROTO_ABI_X86_64
) == 0) {
755 blkdev
->protocol
= BLKIF_PROTOCOL_X86_64
;
759 blkdev
->sring
= xc_gnttab_map_grant_ref(blkdev
->xendev
.gnttabdev
,
762 PROT_READ
| PROT_WRITE
);
763 if (!blkdev
->sring
) {
768 switch (blkdev
->protocol
) {
769 case BLKIF_PROTOCOL_NATIVE
:
771 blkif_sring_t
*sring_native
= blkdev
->sring
;
772 BACK_RING_INIT(&blkdev
->rings
.native
, sring_native
, XC_PAGE_SIZE
);
775 case BLKIF_PROTOCOL_X86_32
:
777 blkif_x86_32_sring_t
*sring_x86_32
= blkdev
->sring
;
779 BACK_RING_INIT(&blkdev
->rings
.x86_32_part
, sring_x86_32
, XC_PAGE_SIZE
);
782 case BLKIF_PROTOCOL_X86_64
:
784 blkif_x86_64_sring_t
*sring_x86_64
= blkdev
->sring
;
786 BACK_RING_INIT(&blkdev
->rings
.x86_64_part
, sring_x86_64
, XC_PAGE_SIZE
);
791 xen_be_bind_evtchn(&blkdev
->xendev
);
793 xen_be_printf(&blkdev
->xendev
, 1, "ok: proto %s, ring-ref %d, "
794 "remote port %d, local port %d\n",
795 blkdev
->xendev
.protocol
, blkdev
->ring_ref
,
796 blkdev
->xendev
.remote_port
, blkdev
->xendev
.local_port
);
800 static void blk_disconnect(struct XenDevice
*xendev
)
802 struct XenBlkDev
*blkdev
= container_of(xendev
, struct XenBlkDev
, xendev
);
805 if (!blkdev
->dinfo
) {
806 /* close/delete only if we created it ourself */
807 bdrv_close(blkdev
->bs
);
808 bdrv_delete(blkdev
->bs
);
812 xen_be_unbind_evtchn(&blkdev
->xendev
);
815 xc_gnttab_munmap(blkdev
->xendev
.gnttabdev
, blkdev
->sring
, 1);
817 blkdev
->sring
= NULL
;
821 static int blk_free(struct XenDevice
*xendev
)
823 struct XenBlkDev
*blkdev
= container_of(xendev
, struct XenBlkDev
, xendev
);
826 while (!QLIST_EMPTY(&blkdev
->freelist
)) {
827 ioreq
= QLIST_FIRST(&blkdev
->freelist
);
828 QLIST_REMOVE(ioreq
, list
);
829 qemu_iovec_destroy(&ioreq
->v
);
833 g_free(blkdev
->params
);
834 g_free(blkdev
->mode
);
835 g_free(blkdev
->type
);
837 g_free(blkdev
->devtype
);
838 qemu_bh_delete(blkdev
->bh
);
842 static void blk_event(struct XenDevice
*xendev
)
844 struct XenBlkDev
*blkdev
= container_of(xendev
, struct XenBlkDev
, xendev
);
846 qemu_bh_schedule(blkdev
->bh
);
849 struct XenDevOps xen_blkdev_ops
= {
850 .size
= sizeof(struct XenBlkDev
),
851 .flags
= DEVOPS_FLAG_NEED_GNTDEV
,
854 .initialise
= blk_connect
,
855 .disconnect
= blk_disconnect
,