linux-user: Emulate /proc/self/smaps
[qemu/kevin.git] / hw / 9pfs / xen-9p-backend.c
blob4aa9c8c736dda11bda45e4318749f76b3397cded
1 /*
2 * Xen 9p backend
4 * Copyright Aporeto 2017
6 * Authors:
7 * Stefano Stabellini <stefano@aporeto.com>
9 */
12 * Not so fast! You might want to read the 9p developer docs first:
13 * https://wiki.qemu.org/Documentation/9p
16 #include "qemu/osdep.h"
18 #include "hw/9pfs/9p.h"
19 #include "hw/xen/xen-legacy-backend.h"
20 #include "hw/9pfs/xen-9pfs.h"
21 #include "qapi/error.h"
22 #include "qemu/config-file.h"
23 #include "qemu/main-loop.h"
24 #include "qemu/option.h"
25 #include "qemu/iov.h"
26 #include "fsdev/qemu-fsdev.h"
28 #include "trace.h"
30 #define VERSIONS "1"
31 #define MAX_RINGS 8
32 #define MAX_RING_ORDER 9
34 typedef struct Xen9pfsRing {
35 struct Xen9pfsDev *priv;
37 int ref;
38 xenevtchn_handle *evtchndev;
39 int evtchn;
40 int local_port;
41 int ring_order;
42 struct xen_9pfs_data_intf *intf;
43 unsigned char *data;
44 struct xen_9pfs_data ring;
46 struct iovec *sg;
47 QEMUBH *bh;
48 Coroutine *co;
50 /* local copies, so that we can read/write PDU data directly from
51 * the ring */
52 RING_IDX out_cons, out_size, in_cons;
53 bool inprogress;
54 } Xen9pfsRing;
56 typedef struct Xen9pfsDev {
57 struct XenLegacyDevice xendev; /* must be first */
58 V9fsState state;
59 char *path;
60 char *security_model;
61 char *tag;
62 char *id;
64 int num_rings;
65 Xen9pfsRing *rings;
66 MemReentrancyGuard mem_reentrancy_guard;
67 } Xen9pfsDev;
69 static void xen_9pfs_disconnect(struct XenLegacyDevice *xendev);
71 static void xen_9pfs_in_sg(Xen9pfsRing *ring,
72 struct iovec *in_sg,
73 int *num,
74 uint32_t idx,
75 uint32_t size)
77 RING_IDX cons, prod, masked_prod, masked_cons;
79 cons = ring->intf->in_cons;
80 prod = ring->intf->in_prod;
81 xen_rmb();
82 masked_prod = xen_9pfs_mask(prod, XEN_FLEX_RING_SIZE(ring->ring_order));
83 masked_cons = xen_9pfs_mask(cons, XEN_FLEX_RING_SIZE(ring->ring_order));
85 if (masked_prod < masked_cons) {
86 in_sg[0].iov_base = ring->ring.in + masked_prod;
87 in_sg[0].iov_len = masked_cons - masked_prod;
88 *num = 1;
89 } else {
90 in_sg[0].iov_base = ring->ring.in + masked_prod;
91 in_sg[0].iov_len = XEN_FLEX_RING_SIZE(ring->ring_order) - masked_prod;
92 in_sg[1].iov_base = ring->ring.in;
93 in_sg[1].iov_len = masked_cons;
94 *num = 2;
98 static void xen_9pfs_out_sg(Xen9pfsRing *ring,
99 struct iovec *out_sg,
100 int *num,
101 uint32_t idx)
103 RING_IDX cons, prod, masked_prod, masked_cons;
105 cons = ring->intf->out_cons;
106 prod = ring->intf->out_prod;
107 xen_rmb();
108 masked_prod = xen_9pfs_mask(prod, XEN_FLEX_RING_SIZE(ring->ring_order));
109 masked_cons = xen_9pfs_mask(cons, XEN_FLEX_RING_SIZE(ring->ring_order));
111 if (masked_cons < masked_prod) {
112 out_sg[0].iov_base = ring->ring.out + masked_cons;
113 out_sg[0].iov_len = ring->out_size;
114 *num = 1;
115 } else {
116 if (ring->out_size >
117 (XEN_FLEX_RING_SIZE(ring->ring_order) - masked_cons)) {
118 out_sg[0].iov_base = ring->ring.out + masked_cons;
119 out_sg[0].iov_len = XEN_FLEX_RING_SIZE(ring->ring_order) -
120 masked_cons;
121 out_sg[1].iov_base = ring->ring.out;
122 out_sg[1].iov_len = ring->out_size -
123 (XEN_FLEX_RING_SIZE(ring->ring_order) -
124 masked_cons);
125 *num = 2;
126 } else {
127 out_sg[0].iov_base = ring->ring.out + masked_cons;
128 out_sg[0].iov_len = ring->out_size;
129 *num = 1;
134 static ssize_t xen_9pfs_pdu_vmarshal(V9fsPDU *pdu,
135 size_t offset,
136 const char *fmt,
137 va_list ap)
139 Xen9pfsDev *xen_9pfs = container_of(pdu->s, Xen9pfsDev, state);
140 struct iovec in_sg[2];
141 int num;
142 ssize_t ret;
144 xen_9pfs_in_sg(&xen_9pfs->rings[pdu->tag % xen_9pfs->num_rings],
145 in_sg, &num, pdu->idx, ROUND_UP(offset + 128, 512));
147 ret = v9fs_iov_vmarshal(in_sg, num, offset, 0, fmt, ap);
148 if (ret < 0) {
149 xen_pv_printf(&xen_9pfs->xendev, 0,
150 "Failed to encode VirtFS reply type %d\n",
151 pdu->id + 1);
152 xen_be_set_state(&xen_9pfs->xendev, XenbusStateClosing);
153 xen_9pfs_disconnect(&xen_9pfs->xendev);
155 return ret;
158 static ssize_t xen_9pfs_pdu_vunmarshal(V9fsPDU *pdu,
159 size_t offset,
160 const char *fmt,
161 va_list ap)
163 Xen9pfsDev *xen_9pfs = container_of(pdu->s, Xen9pfsDev, state);
164 struct iovec out_sg[2];
165 int num;
166 ssize_t ret;
168 xen_9pfs_out_sg(&xen_9pfs->rings[pdu->tag % xen_9pfs->num_rings],
169 out_sg, &num, pdu->idx);
171 ret = v9fs_iov_vunmarshal(out_sg, num, offset, 0, fmt, ap);
172 if (ret < 0) {
173 xen_pv_printf(&xen_9pfs->xendev, 0,
174 "Failed to decode VirtFS request type %d\n", pdu->id);
175 xen_be_set_state(&xen_9pfs->xendev, XenbusStateClosing);
176 xen_9pfs_disconnect(&xen_9pfs->xendev);
178 return ret;
181 static void xen_9pfs_init_out_iov_from_pdu(V9fsPDU *pdu,
182 struct iovec **piov,
183 unsigned int *pniov,
184 size_t size)
186 Xen9pfsDev *xen_9pfs = container_of(pdu->s, Xen9pfsDev, state);
187 Xen9pfsRing *ring = &xen_9pfs->rings[pdu->tag % xen_9pfs->num_rings];
188 int num;
190 g_free(ring->sg);
192 ring->sg = g_new0(struct iovec, 2);
193 xen_9pfs_out_sg(ring, ring->sg, &num, pdu->idx);
194 *piov = ring->sg;
195 *pniov = num;
198 static void xen_9pfs_init_in_iov_from_pdu(V9fsPDU *pdu,
199 struct iovec **piov,
200 unsigned int *pniov,
201 size_t size)
203 Xen9pfsDev *xen_9pfs = container_of(pdu->s, Xen9pfsDev, state);
204 Xen9pfsRing *ring = &xen_9pfs->rings[pdu->tag % xen_9pfs->num_rings];
205 int num;
206 size_t buf_size;
208 g_free(ring->sg);
210 ring->sg = g_new0(struct iovec, 2);
211 ring->co = qemu_coroutine_self();
212 /* make sure other threads see ring->co changes before continuing */
213 smp_wmb();
215 again:
216 xen_9pfs_in_sg(ring, ring->sg, &num, pdu->idx, size);
217 buf_size = iov_size(ring->sg, num);
218 if (buf_size < size) {
219 qemu_coroutine_yield();
220 goto again;
222 ring->co = NULL;
223 /* make sure other threads see ring->co changes before continuing */
224 smp_wmb();
226 *piov = ring->sg;
227 *pniov = num;
230 static void xen_9pfs_push_and_notify(V9fsPDU *pdu)
232 RING_IDX prod;
233 Xen9pfsDev *priv = container_of(pdu->s, Xen9pfsDev, state);
234 Xen9pfsRing *ring = &priv->rings[pdu->tag % priv->num_rings];
236 g_free(ring->sg);
237 ring->sg = NULL;
239 ring->intf->out_cons = ring->out_cons;
240 xen_wmb();
242 prod = ring->intf->in_prod;
243 xen_rmb();
244 ring->intf->in_prod = prod + pdu->size;
245 xen_wmb();
247 ring->inprogress = false;
248 qemu_xen_evtchn_notify(ring->evtchndev, ring->local_port);
250 qemu_bh_schedule(ring->bh);
253 static const V9fsTransport xen_9p_transport = {
254 .pdu_vmarshal = xen_9pfs_pdu_vmarshal,
255 .pdu_vunmarshal = xen_9pfs_pdu_vunmarshal,
256 .init_in_iov_from_pdu = xen_9pfs_init_in_iov_from_pdu,
257 .init_out_iov_from_pdu = xen_9pfs_init_out_iov_from_pdu,
258 .push_and_notify = xen_9pfs_push_and_notify,
261 static int xen_9pfs_init(struct XenLegacyDevice *xendev)
263 return 0;
266 static int xen_9pfs_receive(Xen9pfsRing *ring)
268 P9MsgHeader h;
269 RING_IDX cons, prod, masked_prod, masked_cons, queued;
270 V9fsPDU *pdu;
272 if (ring->inprogress) {
273 return 0;
276 cons = ring->intf->out_cons;
277 prod = ring->intf->out_prod;
278 xen_rmb();
280 queued = xen_9pfs_queued(prod, cons, XEN_FLEX_RING_SIZE(ring->ring_order));
281 if (queued < sizeof(h)) {
282 return 0;
284 ring->inprogress = true;
286 masked_prod = xen_9pfs_mask(prod, XEN_FLEX_RING_SIZE(ring->ring_order));
287 masked_cons = xen_9pfs_mask(cons, XEN_FLEX_RING_SIZE(ring->ring_order));
289 xen_9pfs_read_packet((uint8_t *) &h, ring->ring.out, sizeof(h),
290 masked_prod, &masked_cons,
291 XEN_FLEX_RING_SIZE(ring->ring_order));
292 if (queued < le32_to_cpu(h.size_le)) {
293 return 0;
296 /* cannot fail, because we only handle one request per ring at a time */
297 pdu = pdu_alloc(&ring->priv->state);
298 ring->out_size = le32_to_cpu(h.size_le);
299 ring->out_cons = cons + le32_to_cpu(h.size_le);
301 pdu_submit(pdu, &h);
303 return 0;
306 static void xen_9pfs_bh(void *opaque)
308 Xen9pfsRing *ring = opaque;
309 bool wait;
311 again:
312 wait = ring->co != NULL && qemu_coroutine_entered(ring->co);
313 /* paired with the smb_wmb barriers in xen_9pfs_init_in_iov_from_pdu */
314 smp_rmb();
315 if (wait) {
316 cpu_relax();
317 goto again;
320 if (ring->co != NULL) {
321 qemu_coroutine_enter_if_inactive(ring->co);
323 xen_9pfs_receive(ring);
326 static void xen_9pfs_evtchn_event(void *opaque)
328 Xen9pfsRing *ring = opaque;
329 evtchn_port_t port;
331 port = qemu_xen_evtchn_pending(ring->evtchndev);
332 qemu_xen_evtchn_unmask(ring->evtchndev, port);
334 qemu_bh_schedule(ring->bh);
337 static void xen_9pfs_disconnect(struct XenLegacyDevice *xendev)
339 Xen9pfsDev *xen_9pdev = container_of(xendev, Xen9pfsDev, xendev);
340 int i;
342 trace_xen_9pfs_disconnect(xendev->name);
344 for (i = 0; i < xen_9pdev->num_rings; i++) {
345 if (xen_9pdev->rings[i].evtchndev != NULL) {
346 qemu_set_fd_handler(qemu_xen_evtchn_fd(xen_9pdev->rings[i].evtchndev),
347 NULL, NULL, NULL);
348 qemu_xen_evtchn_unbind(xen_9pdev->rings[i].evtchndev,
349 xen_9pdev->rings[i].local_port);
350 xen_9pdev->rings[i].evtchndev = NULL;
352 if (xen_9pdev->rings[i].data != NULL) {
353 xen_be_unmap_grant_refs(&xen_9pdev->xendev,
354 xen_9pdev->rings[i].data,
355 xen_9pdev->rings[i].intf->ref,
356 (1 << xen_9pdev->rings[i].ring_order));
357 xen_9pdev->rings[i].data = NULL;
359 if (xen_9pdev->rings[i].intf != NULL) {
360 xen_be_unmap_grant_ref(&xen_9pdev->xendev,
361 xen_9pdev->rings[i].intf,
362 xen_9pdev->rings[i].ref);
363 xen_9pdev->rings[i].intf = NULL;
365 if (xen_9pdev->rings[i].bh != NULL) {
366 qemu_bh_delete(xen_9pdev->rings[i].bh);
367 xen_9pdev->rings[i].bh = NULL;
371 g_free(xen_9pdev->id);
372 xen_9pdev->id = NULL;
373 g_free(xen_9pdev->tag);
374 xen_9pdev->tag = NULL;
375 g_free(xen_9pdev->path);
376 xen_9pdev->path = NULL;
377 g_free(xen_9pdev->security_model);
378 xen_9pdev->security_model = NULL;
379 g_free(xen_9pdev->rings);
380 xen_9pdev->rings = NULL;
383 static int xen_9pfs_free(struct XenLegacyDevice *xendev)
385 trace_xen_9pfs_free(xendev->name);
387 return 0;
390 static int xen_9pfs_connect(struct XenLegacyDevice *xendev)
392 Error *err = NULL;
393 int i;
394 Xen9pfsDev *xen_9pdev = container_of(xendev, Xen9pfsDev, xendev);
395 V9fsState *s = &xen_9pdev->state;
396 QemuOpts *fsdev;
398 trace_xen_9pfs_connect(xendev->name);
400 if (xenstore_read_fe_int(&xen_9pdev->xendev, "num-rings",
401 &xen_9pdev->num_rings) == -1 ||
402 xen_9pdev->num_rings > MAX_RINGS || xen_9pdev->num_rings < 1) {
403 return -1;
406 xen_9pdev->rings = g_new0(Xen9pfsRing, xen_9pdev->num_rings);
407 for (i = 0; i < xen_9pdev->num_rings; i++) {
408 char *str;
409 int ring_order;
411 xen_9pdev->rings[i].priv = xen_9pdev;
412 xen_9pdev->rings[i].evtchn = -1;
413 xen_9pdev->rings[i].local_port = -1;
415 str = g_strdup_printf("ring-ref%u", i);
416 if (xenstore_read_fe_int(&xen_9pdev->xendev, str,
417 &xen_9pdev->rings[i].ref) == -1) {
418 g_free(str);
419 goto out;
421 g_free(str);
422 str = g_strdup_printf("event-channel-%u", i);
423 if (xenstore_read_fe_int(&xen_9pdev->xendev, str,
424 &xen_9pdev->rings[i].evtchn) == -1) {
425 g_free(str);
426 goto out;
428 g_free(str);
430 xen_9pdev->rings[i].intf =
431 xen_be_map_grant_ref(&xen_9pdev->xendev,
432 xen_9pdev->rings[i].ref,
433 PROT_READ | PROT_WRITE);
434 if (!xen_9pdev->rings[i].intf) {
435 goto out;
437 ring_order = xen_9pdev->rings[i].intf->ring_order;
438 if (ring_order > MAX_RING_ORDER) {
439 goto out;
441 xen_9pdev->rings[i].ring_order = ring_order;
442 xen_9pdev->rings[i].data =
443 xen_be_map_grant_refs(&xen_9pdev->xendev,
444 xen_9pdev->rings[i].intf->ref,
445 (1 << ring_order),
446 PROT_READ | PROT_WRITE);
447 if (!xen_9pdev->rings[i].data) {
448 goto out;
450 xen_9pdev->rings[i].ring.in = xen_9pdev->rings[i].data;
451 xen_9pdev->rings[i].ring.out = xen_9pdev->rings[i].data +
452 XEN_FLEX_RING_SIZE(ring_order);
454 xen_9pdev->rings[i].bh = qemu_bh_new_guarded(xen_9pfs_bh,
455 &xen_9pdev->rings[i],
456 &xen_9pdev->mem_reentrancy_guard);
457 xen_9pdev->rings[i].out_cons = 0;
458 xen_9pdev->rings[i].out_size = 0;
459 xen_9pdev->rings[i].inprogress = false;
462 xen_9pdev->rings[i].evtchndev = qemu_xen_evtchn_open();
463 if (xen_9pdev->rings[i].evtchndev == NULL) {
464 goto out;
466 qemu_set_cloexec(qemu_xen_evtchn_fd(xen_9pdev->rings[i].evtchndev));
467 xen_9pdev->rings[i].local_port = qemu_xen_evtchn_bind_interdomain
468 (xen_9pdev->rings[i].evtchndev,
469 xendev->dom,
470 xen_9pdev->rings[i].evtchn);
471 if (xen_9pdev->rings[i].local_port == -1) {
472 xen_pv_printf(xendev, 0,
473 "xenevtchn_bind_interdomain failed port=%d\n",
474 xen_9pdev->rings[i].evtchn);
475 goto out;
477 xen_pv_printf(xendev, 2, "bind evtchn port %d\n", xendev->local_port);
478 qemu_set_fd_handler(qemu_xen_evtchn_fd(xen_9pdev->rings[i].evtchndev),
479 xen_9pfs_evtchn_event, NULL, &xen_9pdev->rings[i]);
482 xen_9pdev->security_model = xenstore_read_be_str(xendev, "security_model");
483 xen_9pdev->path = xenstore_read_be_str(xendev, "path");
484 xen_9pdev->id = s->fsconf.fsdev_id =
485 g_strdup_printf("xen9p%d", xendev->dev);
486 xen_9pdev->tag = s->fsconf.tag = xenstore_read_fe_str(xendev, "tag");
487 fsdev = qemu_opts_create(qemu_find_opts("fsdev"),
488 s->fsconf.tag,
489 1, NULL);
490 qemu_opt_set(fsdev, "fsdriver", "local", NULL);
491 qemu_opt_set(fsdev, "path", xen_9pdev->path, NULL);
492 qemu_opt_set(fsdev, "security_model", xen_9pdev->security_model, NULL);
493 qemu_opts_set_id(fsdev, s->fsconf.fsdev_id);
494 qemu_fsdev_add(fsdev, &err);
495 if (err) {
496 error_report_err(err);
498 v9fs_device_realize_common(s, &xen_9p_transport, NULL);
500 return 0;
502 out:
503 xen_9pfs_free(xendev);
504 return -1;
507 static void xen_9pfs_alloc(struct XenLegacyDevice *xendev)
509 trace_xen_9pfs_alloc(xendev->name);
511 xenstore_write_be_str(xendev, "versions", VERSIONS);
512 xenstore_write_be_int(xendev, "max-rings", MAX_RINGS);
513 xenstore_write_be_int(xendev, "max-ring-page-order", MAX_RING_ORDER);
516 struct XenDevOps xen_9pfs_ops = {
517 .size = sizeof(Xen9pfsDev),
518 .flags = DEVOPS_FLAG_NEED_GNTDEV,
519 .alloc = xen_9pfs_alloc,
520 .init = xen_9pfs_init,
521 .initialise = xen_9pfs_connect,
522 .disconnect = xen_9pfs_disconnect,
523 .free = xen_9pfs_free,