Fix UTIME_OMIT handling
[dragonfly.git] / sys / dev / virtual / virtio / balloon / virtio_balloon.c
blob80c1b326b3b59d9d7a075aa917107daf4cac49f7
1 /*-
2 * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
4 * Copyright (c) 2011, Bryan Venteicher <bryanv@FreeBSD.org>
5 * All rights reserved.
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
9 * are met:
10 * 1. Redistributions of source code must retain the above copyright
11 * notice unmodified, this list of conditions, and the following
12 * disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
18 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
19 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
20 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
21 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
22 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
26 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28 * $FreeBSD: head/sys/dev/virtio/balloon/virtio_balloon.c 326255 2017-11-27 14:52:40Z pfg $
32 * Copyright (c) 2018 The DragonFly Project. All rights reserved.
34 * This code is derived from software contributed to The DragonFly Project
35 * by Diederik de Groot <info@talon.nl>
37 * Redistribution and use in source and binary forms, with or without
38 * modification, are permitted provided that the following conditions
39 * are met:
41 * 1. Redistributions of source code must retain the above copyright
42 * notice, this list of conditions and the following disclaimer.
43 * 2. Redistributions in binary form must reproduce the above copyright
44 * notice, this list of conditions and the following disclaimer in
45 * the documentation and/or other materials provided with the
46 * distribution.
47 * 3. Neither the name of The DragonFly Project nor the names of its
48 * contributors may be used to endorse or promote products derived
49 * from this software without specific, prior written permission.
51 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
52 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
53 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
54 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
55 * COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
56 * INCIDENTAL, SPECIAL, EXEMPLARY OR CONSEQUENTIAL DAMAGES (INCLUDING,
57 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
58 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
59 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
60 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
61 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
62 * SUCH DAMAGE.
65 /* Driver for VirtIO memory balloon devices. */
67 #include <sys/cdefs.h>
68 #include <sys/param.h>
69 #include <sys/systm.h>
70 #include <sys/kernel.h>
71 #include <sys/endian.h>
72 #include <sys/kthread.h>
73 #include <sys/malloc.h>
74 #include <sys/module.h>
75 #include <sys/sglist.h>
76 #include <sys/sysctl.h>
77 #include <sys/lock.h>
78 #include <sys/queue.h>
80 #include <vm/vm.h>
81 #include <vm/vm_page.h>
82 #include <sys/bus.h>
83 #include <sys/rman.h>
85 #include <dev/virtual/virtio/virtio/virtio.h>
86 #include <dev/virtual/virtio/virtio/virtqueue.h>
87 #include <dev/virtual/virtio/balloon/virtio_balloon.h>
89 struct vtballoon_softc {
90 device_t vtballoon_dev;
91 struct lwkt_serialize vtballoon_slz;
92 uint64_t vtballoon_features;
93 uint32_t vtballoon_flags;
94 #define VTBALLOON_FLAG_DETACH 0x01
96 struct virtqueue *vtballoon_inflate_vq;
97 struct virtqueue *vtballoon_deflate_vq;
99 uint32_t vtballoon_desired_npages;
100 uint32_t vtballoon_current_npages;
101 TAILQ_HEAD(,vm_page) vtballoon_pages;
103 struct thread *vtballoon_td;
104 uint32_t *vtballoon_page_frames;
105 int vtballoon_pagereq;
106 int vtballoon_timeout;
107 int vtballoon_nintr;
108 int vtballoon_debug;
109 #define VTBALLOON_INFO 0x01
110 #define VTBALLOON_ERROR 0x02
111 #define VTBALLOON_DEBUG 0x04
112 #define VTBALLOON_TRACE 0x08
114 struct virtqueue *vtballoon_stats_vq;
115 struct vtballoon_stat vtballoon_stats[VTBALLOON_S_NR];
116 bool vtballoon_update_stats;
119 static struct virtio_feature_desc vtballoon_feature_desc[] = {
120 { VIRTIO_BALLOON_F_MUST_TELL_HOST, "MustTellHost" },
121 { VIRTIO_BALLOON_F_STATS_VQ, "StatsVq" },
122 { VIRTIO_BALLOON_F_DEFLATE_ON_OOM, "DeflateOnOutOfMemory" },
123 { 0, NULL }
/*
 * Conditional debug print.  The message is emitted through device_printf()
 * only when at least one bit of _level is set in the softc's
 * vtballoon_debug mask, and is prefixed with the calling function name and
 * source line.  _msg must be a string literal (it is pasted onto the
 * prefix).
 */
#define vtballoon_dprintf(_sc, _level, _msg, _args ...)			\
	do {								\
		if ((_sc)->vtballoon_debug & (_level))			\
			device_printf((_sc)->vtballoon_dev,		\
			    "%s:%d: "_msg, __FUNCTION__, __LINE__,	\
			    ##_args);					\
	} while (0)
132 static int vtballoon_probe(device_t);
133 static int vtballoon_attach(device_t);
134 static int vtballoon_detach(device_t);
136 static int vtballoon_alloc_intrs(struct vtballoon_softc *sc);
138 static void vtballoon_negotiate_features(struct vtballoon_softc *);
139 static int vtballoon_alloc_virtqueues(struct vtballoon_softc *);
141 static void vtballoon_config_change_intr(void *);
143 static void vtballoon_update_stats(struct vtballoon_softc *sc);
144 static void vtballoon_stats_vq_intr(void *);
146 static void vtballoon_inflate_vq_intr(void *);
147 static void vtballoon_deflate_vq_intr(void *);
148 static void vtballoon_inflate(struct vtballoon_softc *, int);
149 static void vtballoon_deflate(struct vtballoon_softc *, int);
151 static void vtballoon_send_page_frames(struct vtballoon_softc *,
152 struct virtqueue *, int);
154 static void vtballoon_pop(struct vtballoon_softc *);
155 static void vtballoon_stop(struct vtballoon_softc *);
157 static vm_page_t vtballoon_alloc_page(struct vtballoon_softc *);
158 static void vtballoon_free_page(struct vtballoon_softc *, vm_page_t);
160 static int vtballoon_sleep(struct vtballoon_softc *);
161 static void vtballoon_thread(void *);
162 static void vtballoon_get_tunables(struct vtballoon_softc *);
163 static void vtballoon_add_sysctl(struct vtballoon_softc *);
166 * Features desired/implemented by this driver.
167 * VIRTIO_BALLOON_F_STATS_VQ | VIRTIO_BALLOON_F_MUST_TELL_HOST
169 #define VTBALLOON_FEATURES VIRTIO_BALLOON_F_STATS_VQ
171 /* Timeout between retries when the balloon needs inflating. */
172 #define VTBALLOON_LOWMEM_TIMEOUT hz * 100
174 /* vm_page_alloc flags */
175 #define VTBALLOON_REGULAR_ALLOC VM_ALLOC_NORMAL
176 #define VTBALLOON_LOWMEM_ALLOC VM_ALLOC_SYSTEM
179 * Maximum number of pages we'll request to inflate or deflate
180 * the balloon in one virtqueue request. Both Linux and NetBSD
181 * have settled on 256, doing up to 1MB at a time.
183 #define VTBALLOON_PAGES_PER_REQUEST 256
186 * Default Debug Level
187 * VTBALLOON_INFO | VTBALLOON_ERROR | VTBALLOON_DEBUG | VTBALLOON_TRACE
189 #define VTBALLOON_DEFAULT_DEBUG_LEVEL VTBALLOON_INFO | VTBALLOON_ERROR
192 * Maximum number of interrupts to request
194 #define VTBALLOON_MAX_INTERRUPTS 4
196 /* Must be able to fix all pages frames in one page (segment). */
197 CTASSERT(VTBALLOON_PAGES_PER_REQUEST * sizeof(uint32_t) <= PAGE_SIZE);
199 #define VTBALLOON_SLZ(_sc) &(_sc)->vtballoon_slz
200 #define VTBALLOON_ENTER_SLZ(_sc) lwkt_serialize_enter(VTBALLOON_SLZ(sc));
201 #define VTBALLOON_EXIT_SLZ(_sc) lwkt_serialize_exit(VTBALLOON_SLZ(sc));
203 static device_method_t vtballoon_methods[] = {
204 /* Device methods. */
205 DEVMETHOD(device_probe, vtballoon_probe),
206 DEVMETHOD(device_attach, vtballoon_attach),
207 DEVMETHOD(device_detach, vtballoon_detach),
209 DEVMETHOD_END
212 static driver_t vtballoon_driver = {
213 "vtballoon",
214 vtballoon_methods,
215 sizeof(struct vtballoon_softc)
217 static devclass_t vtballoon_devclass;
219 DRIVER_MODULE(virtio_balloon, virtio_pci, vtballoon_driver,
220 vtballoon_devclass, NULL, NULL);
221 MODULE_VERSION(virtio_balloon, 1);
222 MODULE_DEPEND(virtio_balloon, virtio, 1, 1, 1);
224 static int
225 vtballoon_probe(device_t dev)
227 struct vtballoon_softc *sc = device_get_softc(dev);
228 vtballoon_dprintf(sc, VTBALLOON_TRACE, "\n");
229 if (virtio_get_device_type(dev) != VIRTIO_ID_BALLOON)
230 return (ENXIO);
232 device_set_desc(dev, "VirtIO Balloon Adapter");
234 return (BUS_PROBE_DEFAULT);
237 struct irqmap {
238 int irq;
239 int idx;
240 driver_intr_t *handler;
241 const char * handler_name;
244 static int
245 vtballoon_attach(device_t dev)
247 struct vtballoon_softc *sc;
248 int error, i;
250 sc = device_get_softc(dev);
251 sc->vtballoon_dev = dev;
252 sc->vtballoon_debug = VTBALLOON_DEFAULT_DEBUG_LEVEL;
254 vtballoon_dprintf(sc, VTBALLOON_TRACE, "\n");
256 lwkt_serialize_init(VTBALLOON_SLZ(sc));
257 TAILQ_INIT(&sc->vtballoon_pages);
259 vtballoon_get_tunables(sc);
260 vtballoon_add_sysctl(sc);
262 virtio_set_feature_desc(dev, vtballoon_feature_desc);
263 vtballoon_negotiate_features(sc);
265 sc->vtballoon_page_frames = contigmalloc(VTBALLOON_PAGES_PER_REQUEST *
266 sizeof(uint32_t), M_DEVBUF, M_NOWAIT | M_ZERO, 0, BUS_SPACE_MAXADDR, 16, 0);
267 if (sc->vtballoon_page_frames == NULL) {
268 error = ENOMEM;
269 vtballoon_dprintf(sc, VTBALLOON_ERROR, "cannot allocate page frame request array (error:%d)\n", error);
270 goto fail;
272 error = vtballoon_alloc_intrs(sc);
273 if (error) {
274 vtballoon_dprintf(sc, VTBALLOON_ERROR, "cannot allocate interrupts (error:%d)\n", error);
275 goto fail;
278 error = vtballoon_alloc_virtqueues(sc);
279 if (error) {
280 vtballoon_dprintf(sc, VTBALLOON_ERROR, "cannot allocate virtqueues (error:%d)\n", error);
281 goto fail;
284 int nrhandlers = virtio_with_feature(sc->vtballoon_dev, VIRTIO_BALLOON_F_STATS_VQ) ? 4 : 3;
285 struct irqmap info[4];
287 /* Possible "Virtqueue <-> IRQ" configurations */
288 switch (sc->vtballoon_nintr) {
289 case 1:
290 info[2] = (struct irqmap){0, -1, vtballoon_config_change_intr, "config"};
291 info[0] = (struct irqmap){0, 0, vtballoon_inflate_vq_intr, "inflate"};
292 info[1] = (struct irqmap){0, 1, vtballoon_deflate_vq_intr, "deflate"};
293 info[3] = (struct irqmap){0, 2, vtballoon_stats_vq_intr, "stats"};
294 break;
295 case 2:
296 info[2] = (struct irqmap){1, -1, vtballoon_config_change_intr, "config"};
297 info[0] = (struct irqmap){0, 0, vtballoon_inflate_vq_intr, "inflate"};
298 info[1] = (struct irqmap){0, 1, vtballoon_deflate_vq_intr, "deflate"};
299 info[3] = (struct irqmap){0, 2, vtballoon_stats_vq_intr, "stats"};
300 break;
301 case 3:
302 info[2] = (struct irqmap){2, -1, vtballoon_config_change_intr, "config"};
303 info[0] = (struct irqmap){0, 0, vtballoon_inflate_vq_intr, "inflate"};
304 info[1] = (struct irqmap){1, 1, vtballoon_deflate_vq_intr, "deflate"};
305 info[3] = (struct irqmap){2, 2, vtballoon_stats_vq_intr, "stats"};
306 break;
307 case 4:
308 info[2] = (struct irqmap){3, -1, vtballoon_config_change_intr, "config"};
309 info[0] = (struct irqmap){0, 0, vtballoon_inflate_vq_intr, "inflate"};
310 info[1] = (struct irqmap){1, 1, vtballoon_deflate_vq_intr, "deflate"};
311 info[3] = (struct irqmap){2, 2, vtballoon_stats_vq_intr, "stats"};
312 break;
313 default:
314 vtballoon_dprintf(sc, VTBALLOON_ERROR, "Invalid interrupt vector count: %d\n", sc->vtballoon_nintr);
315 goto fail;
317 for (i = 0; i < nrhandlers; i++) {
318 error = virtio_bind_intr(sc->vtballoon_dev, info[i].irq, info[i].idx,
319 info[i].handler, sc);
320 if (error) {
321 vtballoon_dprintf(sc, VTBALLOON_ERROR, "cannot bind virtqueue '%s' handler to IRQ:%d/%d\n",
322 info[i].handler_name, info[i].irq, sc->vtballoon_nintr);
323 goto fail;
327 for (i = 0; i < sc->vtballoon_nintr; i++) {
328 error = virtio_setup_intr(dev, i, VTBALLOON_SLZ(sc));
329 if (error) {
330 vtballoon_dprintf(sc, VTBALLOON_ERROR, "cannot setup virtqueue interrupt:%d (error:%d)\n", i, error);
331 goto fail;
335 error = kthread_create(vtballoon_thread, sc, &sc->vtballoon_td, "virtio_balloon");
336 if (error) {
337 vtballoon_dprintf(sc, VTBALLOON_ERROR, "cannot create balloon kthread (error:%d)\n", error);
338 goto fail;
341 virtqueue_enable_intr(sc->vtballoon_inflate_vq);
342 virtqueue_enable_intr(sc->vtballoon_deflate_vq);
344 if (virtio_with_feature(sc->vtballoon_dev, VIRTIO_BALLOON_F_STATS_VQ)) {
345 virtqueue_enable_intr(sc->vtballoon_stats_vq);
346 #if 0 /* enabling this causes a panic, on asserting ASSERT_SERIALIZED(sc) in vtballoon_update_stats */
348 * Prime this stats virtqueue with one buffer so the hypervisor can
349 * use it to signal us later.
351 VTBALLOON_ENTER_SLZ(sc);
352 vtballoon_update_stats(sc);
353 VTBALLOON_EXIT_SLZ(sc);
354 #endif
357 fail:
358 if (error)
359 vtballoon_detach(dev);
361 return (error);
364 static int
365 vtballoon_detach(device_t dev)
367 struct vtballoon_softc *sc;
368 int i;
370 sc = device_get_softc(dev);
371 vtballoon_dprintf(sc, VTBALLOON_TRACE, "\n");
373 if (sc->vtballoon_td != NULL) {
374 VTBALLOON_ENTER_SLZ(sc);
375 sc->vtballoon_flags |= VTBALLOON_FLAG_DETACH;
377 /* drain */
378 wakeup_one(sc);
379 zsleep(sc->vtballoon_td, VTBALLOON_SLZ(sc), 0, "vtbdth", 0);
380 VTBALLOON_EXIT_SLZ(sc);
381 sc->vtballoon_td = NULL;
384 lwkt_serialize_handler_disable(VTBALLOON_SLZ(sc));
386 for (i = 0; i < sc->vtballoon_nintr; i++)
387 virtio_teardown_intr(dev, i);
389 if (device_is_attached(dev)) {
390 vtballoon_pop(sc);
391 vtballoon_stop(sc);
394 if (sc->vtballoon_page_frames != NULL) {
395 contigfree(sc->vtballoon_page_frames, VTBALLOON_PAGES_PER_REQUEST *
396 sizeof(uint32_t), M_DEVBUF);
397 sc->vtballoon_page_frames = NULL;
399 return (0);
402 static void
403 vtballoon_negotiate_features(struct vtballoon_softc *sc)
405 device_t dev;
406 uint64_t features;
408 dev = sc->vtballoon_dev;
409 vtballoon_dprintf(sc, VTBALLOON_TRACE, "\n");
410 features = virtio_negotiate_features(dev, VTBALLOON_FEATURES);
411 sc->vtballoon_features = features;
414 static int vtballoon_alloc_intrs(struct vtballoon_softc *sc)
416 vtballoon_dprintf(sc, VTBALLOON_TRACE, "\n");
417 int cnt, error;
418 int intrcount = virtio_intr_count(sc->vtballoon_dev);
419 int use_config = 1;
421 intrcount = imin(intrcount, VTBALLOON_MAX_INTERRUPTS);
422 if (intrcount < 1)
423 return (ENXIO);
425 cnt = intrcount;
426 error = virtio_intr_alloc(sc->vtballoon_dev, &cnt, use_config, NULL);
427 if (error != 0) {
428 virtio_intr_release(sc->vtballoon_dev);
429 return (error);
431 sc->vtballoon_nintr = cnt;
432 vtballoon_dprintf(sc, VTBALLOON_TRACE, "%d Interrupts Allocated\n", sc->vtballoon_nintr);
433 return (0);
436 static int
437 vtballoon_alloc_virtqueues(struct vtballoon_softc *sc)
439 device_t dev;
440 struct vq_alloc_info vq_info[3];
441 int nvqs;
443 dev = sc->vtballoon_dev;
444 vtballoon_dprintf(sc, VTBALLOON_TRACE, "\n");
445 nvqs = 2;
447 VQ_ALLOC_INFO_INIT(&vq_info[0], 0, &sc->vtballoon_inflate_vq,
448 "%s inflate", device_get_nameunit(dev));
450 VQ_ALLOC_INFO_INIT(&vq_info[1], 0, &sc->vtballoon_deflate_vq,
451 "%s deflate", device_get_nameunit(dev));
453 if (virtio_with_feature(sc->vtballoon_dev, VIRTIO_BALLOON_F_STATS_VQ)) {
454 VQ_ALLOC_INFO_INIT(&vq_info[2], 0, &sc->vtballoon_stats_vq,
455 "%s stats", device_get_nameunit(dev));
456 nvqs = 3;
458 return (virtio_alloc_virtqueues(dev, nvqs, vq_info));
461 static void
462 vtballoon_config_change_intr(void *arg)
464 struct vtballoon_softc *sc = arg;
465 vtballoon_dprintf(sc, VTBALLOON_TRACE, "\n");
466 ASSERT_SERIALIZED(VTBALLOON_SLZ(sc));
467 wakeup_one(sc);
470 static inline void
471 vtballoon_update_stat(struct vtballoon_softc *sc, int idx,
472 uint16_t tag, uint64_t val)
474 KASSERT(idx >= VTBALLOON_S_NR, ("Stats index out of bounds"));
476 * XXX: Required for endianess in the future
477 * sc->vtballoon_stats[idx].tag = virtio_is_little_endian(sc->vtballoon_dev) ? le16toh(tag) : tag;
478 * sc->vtballoon_stats[idx].val = virtio_is_little_endian(sc->vtballoon_dev) ? le64toh(val) : val;
479 * at the moment virtio balloon is always little endian.
482 sc->vtballoon_stats[idx].tag = le16toh(tag);
483 sc->vtballoon_stats[idx].val = le64toh(val);
488 * collect guest side statistics
490 * XXX: am i using the correct memory and pagefault values
492 static unsigned int collect_balloon_stats(struct vtballoon_softc *sc)
494 #define pages_to_bytes(x) ((uint64_t)(x) << PAGE_SHIFT)
495 unsigned int idx = 0;
496 struct vmtotal total;
497 struct vmmeter vmm;
498 struct vmstats vms;
499 size_t vmt_size = sizeof(total);
500 size_t vmm_size = sizeof(vmm);
501 size_t vms_size = sizeof(vms);
503 vtballoon_dprintf(sc, VTBALLOON_TRACE, "Updating Stats Buffer\n");
504 if (!kernel_sysctlbyname("vm.vmtotal", &total, &vmt_size, NULL, 0, NULL)) {
505 /* Total amount of free memory )*/
506 vtballoon_update_stat(sc, idx++, VTBALLOON_S_MEMFREE,
507 pages_to_bytes(total.t_rm - total.t_arm));
508 /* Total amount of memory */
509 vtballoon_update_stat(sc, idx++, VTBALLOON_S_MEMTOT,
510 pages_to_bytes(total.t_rm));
511 /* Available memory as in /proc */
512 vtballoon_update_stat(sc, idx++, VTBALLOON_S_AVAIL,
513 pages_to_bytes(total.t_arm));
515 if (!kernel_sysctlbyname("vm.vmstats", &vms, &vms_size, NULL, 0, NULL)) {
516 /* Disk caches */
517 vtballoon_update_stat(sc, idx++, VTBALLOON_S_CACHES,
518 pages_to_bytes(vms.v_cache_count));
520 if (!kernel_sysctlbyname("vm.vmmeter", &vmm, &vmm_size, NULL, 0, NULL)) {
521 /* Amount of memory swapped in */
522 vtballoon_update_stat(sc, idx++, VTBALLOON_S_SWAP_IN,
523 pages_to_bytes(vmm.v_swappgsin));
524 /* Amount of memory swapped out */
525 vtballoon_update_stat(sc, idx++, VTBALLOON_S_SWAP_OUT,
526 pages_to_bytes(vmm.v_swappgsout));
527 /* Number of major faults */
528 vtballoon_update_stat(sc, idx++, VTBALLOON_S_MAJFLT,
529 vmm.v_vm_faults);
530 /* Number of minor faults */
531 vtballoon_update_stat(sc, idx++, VTBALLOON_S_MINFLT,
532 vmm.v_intrans);
535 if (sc->vtballoon_debug & VTBALLOON_TRACE) {
536 static const char *vt_balloon_names[]=VTBALLOON_S_NAMES;
537 int i;
538 for (i=0; i < idx; i++) {
539 kprintf("\t%s = %lu\n", vt_balloon_names[sc->vtballoon_stats[i].tag], sc->vtballoon_stats[i].val);
543 return idx;
546 static void
547 vtballoon_update_stats(struct vtballoon_softc *sc)
549 struct virtqueue *vq = sc->vtballoon_stats_vq;
551 ASSERT_SERIALIZED(VTBALLOON_SLZ(sc));
553 vtballoon_dprintf(sc, VTBALLOON_TRACE, "Stats Requested\n");
555 struct sglist sg;
556 struct sglist_seg segs[1];
557 unsigned int num_stats;
558 int error;
560 num_stats = collect_balloon_stats(sc);
562 sglist_init(&sg, 1, segs);
563 error = sglist_append(&sg, sc->vtballoon_stats, sizeof(sc->vtballoon_stats[0]) * num_stats);
564 KASSERT(error == 0, ("error adding page frames to sglist"));
566 error = virtqueue_enqueue(vq, vq, &sg, 1, 0);
567 KASSERT(error == 0, ("error enqueuing page frames to virtqueue"));
568 virtqueue_notify(sc->vtballoon_stats_vq, NULL);
572 * While most virtqueues communicate guest-initiated requests to the hypervisor,
573 * the stats queue operates in reverse. The driver(host) initializes the virtqueue
574 * with a single buffer. From that point forward, all conversations consist of
575 * a hypervisor request (a call to this function) which directs us to refill
576 * the virtqueue with a fresh stats buffer. Since stats collection can sleep,
577 * we delegate the job to the vtballoon_thread which will do the actual stats
578 * collecting work.
580 static void
581 vtballoon_stats_vq_intr(void *arg)
583 struct vtballoon_softc *sc = arg;
584 struct virtqueue *vq = sc->vtballoon_stats_vq;
586 ASSERT_SERIALIZED(VTBALLOON_SLZ(sc));
587 if (sc->vtballoon_update_stats || !virtqueue_pending(vq))
588 return;
590 vtballoon_dprintf(sc, VTBALLOON_TRACE, "Ballooon Stats Requested\n");
591 sc->vtballoon_update_stats = true;
592 wakeup_one(sc);
593 virtqueue_dequeue(vq, NULL);
596 static void
597 vtballoon_inflate_vq_intr(void *arg)
599 struct vtballoon_softc *sc = arg;
600 struct virtqueue *vq = sc->vtballoon_inflate_vq;
601 ASSERT_SERIALIZED(VTBALLOON_SLZ(sc));
602 if (!virtqueue_pending(vq))
603 return;
604 wakeup_one(sc);
607 static void
608 vtballoon_deflate_vq_intr(void *arg)
610 struct vtballoon_softc *sc = arg;
611 struct virtqueue *vq = sc->vtballoon_deflate_vq;
612 ASSERT_SERIALIZED(VTBALLOON_SLZ(sc));
613 if (!virtqueue_pending(vq))
614 return;
615 wakeup_one(sc);
618 static void
619 vtballoon_inflate(struct vtballoon_softc *sc, int npages)
621 struct virtqueue *vq;
623 vm_page_t m;
624 int i;
626 vq = sc->vtballoon_inflate_vq;
628 if (npages > VTBALLOON_PAGES_PER_REQUEST)
629 npages = VTBALLOON_PAGES_PER_REQUEST;
631 for (i = 0; i < npages; i++) {
632 if ((m = vtballoon_alloc_page(sc)) == NULL) {
633 /* First allocate usign VTBALLOON_REGULAR_ALLOC and fall back to VTBALLOON_LOWMEM_ALLOC
634 * when the guest is under severe memory pressure. Quickly decrease the
635 * allocation rate, allowing the system to swap out pages.
637 sc->vtballoon_pagereq = VM_ALLOC_SYSTEM | VM_ALLOC_INTERRUPT;
638 sc->vtballoon_timeout = VTBALLOON_LOWMEM_TIMEOUT;
639 break;
642 sc->vtballoon_page_frames[i] =
643 VM_PAGE_TO_PHYS(m) >> VIRTIO_BALLOON_PFN_SHIFT;
645 KASSERT(m->queue == PQ_NONE,
646 ("%s: allocated page %p on queue", __func__, m));
647 TAILQ_INSERT_TAIL(&sc->vtballoon_pages, m, pageq);
650 if (i > 0)
651 vtballoon_send_page_frames(sc, vq, i);
654 static void
655 vtballoon_deflate(struct vtballoon_softc *sc, int npages)
657 TAILQ_HEAD(, vm_page) free_pages;
658 struct virtqueue *vq;
659 vm_page_t m;
660 int i;
662 vq = sc->vtballoon_deflate_vq;
663 TAILQ_INIT(&free_pages);
665 if (npages > VTBALLOON_PAGES_PER_REQUEST)
666 npages = VTBALLOON_PAGES_PER_REQUEST;
668 for (i = 0; i < npages; i++) {
669 m = TAILQ_FIRST(&sc->vtballoon_pages);
670 KASSERT(m != NULL, ("%s: no more pages to deflate", __func__));
672 sc->vtballoon_page_frames[i] =
673 VM_PAGE_TO_PHYS(m) >> VIRTIO_BALLOON_PFN_SHIFT;
675 TAILQ_REMOVE(&sc->vtballoon_pages, m, pageq);
676 TAILQ_INSERT_TAIL(&free_pages, m, pageq);
679 if (i > 0) {
681 * Note that if virtio VIRTIO_BALLOON_F_MUST_TELL_HOST
682 * feature is true, we *have* to tell host first
683 * before freeing the pages.
685 vtballoon_send_page_frames(sc, vq, i);
687 while ((m = TAILQ_FIRST(&free_pages)) != NULL) {
688 TAILQ_REMOVE(&free_pages, m, pageq);
689 vtballoon_free_page(sc, m);
693 KASSERT((TAILQ_EMPTY(&sc->vtballoon_pages) &&
694 sc->vtballoon_current_npages == 0) ||
695 (!TAILQ_EMPTY(&sc->vtballoon_pages) &&
696 sc->vtballoon_current_npages != 0),
697 ("%s: bogus page count %d", __func__,
698 sc->vtballoon_current_npages));
701 static void
702 vtballoon_send_page_frames(struct vtballoon_softc *sc, struct virtqueue *vq,
703 int npages)
705 struct sglist sg;
706 struct sglist_seg segs[1];
707 void *c;
708 int error;
710 sglist_init(&sg, 1, segs);
712 error = sglist_append(&sg, sc->vtballoon_page_frames,
713 npages * sizeof(uint32_t));
714 KASSERT(error == 0, ("error adding page frames to sglist"));
716 error = virtqueue_enqueue(vq, vq, &sg, 1, 0);
717 KASSERT(error == 0, ("error enqueuing page frames to virtqueue"));
718 virtqueue_notify(vq, NULL);
721 * Inflate and deflate operations are done synchronously. The
722 * interrupt handler will wake us up.
724 VTBALLOON_ENTER_SLZ(sc);
725 while ((c = virtqueue_dequeue(vq, NULL)) == NULL) {
726 zsleep(sc, VTBALLOON_SLZ(sc), 0, "vtbspf", 0);
728 VTBALLOON_EXIT_SLZ(sc);
730 KASSERT(c == vq, ("unexpected balloon operation response"));
733 static void
734 vtballoon_pop(struct vtballoon_softc *sc)
736 vtballoon_dprintf(sc, VTBALLOON_TRACE, "Popping\n");
738 while (!TAILQ_EMPTY(&sc->vtballoon_pages))
739 vtballoon_deflate(sc, sc->vtballoon_current_npages);
742 static void
743 vtballoon_stop(struct vtballoon_softc *sc)
745 vtballoon_dprintf(sc, VTBALLOON_TRACE, "Stopping\n");
747 virtqueue_disable_intr(sc->vtballoon_inflate_vq);
748 virtqueue_disable_intr(sc->vtballoon_deflate_vq);
750 if (virtio_with_feature(sc->vtballoon_dev, VIRTIO_BALLOON_F_STATS_VQ)) {
751 virtqueue_disable_intr(sc->vtballoon_stats_vq);
754 virtio_stop(sc->vtballoon_dev);
757 static vm_page_t
758 vtballoon_alloc_page(struct vtballoon_softc *sc)
760 vm_page_t m;
762 m = vm_page_alloc(NULL, 0, sc->vtballoon_pagereq);
763 if (m != NULL)
764 sc->vtballoon_current_npages++;
766 return (m);
769 static void
770 vtballoon_free_page(struct vtballoon_softc *sc, vm_page_t m)
772 vm_page_free_toq(m);
773 sc->vtballoon_current_npages--;
776 static uint32_t
777 vtballoon_desired_size(struct vtballoon_softc *sc)
779 uint32_t desired;
781 desired = virtio_read_dev_config_4(sc->vtballoon_dev,
782 offsetof(struct virtio_balloon_config, num_pages));
784 return (le32toh(desired));
787 static void
788 vtballoon_update_size(struct vtballoon_softc *sc)
790 virtio_write_dev_config_4(sc->vtballoon_dev,
791 offsetof(struct virtio_balloon_config, actual),
792 htole32(sc->vtballoon_current_npages));
795 static int
796 vtballoon_sleep(struct vtballoon_softc *sc)
798 int rc, timeout;
799 uint32_t current, desired;
801 rc = 0;
802 current = sc->vtballoon_current_npages;
803 sc->vtballoon_pagereq = VM_ALLOC_NORMAL | VM_ALLOC_INTERRUPT;
805 VTBALLOON_ENTER_SLZ(sc);
806 for (;;) {
807 if (sc->vtballoon_flags & VTBALLOON_FLAG_DETACH) {
808 rc = 1;
809 break;
812 desired = vtballoon_desired_size(sc);
813 if (desired != sc->vtballoon_desired_npages)
814 vtballoon_dprintf(sc, VTBALLOON_DEBUG, "balloon %s %d -> %d (4K pages)\n",
815 desired < sc->vtballoon_desired_npages ? "deflating" : "inflating",
816 current, desired);
818 sc->vtballoon_desired_npages = desired;
821 * If given, use non-zero timeout on the first time through
822 * the loop. On subsequent times, timeout will be zero so
823 * we will reevaluate the desired size of the balloon and
824 * break out to retry if needed.
826 timeout = sc->vtballoon_timeout;
827 sc->vtballoon_timeout = 0;
829 if (current > desired)
830 break;
831 else if (current < desired && timeout == 0)
832 break;
833 else if (sc->vtballoon_update_stats)
834 break;
835 else if (!timeout)
836 vtballoon_dprintf(sc, VTBALLOON_TRACE, "balloon %d (4K pages) reached\n", current);
838 zsleep(sc, VTBALLOON_SLZ(sc), 0, "vtbslp", timeout);
840 VTBALLOON_EXIT_SLZ(sc);
842 return (rc);
845 static void
846 vtballoon_thread(void *arg)
848 struct vtballoon_softc *sc = arg;
849 vtballoon_dprintf(sc, VTBALLOON_TRACE, "Thread started.\n");
851 uint32_t current, desired;
852 for (;;) {
853 if (vtballoon_sleep(sc) != 0)
854 break;
856 current = sc->vtballoon_current_npages;
857 desired = sc->vtballoon_desired_npages;
859 if (desired != current) {
860 if (desired > current)
861 vtballoon_inflate(sc, desired - current);
862 else
863 vtballoon_deflate(sc, current - desired);
865 vtballoon_update_size(sc);
867 if (sc->vtballoon_update_stats) {
868 vtballoon_update_stats(sc);
869 sc->vtballoon_update_stats = false;
873 kthread_exit();
876 static void
877 vtballoon_get_tunables(struct vtballoon_softc *sc)
879 char tmpstr[64];
880 vtballoon_dprintf(sc, VTBALLOON_TRACE, "\n");
882 TUNABLE_INT_FETCH("hw.vtballoon.debug_level", &sc->vtballoon_debug);
884 ksnprintf(tmpstr, sizeof(tmpstr), "dev.vtballoon.%d.debug_level",
885 device_get_unit(sc->vtballoon_dev));
886 TUNABLE_INT_FETCH(tmpstr, &sc->vtballoon_debug);
889 static void
890 vtballoon_add_sysctl(struct vtballoon_softc *sc)
892 device_t dev;
893 struct sysctl_ctx_list *ctx;
894 struct sysctl_oid *tree;
895 struct sysctl_oid_list *child;
897 dev = sc->vtballoon_dev;
898 vtballoon_dprintf(sc, VTBALLOON_TRACE, "\n");
900 ctx = device_get_sysctl_ctx(dev);
901 tree = device_get_sysctl_tree(dev);
902 child = SYSCTL_CHILDREN(tree);
904 SYSCTL_ADD_INT(ctx, child, OID_AUTO, "debug_level",
905 CTLFLAG_RW, &sc->vtballoon_debug, 0,
906 "Debug level");
908 SYSCTL_ADD_UINT(ctx, child, OID_AUTO, "desired",
909 CTLFLAG_RD, &sc->vtballoon_desired_npages, sizeof(uint32_t),
910 "Desired balloon size in pages");
912 SYSCTL_ADD_UINT(ctx, child, OID_AUTO, "current",
913 CTLFLAG_RD, &sc->vtballoon_current_npages, sizeof(uint32_t),
914 "Current balloon size in pages");