/*
 * Support for RAM backed by mmapped host memory.
 *
 * Copyright (c) 2015 Red Hat, Inc.
 *
 * Authors:
 *  Michael S. Tsirkin <mst@redhat.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2 or
 * later.  See the COPYING file in the top-level directory.
 */

#include "qemu/osdep.h"
#include "qemu/mmap-alloc.h"
#include "qemu/host-utils.h"

#ifdef CONFIG_LINUX
#include <sys/vfs.h>
#endif

/* Value compared against statfs()'s f_type to recognise a hugetlbfs mount */
#define HUGETLBFS_MAGIC       0x958458f6

/*
 * Return the page size that applies to memory backed by @fd.
 *
 * @fd: an open file descriptor, or -1 when there is no backing file.
 *
 * When fstatfs() succeeds and reports a hugetlbfs filesystem, the
 * filesystem block size (the huge page size) is returned.  Otherwise the
 * result is QEMU_VMALLOC_ALIGN on SPARC Linux and the host page size
 * everywhere else.  A failing fstatfs() is not an error here; it simply
 * falls through to the default.
 *
 * NOTE(review): this function was restored from a line-damaged copy.  The
 * CONFIG_LINUX/__sparc__ guards, the local declarations, the fd != -1
 * check, the f_bsize return and the final getpagesize() fallback were not
 * visible and should be confirmed against the pristine file.
 */
size_t qemu_fd_getpagesize(int fd)
{
#ifdef CONFIG_LINUX
    struct statfs fs;
    int ret;

    if (fd != -1) {
        /* Retry for as long as the call is interrupted by a signal */
        do {
            ret = fstatfs(fd, &fs);
        } while (ret != 0 && errno == EINTR);

        if (ret == 0 && fs.f_type == HUGETLBFS_MAGIC) {
            return fs.f_bsize;
        }
    }
#ifdef __sparc__
    /* SPARC Linux needs greater alignment than the pagesize */
    return QEMU_VMALLOC_ALIGN;
#endif
#endif

    return getpagesize();
}

/*
 * Return the page size that applies to memory backed by files under
 * @mem_path.
 *
 * @mem_path: path on the filesystem that will back guest RAM.
 *
 * On Linux the path is inspected with statfs(); a hugetlbfs mount yields
 * the filesystem block size (the huge page size).  Otherwise the result is
 * QEMU_VMALLOC_ALIGN on SPARC Linux and the host page size everywhere
 * else.  Unlike qemu_fd_getpagesize(), a statfs() failure is reported on
 * stderr instead of being ignored.
 *
 * NOTE(review): this function was restored from a line-damaged copy.  The
 * CONFIG_LINUX/__sparc__ guards, the local declarations, the "ret != 0"
 * test, the strerror(errno) argument, the exit(1) after the message, the
 * f_bsize return and the final getpagesize() fallback were not visible and
 * should be confirmed against the pristine file.
 */
size_t qemu_mempath_getpagesize(const char *mem_path)
{
#ifdef CONFIG_LINUX
    struct statfs fs;
    int ret;

    /* Retry for as long as the call is interrupted by a signal */
    do {
        ret = statfs(mem_path, &fs);
    } while (ret != 0 && errno == EINTR);

    if (ret != 0) {
        fprintf(stderr, "Couldn't statfs() memory path: %s\n",
                strerror(errno));
        /* fs is uninitialised at this point, so it must not be read */
        exit(1);
    }

    if (fs.f_type == HUGETLBFS_MAGIC) {
        /* It's hugepage, return the huge page size */
        return fs.f_bsize;
    }
#ifdef __sparc__
    /* SPARC Linux needs greater alignment than the pagesize */
    return QEMU_VMALLOC_ALIGN;
#endif
#endif

    return getpagesize();
}

/*
 * Map @size bytes of RAM at an address aligned to @align, followed by a
 * PROT_NONE guard page.
 *
 * @fd:     file descriptor backing the RAM, or -1 for anonymous memory.
 * @size:   number of bytes to map readable and writable.
 * @align:  required alignment of the returned address; asserted to be a
 *          power of two and at least the page size in use.
 * @shared: true for a MAP_SHARED mapping, false for MAP_PRIVATE.
 *
 * Returns the address of the RAM mapping, or MAP_FAILED if either mmap()
 * call fails.
 *
 * The function first reserves an inaccessible region large enough to hold
 * an aligned block, maps the RAM over the aligned part of it, and then
 * trims the unused head and tail so that only the RAM block plus one
 * trailing guard page remain mapped.
 *
 * NOTE(review): this function was restored from a line-damaged copy.  The
 * local declarations, "total = size + align", "flags = MAP_PRIVATE", the
 * guardfd assignments, the #else/#endif pair, "flags = MAP_FIXED", both
 * "return MAP_FAILED" statements, the "offset > 0" test, "total -= offset"
 * and the final "return ptr" were not visible and should be confirmed
 * against the pristine file.
 */
void *qemu_ram_mmap(int fd, size_t size, size_t align, bool shared)
{
    int flags;
    int guardfd;
    size_t offset;
    size_t pagesize;
    size_t total;
    void *guardptr;
    void *ptr;

    /*
     * Note: this always allocates at least one extra page of virtual address
     * space, even if size is already aligned.
     */
    total = size + align;

#if defined(__powerpc64__) && defined(__linux__)
    /* On ppc64 mappings in the same segment (aka slice) must share the same
     * page size. Since we will be re-allocating part of this segment
     * from the supplied fd, we should make sure to use the same page size, to
     * this end we mmap the supplied fd.  In this case, set MAP_NORESERVE to
     * avoid allocating backing store memory.
     * We do this unless we are using the system page size, in which case
     * anonymous memory is OK.
     */
    flags = MAP_PRIVATE;
    pagesize = qemu_fd_getpagesize(fd);
    if (fd == -1 || pagesize == getpagesize()) {
        guardfd = -1;
        flags |= MAP_ANONYMOUS;
    } else {
        guardfd = fd;
        flags |= MAP_NORESERVE;
    }
#else
    guardfd = -1;
    pagesize = getpagesize();
    flags = MAP_PRIVATE | MAP_ANONYMOUS;
#endif

    /* Reserve the whole range with no access rights */
    guardptr = mmap(0, total, PROT_NONE, flags, guardfd, 0);

    if (guardptr == MAP_FAILED) {
        return MAP_FAILED;
    }

    assert(is_power_of_2(align));
    /* Always align to host page size */
    assert(align >= pagesize);

    /* MAP_FIXED places the RAM inside the range reserved above */
    flags = MAP_FIXED;
    flags |= fd == -1 ? MAP_ANONYMOUS : 0;
    flags |= shared ? MAP_SHARED : MAP_PRIVATE;
    offset = QEMU_ALIGN_UP((uintptr_t)guardptr, align) - (uintptr_t)guardptr;

    ptr = mmap(guardptr + offset, size, PROT_READ | PROT_WRITE, flags, fd, 0);

    if (ptr == MAP_FAILED) {
        /* Do not leak the reservation when the real mapping fails */
        munmap(guardptr, total);
        return MAP_FAILED;
    }

    /* Release the unused bytes in front of the aligned block */
    if (offset > 0) {
        munmap(guardptr, offset);
    }

    /*
     * Leave a single PROT_NONE page allocated after the RAM block, to serve as
     * a guard page guarding against potential buffer overflows.
     */
    total -= offset;
    if (total > size + pagesize) {
        munmap(ptr + size + pagesize, total - size - pagesize);
    }

    return ptr;
}

/*
 * Unmap a RAM block together with the guard page that follows it.
 *
 * @fd:   file descriptor that backs the block, or -1 for anonymous memory.
 *        It is only consulted on ppc64 Linux, to look up the page size.
 * @ptr:  start address of the RAM block.
 * @size: size of the RAM block in bytes, not counting the guard page.
 *
 * The length passed to munmap() is @size plus one page.  On ppc64 Linux
 * that page size comes from qemu_fd_getpagesize(@fd); elsewhere it is the
 * host page size.
 *
 * NOTE(review): this function was restored from a line-damaged copy.  The
 * local declaration, the "if (ptr)" guard that makes a NULL @ptr a no-op,
 * and the #else/#endif pair were not visible and should be confirmed
 * against the pristine file.
 */
void qemu_ram_munmap(int fd, void *ptr, size_t size)
{
    size_t pagesize;

    if (ptr) {
        /* Unmap both the RAM block and the guard page */
#if defined(__powerpc64__) && defined(__linux__)
        pagesize = qemu_fd_getpagesize(fd);
#else
        pagesize = getpagesize();
#endif
        munmap(ptr, size + pagesize);
    }
}