blob: 07beab174dca452d06f4e53ece5b8e9e2c8d28a4 [file] [log] [blame]
/*
 * memfd.c
 *
 * Copyright (c) 2015 Red Hat, Inc.
 *
 * QEMU library functions on POSIX which are shared between QEMU and
 * the QEMU tools.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
27
28#include "qemu/osdep.h"
29
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010030#include "qapi/error.h"
Marc-André Lureauc90204b2024-10-08 16:50:17 +040031#include "qemu/error-report.h"
Marc-André Lureauf04cf922015-10-09 17:17:19 +020032#include "qemu/memfd.h"
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +010033#include "qemu/host-utils.h"
Marc-André Lureauf04cf922015-10-09 17:17:19 +020034
#if defined(CONFIG_LINUX) && !defined(CONFIG_MEMFD)
#include <sys/syscall.h>
#include <asm/unistd.h>

/*
 * Fallback memfd_create() used on Linux builds where CONFIG_MEMFD is not
 * defined. When the syscall number is known at build time the request is
 * forwarded straight to the kernel; otherwise the call fails with ENOSYS.
 */
int memfd_create(const char *name, unsigned int flags)
{
#ifndef __NR_memfd_create
    /* No syscall number available in the build headers. */
    errno = ENOSYS;
    return -1;
#else
    return syscall(__NR_memfd_create, name, flags);
#endif
}
#endif
49
Marc-André Lureauc5b2a9e2018-02-01 14:27:52 +010050int qemu_memfd_create(const char *name, size_t size, bool hugetlb,
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +010051 uint64_t hugetlbsize, unsigned int seals, Error **errp)
Marc-André Lureaudcff1032017-10-23 15:18:07 +010052{
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +010053 int htsize = hugetlbsize ? ctz64(hugetlbsize) : 0;
54
Peter Maydell4f938cb2018-05-15 18:27:29 +010055 if (htsize && 1ULL << htsize != hugetlbsize) {
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +010056 error_setg(errp, "Hugepage size must be a power of 2");
57 return -1;
58 }
59
60 htsize = htsize << MFD_HUGE_SHIFT;
61
Marc-André Lureaudcff1032017-10-23 15:18:07 +010062#ifdef CONFIG_LINUX
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010063 int mfd = -1;
Marc-André Lureaudcff1032017-10-23 15:18:07 +010064 unsigned int flags = MFD_CLOEXEC;
65
66 if (seals) {
67 flags |= MFD_ALLOW_SEALING;
68 }
Marc-André Lureauc5b2a9e2018-02-01 14:27:52 +010069 if (hugetlb) {
70 flags |= MFD_HUGETLB;
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +010071 flags |= htsize;
Marc-André Lureauc5b2a9e2018-02-01 14:27:52 +010072 }
Marc-André Lureaudcff1032017-10-23 15:18:07 +010073 mfd = memfd_create(name, flags);
74 if (mfd < 0) {
Ilya Maximetsedaed6c2019-03-11 16:58:50 +030075 error_setg_errno(errp, errno,
76 "failed to create memfd with flags 0x%x", flags);
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010077 goto err;
Marc-André Lureaudcff1032017-10-23 15:18:07 +010078 }
79
80 if (ftruncate(mfd, size) == -1) {
Ilya Maximetsedaed6c2019-03-11 16:58:50 +030081 error_setg_errno(errp, errno, "failed to resize memfd to %zu", size);
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010082 goto err;
Marc-André Lureaudcff1032017-10-23 15:18:07 +010083 }
84
85 if (seals && fcntl(mfd, F_ADD_SEALS, seals) == -1) {
Ilya Maximetsedaed6c2019-03-11 16:58:50 +030086 error_setg_errno(errp, errno, "failed to add seals 0x%x", seals);
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010087 goto err;
Marc-André Lureaudcff1032017-10-23 15:18:07 +010088 }
Marc-André Lureaudcff1032017-10-23 15:18:07 +010089
90 return mfd;
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010091
92err:
93 if (mfd >= 0) {
94 close(mfd);
95 }
Ilya Maximetsedaed6c2019-03-11 16:58:50 +030096#else
97 error_setg_errno(errp, ENOSYS, "failed to create memfd");
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010098#endif
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010099 return -1;
Marc-André Lureaudcff1032017-10-23 15:18:07 +0100100}
101
Marc-André Lureaud3592192015-10-09 17:17:20 +0200102/*
103 * This is a best-effort helper for shared memory allocation, with
104 * optional sealing. The helper will do his best to allocate using
105 * memfd with sealing, but may fallback on other methods without
106 * sealing.
107 */
108void *qemu_memfd_alloc(const char *name, size_t size, unsigned int seals,
Marc-André Lureau0f2956f2018-02-01 14:27:51 +0100109 int *fd, Error **errp)
Marc-André Lureaud3592192015-10-09 17:17:20 +0200110{
111 void *ptr;
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +0100112 int mfd = qemu_memfd_create(name, size, false, 0, seals, NULL);
Marc-André Lureaud3592192015-10-09 17:17:20 +0200113
Marc-André Lureaudcff1032017-10-23 15:18:07 +0100114 /* some systems have memfd without sealing */
115 if (mfd == -1) {
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +0100116 mfd = qemu_memfd_create(name, size, false, 0, 0, NULL);
Marc-André Lureaud3592192015-10-09 17:17:20 +0200117 }
118
119 if (mfd == -1) {
Marc-André Lureau35f9b6e2015-10-09 17:17:21 +0200120 const char *tmpdir = g_get_tmp_dir();
121 gchar *fname;
122
123 fname = g_strdup_printf("%s/memfd-XXXXXX", tmpdir);
124 mfd = mkstemp(fname);
125 unlink(fname);
126 g_free(fname);
127
Marc-André Lureau0f2956f2018-02-01 14:27:51 +0100128 if (mfd == -1 ||
129 ftruncate(mfd, size) == -1) {
130 goto err;
Marc-André Lureau35f9b6e2015-10-09 17:17:21 +0200131 }
Marc-André Lureaud3592192015-10-09 17:17:20 +0200132 }
133
134 ptr = mmap(0, size, PROT_READ | PROT_WRITE, MAP_SHARED, mfd, 0);
135 if (ptr == MAP_FAILED) {
Marc-André Lureau0f2956f2018-02-01 14:27:51 +0100136 goto err;
Marc-André Lureaud3592192015-10-09 17:17:20 +0200137 }
138
139 *fd = mfd;
140 return ptr;
Marc-André Lureau0f2956f2018-02-01 14:27:51 +0100141
142err:
143 error_setg_errno(errp, errno, "failed to allocate shared memory");
144 if (mfd >= 0) {
145 close(mfd);
146 }
147 return NULL;
Marc-André Lureaud3592192015-10-09 17:17:20 +0200148}
149
/*
 * Tear down a mapping/descriptor pair such as the one produced by
 * qemu_memfd_alloc(): unmap @size bytes at @ptr when @ptr is non-NULL,
 * and close @fd unless it is -1. Failures are reported with
 * error_report() and are otherwise ignored.
 */
void qemu_memfd_free(void *ptr, size_t size, int fd)
{
    if (ptr != NULL && munmap(ptr, size) != 0) {
        error_report("memfd munmap() failed: %s", strerror(errno));
    }

    if (fd != -1 && close(fd) != 0) {
        error_report("memfd close() failed: %s", strerror(errno));
    }
}
Marc-André Lureau31190ed2015-10-09 17:17:34 +0200164
/* Tri-state result of a one-time capability probe. */
enum {
    MEMFD_KO = 0,   /* probe ran and failed */
    MEMFD_OK = 1,   /* probe ran and succeeded */
    MEMFD_TODO = 2  /* probe has not run yet */
};
170
Marc-André Lureau648abbf2018-03-28 14:18:04 +0200171/**
172 * qemu_memfd_alloc_check():
173 *
174 * Check if qemu_memfd_alloc() can allocate, including using a
175 * fallback implementation when host doesn't support memfd.
176 */
177bool qemu_memfd_alloc_check(void)
Marc-André Lureau31190ed2015-10-09 17:17:34 +0200178{
179 static int memfd_check = MEMFD_TODO;
180
181 if (memfd_check == MEMFD_TODO) {
182 int fd;
183 void *ptr;
184
Dima Stepanov1e7ec6c2018-06-13 11:19:54 +0300185 fd = -1;
Marc-André Lureau0f2956f2018-02-01 14:27:51 +0100186 ptr = qemu_memfd_alloc("test", 4096, 0, &fd, NULL);
Marc-André Lureau31190ed2015-10-09 17:17:34 +0200187 memfd_check = ptr ? MEMFD_OK : MEMFD_KO;
188 qemu_memfd_free(ptr, 4096, fd);
189 }
190
191 return memfd_check == MEMFD_OK;
192}
Marc-André Lureau648abbf2018-03-28 14:18:04 +0200193
/**
 * qemu_memfd_check():
 * @flags: extra memfd_create() flags to probe; MFD_CLOEXEC is always added
 *
 * Check if host supports memfd by creating (and immediately closing) a
 * test memfd with @flags. The answer is cached for the common case
 * flags=0; any other flag combination is probed on every call.
 *
 * Returns: true if the test memfd could be created, false otherwise.
 * Always false on hosts built without CONFIG_LINUX.
 */
bool qemu_memfd_check(unsigned int flags)
{
#ifdef CONFIG_LINUX
    static int memfd_check = MEMFD_TODO;
    bool supported;
    int mfd;

    if (!flags && memfd_check != MEMFD_TODO) {
        /* Compare explicitly instead of returning the enum as a bool. */
        return memfd_check == MEMFD_OK;
    }

    mfd = memfd_create("test", flags | MFD_CLOEXEC);
    supported = mfd >= 0;
    if (supported) {
        close(mfd);
    }
    if (!flags) {
        memfd_check = supported ? MEMFD_OK : MEMFD_KO;
    }
    return supported;
#else
    return false;
#endif
}