blob: 4a3c07e0bee6ddcf168553f9c96005bdb11e42c5 [file] [log] [blame]
Marc-André Lureauf04cf922015-10-09 17:17:19 +02001/*
2 * memfd.c
3 *
4 * Copyright (c) 2015 Red Hat, Inc.
5 *
6 * QEMU library functions on POSIX which are shared between QEMU and
7 * the QEMU tools.
8 *
9 * Permission is hereby granted, free of charge, to any person obtaining a copy
10 * of this software and associated documentation files (the "Software"), to deal
11 * in the Software without restriction, including without limitation the rights
12 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
13 * copies of the Software, and to permit persons to whom the Software is
14 * furnished to do so, subject to the following conditions:
15 *
16 * The above copyright notice and this permission notice shall be included in
17 * all copies or substantial portions of the Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
20 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
22 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
23 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
24 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
25 * THE SOFTWARE.
26 */
27
28#include "qemu/osdep.h"
29
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010030#include "qapi/error.h"
Marc-André Lureauf04cf922015-10-09 17:17:19 +020031#include "qemu/memfd.h"
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +010032#include "qemu/host-utils.h"
Marc-André Lureauf04cf922015-10-09 17:17:19 +020033
Paolo Bonzini75e5b702017-11-28 11:51:27 +010034#if defined CONFIG_LINUX && !defined CONFIG_MEMFD
Marc-André Lureauf04cf922015-10-09 17:17:19 +020035#include <sys/syscall.h>
36#include <asm/unistd.h>
37
/*
 * Fallback definition of memfd_create() for Linux builds where
 * CONFIG_MEMFD is not set.
 *
 * When the syscall number is known at build time the request is passed
 * straight to the kernel; otherwise the call fails with errno set to
 * ENOSYS.  Returns the value produced by syscall(), or -1 on failure.
 */
int memfd_create(const char *name, unsigned int flags)
{
#ifndef __NR_memfd_create
    /* No syscall number available: report "not implemented". */
    errno = ENOSYS;
    return -1;
#else
    return syscall(__NR_memfd_create, name, flags);
#endif
}
47#endif
48
Marc-André Lureauc5b2a9e2018-02-01 14:27:52 +010049int qemu_memfd_create(const char *name, size_t size, bool hugetlb,
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +010050 uint64_t hugetlbsize, unsigned int seals, Error **errp)
Marc-André Lureaudcff1032017-10-23 15:18:07 +010051{
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +010052 int htsize = hugetlbsize ? ctz64(hugetlbsize) : 0;
53
Peter Maydell4f938cb2018-05-15 18:27:29 +010054 if (htsize && 1ULL << htsize != hugetlbsize) {
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +010055 error_setg(errp, "Hugepage size must be a power of 2");
56 return -1;
57 }
58
59 htsize = htsize << MFD_HUGE_SHIFT;
60
Marc-André Lureaudcff1032017-10-23 15:18:07 +010061#ifdef CONFIG_LINUX
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010062 int mfd = -1;
Marc-André Lureaudcff1032017-10-23 15:18:07 +010063 unsigned int flags = MFD_CLOEXEC;
64
65 if (seals) {
66 flags |= MFD_ALLOW_SEALING;
67 }
Marc-André Lureauc5b2a9e2018-02-01 14:27:52 +010068 if (hugetlb) {
69 flags |= MFD_HUGETLB;
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +010070 flags |= htsize;
Marc-André Lureauc5b2a9e2018-02-01 14:27:52 +010071 }
Marc-André Lureaudcff1032017-10-23 15:18:07 +010072 mfd = memfd_create(name, flags);
73 if (mfd < 0) {
Ilya Maximetsedaed6c2019-03-11 16:58:50 +030074 error_setg_errno(errp, errno,
75 "failed to create memfd with flags 0x%x", flags);
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010076 goto err;
Marc-André Lureaudcff1032017-10-23 15:18:07 +010077 }
78
79 if (ftruncate(mfd, size) == -1) {
Ilya Maximetsedaed6c2019-03-11 16:58:50 +030080 error_setg_errno(errp, errno, "failed to resize memfd to %zu", size);
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010081 goto err;
Marc-André Lureaudcff1032017-10-23 15:18:07 +010082 }
83
84 if (seals && fcntl(mfd, F_ADD_SEALS, seals) == -1) {
Ilya Maximetsedaed6c2019-03-11 16:58:50 +030085 error_setg_errno(errp, errno, "failed to add seals 0x%x", seals);
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010086 goto err;
Marc-André Lureaudcff1032017-10-23 15:18:07 +010087 }
Marc-André Lureaudcff1032017-10-23 15:18:07 +010088
89 return mfd;
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010090
91err:
92 if (mfd >= 0) {
93 close(mfd);
94 }
Ilya Maximetsedaed6c2019-03-11 16:58:50 +030095#else
96 error_setg_errno(errp, ENOSYS, "failed to create memfd");
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010097#endif
Marc-André Lureau0f2956f2018-02-01 14:27:51 +010098 return -1;
Marc-André Lureaudcff1032017-10-23 15:18:07 +010099}
100
Marc-André Lureaud3592192015-10-09 17:17:20 +0200101/*
102 * This is a best-effort helper for shared memory allocation, with
103 * optional sealing. The helper will do his best to allocate using
104 * memfd with sealing, but may fallback on other methods without
105 * sealing.
106 */
107void *qemu_memfd_alloc(const char *name, size_t size, unsigned int seals,
Marc-André Lureau0f2956f2018-02-01 14:27:51 +0100108 int *fd, Error **errp)
Marc-André Lureaud3592192015-10-09 17:17:20 +0200109{
110 void *ptr;
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +0100111 int mfd = qemu_memfd_create(name, size, false, 0, seals, NULL);
Marc-André Lureaud3592192015-10-09 17:17:20 +0200112
Marc-André Lureaudcff1032017-10-23 15:18:07 +0100113 /* some systems have memfd without sealing */
114 if (mfd == -1) {
Marc-André Lureau2ef8c0c2018-02-01 14:27:53 +0100115 mfd = qemu_memfd_create(name, size, false, 0, 0, NULL);
Marc-André Lureaud3592192015-10-09 17:17:20 +0200116 }
117
118 if (mfd == -1) {
Marc-André Lureau35f9b6e2015-10-09 17:17:21 +0200119 const char *tmpdir = g_get_tmp_dir();
120 gchar *fname;
121
122 fname = g_strdup_printf("%s/memfd-XXXXXX", tmpdir);
123 mfd = mkstemp(fname);
124 unlink(fname);
125 g_free(fname);
126
Marc-André Lureau0f2956f2018-02-01 14:27:51 +0100127 if (mfd == -1 ||
128 ftruncate(mfd, size) == -1) {
129 goto err;
Marc-André Lureau35f9b6e2015-10-09 17:17:21 +0200130 }
Marc-André Lureaud3592192015-10-09 17:17:20 +0200131 }
132
133 ptr = mmap(0, size, PROT_READ | PROT_WRITE, MAP_SHARED, mfd, 0);
134 if (ptr == MAP_FAILED) {
Marc-André Lureau0f2956f2018-02-01 14:27:51 +0100135 goto err;
Marc-André Lureaud3592192015-10-09 17:17:20 +0200136 }
137
138 *fd = mfd;
139 return ptr;
Marc-André Lureau0f2956f2018-02-01 14:27:51 +0100140
141err:
142 error_setg_errno(errp, errno, "failed to allocate shared memory");
143 if (mfd >= 0) {
144 close(mfd);
145 }
146 return NULL;
Marc-André Lureaud3592192015-10-09 17:17:20 +0200147}
148
/*
 * Release what qemu_memfd_alloc() handed out: unmap @size bytes at @ptr
 * when @ptr is non-NULL, and close @fd unless it is -1.
 */
void qemu_memfd_free(void *ptr, size_t size, int fd)
{
    if (ptr != NULL) {
        munmap(ptr, size);
    }

    /* -1 marks "no descriptor to close". */
    if (fd == -1) {
        return;
    }
    close(fd);
}
Marc-André Lureau31190ed2015-10-09 17:17:34 +0200159
/* States of the cached probe result kept by qemu_memfd_alloc_check(). */
enum {
    MEMFD_KO = 0,   /* probe ran and the allocation failed */
    MEMFD_OK = 1,   /* probe ran and the allocation succeeded */
    MEMFD_TODO = 2  /* probe has not been run yet */
};
165
Marc-André Lureau648abbf2018-03-28 14:18:04 +0200166/**
167 * qemu_memfd_alloc_check():
168 *
169 * Check if qemu_memfd_alloc() can allocate, including using a
170 * fallback implementation when host doesn't support memfd.
171 */
172bool qemu_memfd_alloc_check(void)
Marc-André Lureau31190ed2015-10-09 17:17:34 +0200173{
174 static int memfd_check = MEMFD_TODO;
175
176 if (memfd_check == MEMFD_TODO) {
177 int fd;
178 void *ptr;
179
Dima Stepanov1e7ec6c2018-06-13 11:19:54 +0300180 fd = -1;
Marc-André Lureau0f2956f2018-02-01 14:27:51 +0100181 ptr = qemu_memfd_alloc("test", 4096, 0, &fd, NULL);
Marc-André Lureau31190ed2015-10-09 17:17:34 +0200182 memfd_check = ptr ? MEMFD_OK : MEMFD_KO;
183 qemu_memfd_free(ptr, 4096, fd);
184 }
185
186 return memfd_check == MEMFD_OK;
187}
Marc-André Lureau648abbf2018-03-28 14:18:04 +0200188
/**
 * qemu_memfd_check():
 * @flags: flags to try, in addition to MFD_CLOEXEC
 *
 * Check if host supports memfd by creating one with @flags and closing
 * it again right away.
 *
 * Returns: true when the trial memfd could be created; false otherwise,
 * including on builds without CONFIG_LINUX.
 */
bool qemu_memfd_check(unsigned int flags)
{
    bool supported = false;

#ifdef CONFIG_LINUX
    int probe = memfd_create("test", flags | MFD_CLOEXEC);

    if (probe >= 0) {
        close(probe);
        supported = true;
    }
#endif

    return supported;
}