bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 1 | /* |
| 2 | * mmap support for qemu |
ths | 5fafdf2 | 2007-09-16 21:08:06 +0000 | [diff] [blame] | 3 | * |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 4 | * Copyright (c) 2003 Fabrice Bellard |
| 5 | * |
| 6 | * This program is free software; you can redistribute it and/or modify |
| 7 | * it under the terms of the GNU General Public License as published by |
| 8 | * the Free Software Foundation; either version 2 of the License, or |
| 9 | * (at your option) any later version. |
| 10 | * |
| 11 | * This program is distributed in the hope that it will be useful, |
| 12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| 14 | * GNU General Public License for more details. |
| 15 | * |
| 16 | * You should have received a copy of the GNU General Public License |
Blue Swirl | 8167ee8 | 2009-07-16 20:47:01 +0000 | [diff] [blame] | 17 | * along with this program; if not, see <http://www.gnu.org/licenses/>. |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 18 | */ |
Peter Maydell | d39594e | 2016-01-26 18:17:02 +0000 | [diff] [blame] | 19 | #include "qemu/osdep.h" |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 20 | #include <sys/shm.h> |
Alex Bennée | 11d9605 | 2019-12-05 12:25:12 +0000 | [diff] [blame] | 21 | #include "trace.h" |
Alex Bennée | 10d0d50 | 2019-12-05 12:25:15 +0000 | [diff] [blame] | 22 | #include "exec/log.h" |
Philippe Mathieu-Daudé | 74781c0 | 2023-12-06 20:27:32 +0100 | [diff] [blame] | 23 | #include "exec/page-protection.h" |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 24 | #include "qemu.h" |
Peter Maydell | 3b249d2 | 2021-09-08 16:44:03 +0100 | [diff] [blame] | 25 | #include "user-internals.h" |
Peter Maydell | 5423e6d | 2021-09-08 16:44:01 +0100 | [diff] [blame] | 26 | #include "user-mmap.h" |
Ilya Leoshkevich | 8655b4c | 2022-09-06 02:08:36 +0200 | [diff] [blame] | 27 | #include "target_mman.h" |
Richard Henderson | 044e95c | 2023-08-20 13:39:37 -0700 | [diff] [blame] | 28 | #include "qemu/interval-tree.h" |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 29 | |
Peter Maydell | 5a53431 | 2023-10-24 17:35:05 +0100 | [diff] [blame] | 30 | #ifdef TARGET_ARM |
| 31 | #include "target/arm/cpu-features.h" |
| 32 | #endif |
| 33 | |
Blue Swirl | 1e6eec8 | 2009-09-05 10:14:07 +0000 | [diff] [blame] | 34 | static pthread_mutex_t mmap_mutex = PTHREAD_MUTEX_INITIALIZER; |
Juan Quintela | dfd3f85 | 2009-09-23 01:19:03 +0200 | [diff] [blame] | 35 | static __thread int mmap_lock_count; |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 36 | |
| 37 | void mmap_lock(void) |
| 38 | { |
| 39 | if (mmap_lock_count++ == 0) { |
| 40 | pthread_mutex_lock(&mmap_mutex); |
| 41 | } |
| 42 | } |
| 43 | |
| 44 | void mmap_unlock(void) |
| 45 | { |
Richard Henderson | 990ef91 | 2023-07-17 19:58:58 +0100 | [diff] [blame] | 46 | assert(mmap_lock_count > 0); |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 47 | if (--mmap_lock_count == 0) { |
| 48 | pthread_mutex_unlock(&mmap_mutex); |
| 49 | } |
| 50 | } |
pbrook | d597536 | 2008-06-07 20:50:51 +0000 | [diff] [blame] | 51 | |
Alex Bennée | 301e40e | 2016-10-27 16:10:00 +0100 | [diff] [blame] | 52 | bool have_mmap_lock(void) |
| 53 | { |
| 54 | return mmap_lock_count > 0 ? true : false; |
| 55 | } |
| 56 | |
pbrook | d597536 | 2008-06-07 20:50:51 +0000 | [diff] [blame] | 57 | /* Grab lock to make sure things are in a consistent state after fork(). */ |
| 58 | void mmap_fork_start(void) |
| 59 | { |
| 60 | if (mmap_lock_count) |
| 61 | abort(); |
| 62 | pthread_mutex_lock(&mmap_mutex); |
| 63 | } |
| 64 | |
| 65 | void mmap_fork_end(int child) |
| 66 | { |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 67 | if (child) { |
pbrook | d597536 | 2008-06-07 20:50:51 +0000 | [diff] [blame] | 68 | pthread_mutex_init(&mmap_mutex, NULL); |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 69 | } else { |
pbrook | d597536 | 2008-06-07 20:50:51 +0000 | [diff] [blame] | 70 | pthread_mutex_unlock(&mmap_mutex); |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 71 | } |
pbrook | d597536 | 2008-06-07 20:50:51 +0000 | [diff] [blame] | 72 | } |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 73 | |
Richard Henderson | 044e95c | 2023-08-20 13:39:37 -0700 | [diff] [blame] | 74 | /* Protected by mmap_lock. */ |
| 75 | static IntervalTreeRoot shm_regions; |
| 76 | |
| 77 | static void shm_region_add(abi_ptr start, abi_ptr last) |
| 78 | { |
| 79 | IntervalTreeNode *i = g_new0(IntervalTreeNode, 1); |
| 80 | |
| 81 | i->start = start; |
| 82 | i->last = last; |
| 83 | interval_tree_insert(i, &shm_regions); |
| 84 | } |
| 85 | |
| 86 | static abi_ptr shm_region_find(abi_ptr start) |
| 87 | { |
| 88 | IntervalTreeNode *i; |
| 89 | |
| 90 | for (i = interval_tree_iter_first(&shm_regions, start, start); i; |
| 91 | i = interval_tree_iter_next(i, start, start)) { |
| 92 | if (i->start == start) { |
| 93 | return i->last; |
| 94 | } |
| 95 | } |
| 96 | return 0; |
| 97 | } |
| 98 | |
| 99 | static void shm_region_rm_complete(abi_ptr start, abi_ptr last) |
| 100 | { |
| 101 | IntervalTreeNode *i, *n; |
| 102 | |
| 103 | for (i = interval_tree_iter_first(&shm_regions, start, last); i; i = n) { |
| 104 | n = interval_tree_iter_next(i, start, last); |
| 105 | if (i->start >= start && i->last <= last) { |
| 106 | interval_tree_remove(i, &shm_regions); |
| 107 | g_free(i); |
| 108 | } |
| 109 | } |
| 110 | } |
| 111 | |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 112 | /* |
| 113 | * Validate target prot bitmask. |
| 114 | * Return the prot bitmask for the host in *HOST_PROT. |
| 115 | * Return 0 if the target prot bitmask is invalid, otherwise |
| 116 | * the internal qemu page_flags (which will include PAGE_VALID). |
| 117 | */ |
Richard Henderson | 0dd5581 | 2023-07-07 21:40:40 +0100 | [diff] [blame] | 118 | static int validate_prot_to_pageflags(int prot) |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 119 | { |
| 120 | int valid = PROT_READ | PROT_WRITE | PROT_EXEC | TARGET_PROT_SEM; |
BALATON Zoltan | 86b7c55 | 2024-05-05 14:10:08 +0200 | [diff] [blame] | 121 | int page_flags = (prot & PAGE_RWX) | PAGE_VALID; |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 122 | |
Richard Henderson | be5d6f4 | 2020-10-21 10:37:39 -0700 | [diff] [blame] | 123 | #ifdef TARGET_AARCH64 |
Richard Henderson | d109b46 | 2021-02-12 10:48:55 -0800 | [diff] [blame] | 124 | { |
Richard Henderson | be5d6f4 | 2020-10-21 10:37:39 -0700 | [diff] [blame] | 125 | ARMCPU *cpu = ARM_CPU(thread_cpu); |
Richard Henderson | d109b46 | 2021-02-12 10:48:55 -0800 | [diff] [blame] | 126 | |
| 127 | /* |
| 128 | * The PROT_BTI bit is only accepted if the cpu supports the feature. |
| 129 | * Since this is the unusual case, don't bother checking unless |
| 130 | * the bit has been requested. If set and valid, record the bit |
| 131 | * within QEMU's page_flags. |
| 132 | */ |
| 133 | if ((prot & TARGET_PROT_BTI) && cpu_isar_feature(aa64_bti, cpu)) { |
Richard Henderson | be5d6f4 | 2020-10-21 10:37:39 -0700 | [diff] [blame] | 134 | valid |= TARGET_PROT_BTI; |
| 135 | page_flags |= PAGE_BTI; |
| 136 | } |
Richard Henderson | d109b46 | 2021-02-12 10:48:55 -0800 | [diff] [blame] | 137 | /* Similarly for the PROT_MTE bit. */ |
| 138 | if ((prot & TARGET_PROT_MTE) && cpu_isar_feature(aa64_mte, cpu)) { |
| 139 | valid |= TARGET_PROT_MTE; |
| 140 | page_flags |= PAGE_MTE; |
| 141 | } |
Richard Henderson | be5d6f4 | 2020-10-21 10:37:39 -0700 | [diff] [blame] | 142 | } |
Helge Deller | 4c184e7 | 2022-09-24 13:45:00 +0200 | [diff] [blame] | 143 | #elif defined(TARGET_HPPA) |
| 144 | valid |= PROT_GROWSDOWN | PROT_GROWSUP; |
Richard Henderson | be5d6f4 | 2020-10-21 10:37:39 -0700 | [diff] [blame] | 145 | #endif |
| 146 | |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 147 | return prot & ~valid ? 0 : page_flags; |
| 148 | } |
| 149 | |
/*
 * Convert a guest prot bitmask into the one handed to the host.
 *
 * Only read/write/exec matter to the host.  PROT_SEM is accepted by
 * every host but also ignored, so it is not translated.  Any other
 * target-specific prot bit is unknown to the host and has to be kept
 * in page_flags for qemu's own emulation.
 *
 * Guest-executable pages are never executed by the host, but the host
 * must be able to read them: PROT_EXEC is turned into PROT_READ.
 */
static int target_to_host_prot(int prot)
{
    int host_prot = prot & (PROT_READ | PROT_WRITE);

    if (prot & PROT_EXEC) {
        host_prot |= PROT_READ;
    }
    return host_prot;
}
| 165 | |
pbrook | 53a5960 | 2006-03-25 19:31:22 +0000 | [diff] [blame] | 166 | /* NOTE: all the constants are the HOST ones, but addresses are target. */ |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 167 | int target_mprotect(abi_ulong start, abi_ulong len, int target_prot) |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 168 | { |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 169 | int host_page_size = qemu_real_host_page_size(); |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 170 | abi_ulong starts[3]; |
| 171 | abi_ulong lens[3]; |
| 172 | int prots[3]; |
| 173 | abi_ulong host_start, host_last, last; |
| 174 | int prot1, ret, page_flags, nranges; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 175 | |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 176 | trace_target_mprotect(start, len, target_prot); |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 177 | |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 178 | if ((start & ~TARGET_PAGE_MASK) != 0) { |
Max Filippov | 78cf339 | 2018-02-28 14:16:05 -0800 | [diff] [blame] | 179 | return -TARGET_EINVAL; |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 180 | } |
Richard Henderson | 0dd5581 | 2023-07-07 21:40:40 +0100 | [diff] [blame] | 181 | page_flags = validate_prot_to_pageflags(target_prot); |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 182 | if (!page_flags) { |
| 183 | return -TARGET_EINVAL; |
| 184 | } |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 185 | if (len == 0) { |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 186 | return 0; |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 187 | } |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 188 | len = TARGET_PAGE_ALIGN(len); |
| 189 | if (!guest_range_valid_untagged(start, len)) { |
| 190 | return -TARGET_ENOMEM; |
| 191 | } |
| 192 | |
| 193 | last = start + len - 1; |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 194 | host_start = start & -host_page_size; |
Richard Henderson | b36b2b1 | 2024-01-02 12:57:45 +1100 | [diff] [blame] | 195 | host_last = ROUND_UP(last, host_page_size) - 1; |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 196 | nranges = 0; |
ths | 3b46e62 | 2007-09-17 08:09:54 +0000 | [diff] [blame] | 197 | |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 198 | mmap_lock(); |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 199 | |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 200 | if (host_last - host_start < host_page_size) { |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 201 | /* Single host page contains all guest pages: sum the prot. */ |
Richard Henderson | 0dd5581 | 2023-07-07 21:40:40 +0100 | [diff] [blame] | 202 | prot1 = target_prot; |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 203 | for (abi_ulong a = host_start; a < start; a += TARGET_PAGE_SIZE) { |
| 204 | prot1 |= page_get_flags(a); |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 205 | } |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 206 | for (abi_ulong a = last; a < host_last; a += TARGET_PAGE_SIZE) { |
| 207 | prot1 |= page_get_flags(a + 1); |
| 208 | } |
| 209 | starts[nranges] = host_start; |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 210 | lens[nranges] = host_page_size; |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 211 | prots[nranges] = prot1; |
| 212 | nranges++; |
| 213 | } else { |
| 214 | if (host_start < start) { |
| 215 | /* Host page contains more than one guest page: sum the prot. */ |
| 216 | prot1 = target_prot; |
| 217 | for (abi_ulong a = host_start; a < start; a += TARGET_PAGE_SIZE) { |
| 218 | prot1 |= page_get_flags(a); |
bellard | d418c81 | 2003-05-13 00:57:50 +0000 | [diff] [blame] | 219 | } |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 220 | /* If the resulting sum differs, create a new range. */ |
| 221 | if (prot1 != target_prot) { |
| 222 | starts[nranges] = host_start; |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 223 | lens[nranges] = host_page_size; |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 224 | prots[nranges] = prot1; |
| 225 | nranges++; |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 226 | host_start += host_page_size; |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 227 | } |
bellard | d418c81 | 2003-05-13 00:57:50 +0000 | [diff] [blame] | 228 | } |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 229 | |
| 230 | if (last < host_last) { |
| 231 | /* Host page contains more than one guest page: sum the prot. */ |
| 232 | prot1 = target_prot; |
| 233 | for (abi_ulong a = last; a < host_last; a += TARGET_PAGE_SIZE) { |
| 234 | prot1 |= page_get_flags(a + 1); |
| 235 | } |
| 236 | /* If the resulting sum differs, create a new range. */ |
| 237 | if (prot1 != target_prot) { |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 238 | host_last -= host_page_size; |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 239 | starts[nranges] = host_last + 1; |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 240 | lens[nranges] = host_page_size; |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 241 | prots[nranges] = prot1; |
| 242 | nranges++; |
| 243 | } |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 244 | } |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 245 | |
| 246 | /* Create a range for the middle, if any remains. */ |
| 247 | if (host_start < host_last) { |
| 248 | starts[nranges] = host_start; |
| 249 | lens[nranges] = host_last - host_start + 1; |
| 250 | prots[nranges] = target_prot; |
| 251 | nranges++; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 252 | } |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 253 | } |
ths | 3b46e62 | 2007-09-17 08:09:54 +0000 | [diff] [blame] | 254 | |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 255 | for (int i = 0; i < nranges; ++i) { |
| 256 | ret = mprotect(g2h_untagged(starts[i]), lens[i], |
| 257 | target_to_host_prot(prots[i])); |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 258 | if (ret != 0) { |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 259 | goto error; |
Richard Henderson | 9dba3ca | 2020-05-19 11:56:44 -0700 | [diff] [blame] | 260 | } |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 261 | } |
Ilya Leoshkevich | aa98e2d | 2022-08-17 17:05:03 +0200 | [diff] [blame] | 262 | |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 263 | page_set_flags(start, last, page_flags); |
Ilya Leoshkevich | aa98e2d | 2022-08-17 17:05:03 +0200 | [diff] [blame] | 264 | ret = 0; |
| 265 | |
Richard Henderson | 7bdc1ac | 2023-07-07 21:40:42 +0100 | [diff] [blame] | 266 | error: |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 267 | mmap_unlock(); |
| 268 | return ret; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 269 | } |
| 270 | |
Richard Henderson | 2952b64 | 2024-02-13 10:20:27 -1000 | [diff] [blame] | 271 | /* |
| 272 | * Perform munmap on behalf of the target, with host parameters. |
| 273 | * If reserved_va, we must replace the memory reservation. |
| 274 | */ |
| 275 | static int do_munmap(void *addr, size_t len) |
| 276 | { |
| 277 | if (reserved_va) { |
| 278 | void *ptr = mmap(addr, len, PROT_NONE, |
| 279 | MAP_FIXED | MAP_ANONYMOUS |
| 280 | | MAP_PRIVATE | MAP_NORESERVE, -1, 0); |
| 281 | return ptr == addr ? 0 : -1; |
| 282 | } |
| 283 | return munmap(addr, len); |
| 284 | } |
| 285 | |
Richard Henderson | eb5027a | 2024-01-02 12:57:58 +1100 | [diff] [blame] | 286 | /* |
| 287 | * Map an incomplete host page. |
| 288 | * |
| 289 | * Here be dragons. This case will not work if there is an existing |
| 290 | * overlapping host page, which is file mapped, and for which the mapping |
| 291 | * is beyond the end of the file. In that case, we will see SIGBUS when |
| 292 | * trying to write a portion of this page. |
| 293 | * |
| 294 | * FIXME: Work around this with a temporary signal handler and longjmp. |
| 295 | */ |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 296 | static bool mmap_frag(abi_ulong real_start, abi_ulong start, abi_ulong last, |
| 297 | int prot, int flags, int fd, off_t offset) |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 298 | { |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 299 | int host_page_size = qemu_real_host_page_size(); |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 300 | abi_ulong real_last; |
pbrook | 53a5960 | 2006-03-25 19:31:22 +0000 | [diff] [blame] | 301 | void *host_start; |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 302 | int prot_old, prot_new; |
| 303 | int host_prot_old, host_prot_new; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 304 | |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 305 | if (!(flags & MAP_ANONYMOUS) |
| 306 | && (flags & MAP_TYPE) == MAP_SHARED |
| 307 | && (prot & PROT_WRITE)) { |
| 308 | /* |
| 309 | * msync() won't work with the partial page, so we return an |
| 310 | * error if write is possible while it is a shared mapping. |
| 311 | */ |
| 312 | errno = EINVAL; |
| 313 | return false; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 314 | } |
ths | 3b46e62 | 2007-09-17 08:09:54 +0000 | [diff] [blame] | 315 | |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 316 | real_last = real_start + host_page_size - 1; |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 317 | host_start = g2h_untagged(real_start); |
| 318 | |
| 319 | /* Get the protection of the target pages outside the mapping. */ |
| 320 | prot_old = 0; |
| 321 | for (abi_ulong a = real_start; a < start; a += TARGET_PAGE_SIZE) { |
| 322 | prot_old |= page_get_flags(a); |
| 323 | } |
| 324 | for (abi_ulong a = real_last; a > last; a -= TARGET_PAGE_SIZE) { |
| 325 | prot_old |= page_get_flags(a); |
| 326 | } |
| 327 | |
| 328 | if (prot_old == 0) { |
| 329 | /* |
| 330 | * Since !(prot_old & PAGE_VALID), there were no guest pages |
| 331 | * outside of the fragment we need to map. Allocate a new host |
| 332 | * page to cover, discarding whatever else may have been present. |
| 333 | */ |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 334 | void *p = mmap(host_start, host_page_size, |
Richard Henderson | 0dd5581 | 2023-07-07 21:40:40 +0100 | [diff] [blame] | 335 | target_to_host_prot(prot), |
ths | 80210bc | 2007-11-02 19:08:57 +0000 | [diff] [blame] | 336 | flags | MAP_ANONYMOUS, -1, 0); |
Akihiko Odaki | ddcdd8c | 2023-08-02 16:17:48 +0900 | [diff] [blame] | 337 | if (p != host_start) { |
| 338 | if (p != MAP_FAILED) { |
Richard Henderson | 3bfa271 | 2024-02-13 10:40:57 -1000 | [diff] [blame] | 339 | do_munmap(p, host_page_size); |
Akihiko Odaki | ddcdd8c | 2023-08-02 16:17:48 +0900 | [diff] [blame] | 340 | errno = EEXIST; |
| 341 | } |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 342 | return false; |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 343 | } |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 344 | prot_old = prot; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 345 | } |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 346 | prot_new = prot | prot_old; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 347 | |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 348 | host_prot_old = target_to_host_prot(prot_old); |
| 349 | host_prot_new = target_to_host_prot(prot_new); |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 350 | |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 351 | /* Adjust protection to be able to write. */ |
| 352 | if (!(host_prot_old & PROT_WRITE)) { |
| 353 | host_prot_old |= PROT_WRITE; |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 354 | mprotect(host_start, host_page_size, host_prot_old); |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 355 | } |
ths | 3b46e62 | 2007-09-17 08:09:54 +0000 | [diff] [blame] | 356 | |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 357 | /* Read or zero the new guest pages. */ |
| 358 | if (flags & MAP_ANONYMOUS) { |
| 359 | memset(g2h_untagged(start), 0, last - start + 1); |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 360 | } else { |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 361 | if (pread(fd, g2h_untagged(start), last - start + 1, offset) == -1) { |
| 362 | return false; |
Chen Gang | e6deac9 | 2015-12-30 09:10:54 +0800 | [diff] [blame] | 363 | } |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 364 | } |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 365 | |
| 366 | /* Put final protection */ |
| 367 | if (host_prot_new != host_prot_old) { |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 368 | mprotect(host_start, host_page_size, host_prot_new); |
Richard Henderson | 99982be | 2023-07-07 21:40:43 +0100 | [diff] [blame] | 369 | } |
| 370 | return true; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 371 | } |
| 372 | |
Richard Henderson | c8fb5cf | 2023-08-02 14:25:27 -0700 | [diff] [blame] | 373 | abi_ulong task_unmapped_base; |
Richard Henderson | da2b71f | 2023-08-02 15:17:33 -0700 | [diff] [blame] | 374 | abi_ulong elf_et_dyn_base; |
Richard Henderson | c8fb5cf | 2023-08-02 14:25:27 -0700 | [diff] [blame] | 375 | abi_ulong mmap_next_start; |
bellard | a03e2d4 | 2007-11-14 11:29:07 +0000 | [diff] [blame] | 376 | |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 377 | /* |
| 378 | * Subroutine of mmap_find_vma, used when we have pre-allocated |
| 379 | * a chunk of guest address space. |
| 380 | */ |
Richard Henderson | 30ab9ef | 2019-05-19 13:19:52 -0700 | [diff] [blame] | 381 | static abi_ulong mmap_find_vma_reserved(abi_ulong start, abi_ulong size, |
| 382 | abi_ulong align) |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 383 | { |
Richard Henderson | 4c13048 | 2023-07-07 21:40:46 +0100 | [diff] [blame] | 384 | target_ulong ret; |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 385 | |
Richard Henderson | 4c13048 | 2023-07-07 21:40:46 +0100 | [diff] [blame] | 386 | ret = page_find_range_empty(start, reserved_va, size, align); |
| 387 | if (ret == -1 && start > mmap_min_addr) { |
| 388 | /* Restart at the beginning of the address space. */ |
| 389 | ret = page_find_range_empty(mmap_min_addr, start - 1, size, align); |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 390 | } |
| 391 | |
Richard Henderson | 4c13048 | 2023-07-07 21:40:46 +0100 | [diff] [blame] | 392 | return ret; |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 393 | } |
| 394 | |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 395 | /* |
| 396 | * Find and reserve a free memory area of size 'size'. The search |
| 397 | * starts at 'start'. |
| 398 | * It must be called with mmap_lock() held. |
| 399 | * Return -1 if error. |
| 400 | */ |
Richard Henderson | 30ab9ef | 2019-05-19 13:19:52 -0700 | [diff] [blame] | 401 | abi_ulong mmap_find_vma(abi_ulong start, abi_ulong size, abi_ulong align) |
bellard | a03e2d4 | 2007-11-14 11:29:07 +0000 | [diff] [blame] | 402 | { |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 403 | int host_page_size = qemu_real_host_page_size(); |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 404 | void *ptr, *prev; |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 405 | abi_ulong addr; |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 406 | int wrapped, repeat; |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 407 | |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 408 | align = MAX(align, host_page_size); |
Richard Henderson | 443b750 | 2019-05-19 13:19:53 -0700 | [diff] [blame] | 409 | |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 410 | /* If 'start' == 0, then a default start address is used. */ |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 411 | if (start == 0) { |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 412 | start = mmap_next_start; |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 413 | } else { |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 414 | start &= -host_page_size; |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 415 | } |
Richard Henderson | 30ab9ef | 2019-05-19 13:19:52 -0700 | [diff] [blame] | 416 | start = ROUND_UP(start, align); |
Richard Henderson | b36b2b1 | 2024-01-02 12:57:45 +1100 | [diff] [blame] | 417 | size = ROUND_UP(size, host_page_size); |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 418 | |
Laurent Vivier | b76f21a | 2015-08-24 14:53:54 +0200 | [diff] [blame] | 419 | if (reserved_va) { |
Richard Henderson | 30ab9ef | 2019-05-19 13:19:52 -0700 | [diff] [blame] | 420 | return mmap_find_vma_reserved(start, size, align); |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 421 | } |
| 422 | |
bellard | a03e2d4 | 2007-11-14 11:29:07 +0000 | [diff] [blame] | 423 | addr = start; |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 424 | wrapped = repeat = 0; |
| 425 | prev = 0; |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 426 | |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 427 | for (;; prev = ptr) { |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 428 | /* |
| 429 | * Reserve needed memory area to avoid a race. |
| 430 | * It should be discarded using: |
| 431 | * - mmap() with MAP_FIXED flag |
| 432 | * - mremap() with MREMAP_FIXED flag |
| 433 | * - shmat() with SHM_REMAP flag |
| 434 | */ |
Richard Henderson | 3e8f162 | 2021-02-12 10:48:43 -0800 | [diff] [blame] | 435 | ptr = mmap(g2h_untagged(addr), size, PROT_NONE, |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 436 | MAP_ANONYMOUS | MAP_PRIVATE | MAP_NORESERVE, -1, 0); |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 437 | |
| 438 | /* ENOMEM, if host address space has no memory */ |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 439 | if (ptr == MAP_FAILED) { |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 440 | return (abi_ulong)-1; |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 441 | } |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 442 | |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 443 | /* |
| 444 | * Count the number of sequential returns of the same address. |
| 445 | * This is used to modify the search algorithm below. |
| 446 | */ |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 447 | repeat = (ptr == prev ? repeat + 1 : 0); |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 448 | |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 449 | if (h2g_valid(ptr + size - 1)) { |
| 450 | addr = h2g(ptr); |
| 451 | |
Richard Henderson | 30ab9ef | 2019-05-19 13:19:52 -0700 | [diff] [blame] | 452 | if ((addr & (align - 1)) == 0) { |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 453 | /* Success. */ |
Richard Henderson | c8fb5cf | 2023-08-02 14:25:27 -0700 | [diff] [blame] | 454 | if (start == mmap_next_start && addr >= task_unmapped_base) { |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 455 | mmap_next_start = addr + size; |
| 456 | } |
| 457 | return addr; |
| 458 | } |
| 459 | |
| 460 | /* The address is not properly aligned for the target. */ |
| 461 | switch (repeat) { |
| 462 | case 0: |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 463 | /* |
| 464 | * Assume the result that the kernel gave us is the |
| 465 | * first with enough free space, so start again at the |
| 466 | * next higher target page. |
| 467 | */ |
Richard Henderson | 30ab9ef | 2019-05-19 13:19:52 -0700 | [diff] [blame] | 468 | addr = ROUND_UP(addr, align); |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 469 | break; |
| 470 | case 1: |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 471 | /* |
| 472 | * Sometimes the kernel decides to perform the allocation |
| 473 | * at the top end of memory instead. |
| 474 | */ |
Richard Henderson | 30ab9ef | 2019-05-19 13:19:52 -0700 | [diff] [blame] | 475 | addr &= -align; |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 476 | break; |
| 477 | case 2: |
| 478 | /* Start over at low memory. */ |
| 479 | addr = 0; |
| 480 | break; |
| 481 | default: |
| 482 | /* Fail. This unaligned block must the last. */ |
| 483 | addr = -1; |
| 484 | break; |
| 485 | } |
| 486 | } else { |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 487 | /* |
| 488 | * Since the result the kernel gave didn't fit, start |
| 489 | * again at low memory. If any repetition, fail. |
| 490 | */ |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 491 | addr = (repeat ? -1 : 0); |
| 492 | } |
| 493 | |
| 494 | /* Unmap and try again. */ |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 495 | munmap(ptr, size); |
Kirill A. Shutemov | fe3b415 | 2009-08-13 21:03:58 +0300 | [diff] [blame] | 496 | |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 497 | /* ENOMEM if we checked the whole of the target address space. */ |
Blue Swirl | d0b3e4f | 2010-09-18 05:53:14 +0000 | [diff] [blame] | 498 | if (addr == (abi_ulong)-1) { |
bellard | a03e2d4 | 2007-11-14 11:29:07 +0000 | [diff] [blame] | 499 | return (abi_ulong)-1; |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 500 | } else if (addr == 0) { |
| 501 | if (wrapped) { |
| 502 | return (abi_ulong)-1; |
| 503 | } |
| 504 | wrapped = 1; |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 505 | /* |
| 506 | * Don't actually use 0 when wrapping, instead indicate |
| 507 | * that we'd truly like an allocation in low memory. |
| 508 | */ |
Richard Henderson | 14f24e1 | 2010-03-10 15:39:07 -0800 | [diff] [blame] | 509 | addr = (mmap_min_addr > TARGET_PAGE_SIZE |
| 510 | ? TARGET_PAGE_ALIGN(mmap_min_addr) |
| 511 | : TARGET_PAGE_SIZE); |
| 512 | } else if (wrapped && addr >= start) { |
| 513 | return (abi_ulong)-1; |
| 514 | } |
bellard | a03e2d4 | 2007-11-14 11:29:07 +0000 | [diff] [blame] | 515 | } |
bellard | a03e2d4 | 2007-11-14 11:29:07 +0000 | [diff] [blame] | 516 | } |
| 517 | |
Richard Henderson | 6ecc255 | 2024-01-02 12:57:54 +1100 | [diff] [blame] | 518 | /* |
| 519 | * Record a successful mmap within the user-exec interval tree. |
| 520 | */ |
| 521 | static abi_long mmap_end(abi_ulong start, abi_ulong last, |
| 522 | abi_ulong passthrough_start, |
| 523 | abi_ulong passthrough_last, |
| 524 | int flags, int page_flags) |
| 525 | { |
| 526 | if (flags & MAP_ANONYMOUS) { |
| 527 | page_flags |= PAGE_ANON; |
| 528 | } |
| 529 | page_flags |= PAGE_RESET; |
| 530 | if (passthrough_start > passthrough_last) { |
| 531 | page_set_flags(start, last, page_flags); |
| 532 | } else { |
| 533 | if (start < passthrough_start) { |
| 534 | page_set_flags(start, passthrough_start - 1, page_flags); |
| 535 | } |
| 536 | page_set_flags(passthrough_start, passthrough_last, |
| 537 | page_flags | PAGE_PASSTHROUGH); |
| 538 | if (passthrough_last < last) { |
| 539 | page_set_flags(passthrough_last + 1, last, page_flags); |
| 540 | } |
| 541 | } |
| 542 | shm_region_rm_complete(start, last); |
| 543 | trace_target_mmap_complete(start); |
| 544 | if (qemu_loglevel_mask(CPU_LOG_PAGE)) { |
| 545 | FILE *f = qemu_log_trylock(); |
| 546 | if (f) { |
| 547 | fprintf(f, "page layout changed following mmap\n"); |
| 548 | page_dump(f); |
| 549 | qemu_log_unlock(f); |
| 550 | } |
| 551 | } |
| 552 | return start; |
| 553 | } |
| 554 | |
Richard Henderson | 68098de | 2024-01-02 12:57:56 +1100 | [diff] [blame] | 555 | /* |
| 556 | * Special case host page size == target page size, |
| 557 | * where there are no edge conditions. |
| 558 | */ |
| 559 | static abi_long mmap_h_eq_g(abi_ulong start, abi_ulong len, |
| 560 | int host_prot, int flags, int page_flags, |
| 561 | int fd, off_t offset) |
| 562 | { |
| 563 | void *p, *want_p = g2h_untagged(start); |
| 564 | abi_ulong last; |
| 565 | |
| 566 | p = mmap(want_p, len, host_prot, flags, fd, offset); |
| 567 | if (p == MAP_FAILED) { |
| 568 | return -1; |
| 569 | } |
| 570 | /* If the host kernel does not support MAP_FIXED_NOREPLACE, emulate. */ |
| 571 | if ((flags & MAP_FIXED_NOREPLACE) && p != want_p) { |
| 572 | do_munmap(p, len); |
| 573 | errno = EEXIST; |
| 574 | return -1; |
| 575 | } |
| 576 | |
| 577 | start = h2g(p); |
| 578 | last = start + len - 1; |
| 579 | return mmap_end(start, last, start, last, flags, page_flags); |
| 580 | } |
| 581 | |
Richard Henderson | 8080b2f | 2024-01-02 12:57:57 +1100 | [diff] [blame] | 582 | /* |
| 583 | * Special case host page size < target page size. |
| 584 | * |
| 585 | * The two special cases are increased guest alignment, and mapping |
| 586 | * past the end of a file. |
| 587 | * |
| 588 | * When mapping files into a memory area larger than the file, |
| 589 | * accesses to pages beyond the file size will cause a SIGBUS. |
| 590 | * |
| 591 | * For example, if mmaping a file of 100 bytes on a host with 4K |
| 592 | * pages emulating a target with 8K pages, the target expects to |
| 593 | * be able to access the first 8K. But the host will trap us on |
| 594 | * any access beyond 4K. |
| 595 | * |
| 596 | * When emulating a target with a larger page-size than the hosts, |
| 597 | * we may need to truncate file maps at EOF and add extra anonymous |
| 598 | * pages up to the targets page boundary. |
| 599 | * |
| 600 | * This workaround only works for files that do not change. |
| 601 | * If the file is later extended (e.g. ftruncate), the SIGBUS |
| 602 | * vanishes and the proper behaviour is that changes within the |
| 603 | * anon page should be reflected in the file. |
| 604 | * |
| 605 | * However, this case is rather common with executable images, |
| 606 | * so the workaround is important for even trivial tests, whereas |
| 607 | * the mmap of of a file being extended is less common. |
| 608 | */ |
| 609 | static abi_long mmap_h_lt_g(abi_ulong start, abi_ulong len, int host_prot, |
| 610 | int mmap_flags, int page_flags, int fd, |
| 611 | off_t offset, int host_page_size) |
| 612 | { |
| 613 | void *p, *want_p = g2h_untagged(start); |
| 614 | off_t fileend_adj = 0; |
| 615 | int flags = mmap_flags; |
| 616 | abi_ulong last, pass_last; |
| 617 | |
| 618 | if (!(flags & MAP_ANONYMOUS)) { |
| 619 | struct stat sb; |
| 620 | |
| 621 | if (fstat(fd, &sb) == -1) { |
| 622 | return -1; |
| 623 | } |
| 624 | if (offset >= sb.st_size) { |
| 625 | /* |
| 626 | * The entire map is beyond the end of the file. |
| 627 | * Transform it to an anonymous mapping. |
| 628 | */ |
| 629 | flags |= MAP_ANONYMOUS; |
| 630 | fd = -1; |
| 631 | offset = 0; |
| 632 | } else if (offset + len > sb.st_size) { |
| 633 | /* |
| 634 | * A portion of the map is beyond the end of the file. |
| 635 | * Truncate the file portion of the allocation. |
| 636 | */ |
| 637 | fileend_adj = offset + len - sb.st_size; |
| 638 | } |
| 639 | } |
| 640 | |
| 641 | if (flags & (MAP_FIXED | MAP_FIXED_NOREPLACE)) { |
| 642 | if (fileend_adj) { |
| 643 | p = mmap(want_p, len, host_prot, flags | MAP_ANONYMOUS, -1, 0); |
| 644 | } else { |
| 645 | p = mmap(want_p, len, host_prot, flags, fd, offset); |
| 646 | } |
| 647 | if (p != want_p) { |
| 648 | if (p != MAP_FAILED) { |
| 649 | /* Host does not support MAP_FIXED_NOREPLACE: emulate. */ |
| 650 | do_munmap(p, len); |
| 651 | errno = EEXIST; |
| 652 | } |
| 653 | return -1; |
| 654 | } |
| 655 | |
| 656 | if (fileend_adj) { |
| 657 | void *t = mmap(p, len - fileend_adj, host_prot, |
| 658 | (flags & ~MAP_FIXED_NOREPLACE) | MAP_FIXED, |
| 659 | fd, offset); |
| 660 | |
| 661 | if (t == MAP_FAILED) { |
| 662 | int save_errno = errno; |
| 663 | |
| 664 | /* |
| 665 | * We failed a map over the top of the successful anonymous |
| 666 | * mapping above. The only failure mode is running out of VMAs, |
| 667 | * and there's nothing that we can do to detect that earlier. |
| 668 | * If we have replaced an existing mapping with MAP_FIXED, |
| 669 | * then we cannot properly recover. It's a coin toss whether |
| 670 | * it would be better to exit or continue here. |
| 671 | */ |
| 672 | if (!(flags & MAP_FIXED_NOREPLACE) && |
| 673 | !page_check_range_empty(start, start + len - 1)) { |
| 674 | qemu_log("QEMU target_mmap late failure: %s", |
| 675 | strerror(save_errno)); |
| 676 | } |
| 677 | |
| 678 | do_munmap(want_p, len); |
| 679 | errno = save_errno; |
| 680 | return -1; |
| 681 | } |
| 682 | } |
| 683 | } else { |
| 684 | size_t host_len, part_len; |
| 685 | |
| 686 | /* |
| 687 | * Take care to align the host memory. Perform a larger anonymous |
| 688 | * allocation and extract the aligned portion. Remap the file on |
| 689 | * top of that. |
| 690 | */ |
| 691 | host_len = len + TARGET_PAGE_SIZE - host_page_size; |
| 692 | p = mmap(want_p, host_len, host_prot, flags | MAP_ANONYMOUS, -1, 0); |
| 693 | if (p == MAP_FAILED) { |
| 694 | return -1; |
| 695 | } |
| 696 | |
| 697 | part_len = (uintptr_t)p & (TARGET_PAGE_SIZE - 1); |
| 698 | if (part_len) { |
| 699 | part_len = TARGET_PAGE_SIZE - part_len; |
| 700 | do_munmap(p, part_len); |
| 701 | p += part_len; |
| 702 | host_len -= part_len; |
| 703 | } |
| 704 | if (len < host_len) { |
| 705 | do_munmap(p + len, host_len - len); |
| 706 | } |
| 707 | |
| 708 | if (!(flags & MAP_ANONYMOUS)) { |
| 709 | void *t = mmap(p, len - fileend_adj, host_prot, |
| 710 | flags | MAP_FIXED, fd, offset); |
| 711 | |
| 712 | if (t == MAP_FAILED) { |
| 713 | int save_errno = errno; |
| 714 | do_munmap(p, len); |
| 715 | errno = save_errno; |
| 716 | return -1; |
| 717 | } |
| 718 | } |
| 719 | |
| 720 | start = h2g(p); |
| 721 | } |
| 722 | |
| 723 | last = start + len - 1; |
| 724 | if (fileend_adj) { |
| 725 | pass_last = ROUND_UP(last - fileend_adj, host_page_size) - 1; |
| 726 | } else { |
| 727 | pass_last = last; |
| 728 | } |
| 729 | return mmap_end(start, last, start, pass_last, mmap_flags, page_flags); |
| 730 | } |
| 731 | |
Richard Henderson | eb5027a | 2024-01-02 12:57:58 +1100 | [diff] [blame] | 732 | /* |
| 733 | * Special case host page size > target page size. |
| 734 | * |
| 735 | * The two special cases are address and file offsets that are valid |
| 736 | * for the guest that cannot be directly represented by the host. |
| 737 | */ |
| 738 | static abi_long mmap_h_gt_g(abi_ulong start, abi_ulong len, |
| 739 | int target_prot, int host_prot, |
| 740 | int flags, int page_flags, int fd, |
| 741 | off_t offset, int host_page_size) |
| 742 | { |
| 743 | void *p, *want_p = g2h_untagged(start); |
| 744 | off_t host_offset = offset & -host_page_size; |
| 745 | abi_ulong last, real_start, real_last; |
| 746 | bool misaligned_offset = false; |
| 747 | size_t host_len; |
| 748 | |
| 749 | if (!(flags & (MAP_FIXED | MAP_FIXED_NOREPLACE))) { |
| 750 | /* |
| 751 | * Adjust the offset to something representable on the host. |
| 752 | */ |
| 753 | host_len = len + offset - host_offset; |
| 754 | p = mmap(want_p, host_len, host_prot, flags, fd, host_offset); |
| 755 | if (p == MAP_FAILED) { |
| 756 | return -1; |
| 757 | } |
| 758 | |
| 759 | /* Update start to the file position at offset. */ |
| 760 | p += offset - host_offset; |
| 761 | |
| 762 | start = h2g(p); |
| 763 | last = start + len - 1; |
| 764 | return mmap_end(start, last, start, last, flags, page_flags); |
| 765 | } |
| 766 | |
| 767 | if (!(flags & MAP_ANONYMOUS)) { |
| 768 | misaligned_offset = (start ^ offset) & (host_page_size - 1); |
| 769 | |
| 770 | /* |
| 771 | * The fallback for misalignment is a private mapping + read. |
| 772 | * This carries none of semantics required of MAP_SHARED. |
| 773 | */ |
| 774 | if (misaligned_offset && (flags & MAP_TYPE) != MAP_PRIVATE) { |
| 775 | errno = EINVAL; |
| 776 | return -1; |
| 777 | } |
| 778 | } |
| 779 | |
| 780 | last = start + len - 1; |
| 781 | real_start = start & -host_page_size; |
| 782 | real_last = ROUND_UP(last, host_page_size) - 1; |
| 783 | |
| 784 | /* |
| 785 | * Handle the start and end of the mapping. |
| 786 | */ |
| 787 | if (real_start < start) { |
| 788 | abi_ulong real_page_last = real_start + host_page_size - 1; |
| 789 | if (last <= real_page_last) { |
| 790 | /* Entire allocation a subset of one host page. */ |
| 791 | if (!mmap_frag(real_start, start, last, target_prot, |
| 792 | flags, fd, offset)) { |
| 793 | return -1; |
| 794 | } |
| 795 | return mmap_end(start, last, -1, 0, flags, page_flags); |
| 796 | } |
| 797 | |
| 798 | if (!mmap_frag(real_start, start, real_page_last, target_prot, |
| 799 | flags, fd, offset)) { |
| 800 | return -1; |
| 801 | } |
| 802 | real_start = real_page_last + 1; |
| 803 | } |
| 804 | |
| 805 | if (last < real_last) { |
| 806 | abi_ulong real_page_start = real_last - host_page_size + 1; |
| 807 | if (!mmap_frag(real_page_start, real_page_start, last, |
| 808 | target_prot, flags, fd, |
| 809 | offset + real_page_start - start)) { |
| 810 | return -1; |
| 811 | } |
| 812 | real_last = real_page_start - 1; |
| 813 | } |
| 814 | |
| 815 | if (real_start > real_last) { |
| 816 | return mmap_end(start, last, -1, 0, flags, page_flags); |
| 817 | } |
| 818 | |
| 819 | /* |
| 820 | * Handle the middle of the mapping. |
| 821 | */ |
| 822 | |
| 823 | host_len = real_last - real_start + 1; |
| 824 | want_p += real_start - start; |
| 825 | |
| 826 | if (flags & MAP_ANONYMOUS) { |
| 827 | p = mmap(want_p, host_len, host_prot, flags, -1, 0); |
| 828 | } else if (!misaligned_offset) { |
| 829 | p = mmap(want_p, host_len, host_prot, flags, fd, |
| 830 | offset + real_start - start); |
| 831 | } else { |
| 832 | p = mmap(want_p, host_len, host_prot | PROT_WRITE, |
| 833 | flags | MAP_ANONYMOUS, -1, 0); |
| 834 | } |
| 835 | if (p != want_p) { |
| 836 | if (p != MAP_FAILED) { |
| 837 | do_munmap(p, host_len); |
| 838 | errno = EEXIST; |
| 839 | } |
| 840 | return -1; |
| 841 | } |
| 842 | |
| 843 | if (misaligned_offset) { |
| 844 | /* TODO: The read could be short. */ |
| 845 | if (pread(fd, p, host_len, offset + real_start - start) != host_len) { |
| 846 | do_munmap(p, host_len); |
| 847 | return -1; |
| 848 | } |
| 849 | if (!(host_prot & PROT_WRITE)) { |
| 850 | mprotect(p, host_len, host_prot); |
| 851 | } |
| 852 | } |
| 853 | |
| 854 | return mmap_end(start, last, -1, 0, flags, page_flags); |
| 855 | } |
| 856 | |
Richard Henderson | d558c39 | 2024-01-02 12:57:51 +1100 | [diff] [blame] | 857 | static abi_long target_mmap__locked(abi_ulong start, abi_ulong len, |
Richard Henderson | e8cec51 | 2024-01-02 12:57:52 +1100 | [diff] [blame] | 858 | int target_prot, int flags, int page_flags, |
Richard Henderson | d558c39 | 2024-01-02 12:57:51 +1100 | [diff] [blame] | 859 | int fd, off_t offset) |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 860 | { |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 861 | int host_page_size = qemu_real_host_page_size(); |
Richard Henderson | 68098de | 2024-01-02 12:57:56 +1100 | [diff] [blame] | 862 | int host_prot; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 863 | |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 864 | /* |
Richard Henderson | ad87d26 | 2024-01-02 12:57:55 +1100 | [diff] [blame] | 865 | * For reserved_va, we are in full control of the allocation. |
| 866 | * Find a suitable hole and convert to MAP_FIXED. |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 867 | */ |
Richard Henderson | 68098de | 2024-01-02 12:57:56 +1100 | [diff] [blame] | 868 | if (reserved_va) { |
| 869 | if (flags & MAP_FIXED_NOREPLACE) { |
| 870 | /* Validate that the chosen range is empty. */ |
| 871 | if (!page_check_range_empty(start, start + len - 1)) { |
| 872 | errno = EEXIST; |
| 873 | return -1; |
| 874 | } |
| 875 | flags = (flags & ~MAP_FIXED_NOREPLACE) | MAP_FIXED; |
| 876 | } else if (!(flags & MAP_FIXED)) { |
Richard Henderson | eb5027a | 2024-01-02 12:57:58 +1100 | [diff] [blame] | 877 | abi_ulong real_start = start & -host_page_size; |
| 878 | off_t host_offset = offset & -host_page_size; |
Richard Henderson | 68098de | 2024-01-02 12:57:56 +1100 | [diff] [blame] | 879 | size_t real_len = len + offset - host_offset; |
| 880 | abi_ulong align = MAX(host_page_size, TARGET_PAGE_SIZE); |
| 881 | |
| 882 | start = mmap_find_vma(real_start, real_len, align); |
| 883 | if (start == (abi_ulong)-1) { |
| 884 | errno = ENOMEM; |
| 885 | return -1; |
| 886 | } |
| 887 | start += offset - host_offset; |
| 888 | flags |= MAP_FIXED; |
Richard Henderson | a5e7ee4 | 2012-06-01 16:07:52 -0700 | [diff] [blame] | 889 | } |
Richard Henderson | 68098de | 2024-01-02 12:57:56 +1100 | [diff] [blame] | 890 | } |
| 891 | |
| 892 | host_prot = target_to_host_prot(target_prot); |
| 893 | |
| 894 | if (host_page_size == TARGET_PAGE_SIZE) { |
| 895 | return mmap_h_eq_g(start, len, host_prot, flags, |
| 896 | page_flags, fd, offset); |
Richard Henderson | 8080b2f | 2024-01-02 12:57:57 +1100 | [diff] [blame] | 897 | } else if (host_page_size < TARGET_PAGE_SIZE) { |
| 898 | return mmap_h_lt_g(start, len, host_prot, flags, |
| 899 | page_flags, fd, offset, host_page_size); |
bellard | a03e2d4 | 2007-11-14 11:29:07 +0000 | [diff] [blame] | 900 | } else { |
Richard Henderson | eb5027a | 2024-01-02 12:57:58 +1100 | [diff] [blame] | 901 | return mmap_h_gt_g(start, len, target_prot, host_prot, flags, |
| 902 | page_flags, fd, offset, host_page_size); |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 903 | } |
Richard Henderson | d558c39 | 2024-01-02 12:57:51 +1100 | [diff] [blame] | 904 | } |
| 905 | |
| 906 | /* NOTE: all the constants are the HOST ones */ |
| 907 | abi_long target_mmap(abi_ulong start, abi_ulong len, int target_prot, |
| 908 | int flags, int fd, off_t offset) |
| 909 | { |
| 910 | abi_long ret; |
Richard Henderson | e8cec51 | 2024-01-02 12:57:52 +1100 | [diff] [blame] | 911 | int page_flags; |
Richard Henderson | d558c39 | 2024-01-02 12:57:51 +1100 | [diff] [blame] | 912 | |
| 913 | trace_target_mmap(start, len, target_prot, flags, fd, offset); |
Richard Henderson | e8cec51 | 2024-01-02 12:57:52 +1100 | [diff] [blame] | 914 | |
| 915 | if (!len) { |
| 916 | errno = EINVAL; |
| 917 | return -1; |
| 918 | } |
| 919 | |
| 920 | page_flags = validate_prot_to_pageflags(target_prot); |
| 921 | if (!page_flags) { |
| 922 | errno = EINVAL; |
| 923 | return -1; |
| 924 | } |
| 925 | |
| 926 | /* Also check for overflows... */ |
| 927 | len = TARGET_PAGE_ALIGN(len); |
| 928 | if (!len || len != (size_t)len) { |
| 929 | errno = ENOMEM; |
| 930 | return -1; |
| 931 | } |
| 932 | |
| 933 | if (offset & ~TARGET_PAGE_MASK) { |
| 934 | errno = EINVAL; |
| 935 | return -1; |
| 936 | } |
| 937 | if (flags & (MAP_FIXED | MAP_FIXED_NOREPLACE)) { |
| 938 | if (start & ~TARGET_PAGE_MASK) { |
| 939 | errno = EINVAL; |
| 940 | return -1; |
| 941 | } |
| 942 | if (!guest_range_valid_untagged(start, len)) { |
| 943 | errno = ENOMEM; |
| 944 | return -1; |
| 945 | } |
| 946 | } |
| 947 | |
Richard Henderson | d558c39 | 2024-01-02 12:57:51 +1100 | [diff] [blame] | 948 | mmap_lock(); |
| 949 | |
Richard Henderson | e8cec51 | 2024-01-02 12:57:52 +1100 | [diff] [blame] | 950 | ret = target_mmap__locked(start, len, target_prot, flags, |
| 951 | page_flags, fd, offset); |
Richard Henderson | d558c39 | 2024-01-02 12:57:51 +1100 | [diff] [blame] | 952 | |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 953 | mmap_unlock(); |
Richard Henderson | e8cec51 | 2024-01-02 12:57:52 +1100 | [diff] [blame] | 954 | |
| 955 | /* |
| 956 | * If we're mapping shared memory, ensure we generate code for parallel |
| 957 | * execution and flush old translations. This will work up to the level |
| 958 | * supported by the host -- anything that requires EXCP_ATOMIC will not |
| 959 | * be atomic with respect to an external process. |
| 960 | */ |
| 961 | if (ret != -1 && (flags & MAP_TYPE) != MAP_PRIVATE) { |
| 962 | CPUState *cpu = thread_cpu; |
Philippe Mathieu-Daudé | b254c34 | 2024-01-10 18:09:56 +0100 | [diff] [blame] | 963 | if (!tcg_cflags_has(cpu, CF_PARALLEL)) { |
| 964 | tcg_cflags_set(cpu, CF_PARALLEL); |
Richard Henderson | e8cec51 | 2024-01-02 12:57:52 +1100 | [diff] [blame] | 965 | tb_flush(cpu); |
| 966 | } |
| 967 | } |
| 968 | |
Richard Henderson | d558c39 | 2024-01-02 12:57:51 +1100 | [diff] [blame] | 969 | return ret; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 970 | } |
| 971 | |
Richard Henderson | 912ff69 | 2023-10-03 13:59:55 -0700 | [diff] [blame] | 972 | static int mmap_reserve_or_unmap(abi_ulong start, abi_ulong len) |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 973 | { |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 974 | int host_page_size = qemu_real_host_page_size(); |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 975 | abi_ulong real_start; |
Richard Henderson | 260561d | 2023-07-07 21:40:48 +0100 | [diff] [blame] | 976 | abi_ulong real_last; |
| 977 | abi_ulong real_len; |
| 978 | abi_ulong last; |
| 979 | abi_ulong a; |
Richard Henderson | 558a441 | 2023-07-07 21:40:49 +0100 | [diff] [blame] | 980 | void *host_start; |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 981 | int prot; |
| 982 | |
Richard Henderson | 260561d | 2023-07-07 21:40:48 +0100 | [diff] [blame] | 983 | last = start + len - 1; |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 984 | real_start = start & -host_page_size; |
Richard Henderson | b36b2b1 | 2024-01-02 12:57:45 +1100 | [diff] [blame] | 985 | real_last = ROUND_UP(last, host_page_size) - 1; |
Richard Henderson | 260561d | 2023-07-07 21:40:48 +0100 | [diff] [blame] | 986 | |
| 987 | /* |
| 988 | * If guest pages remain on the first or last host pages, |
| 989 | * adjust the deallocation to retain those guest pages. |
| 990 | * The single page special case is required for the last page, |
| 991 | * lest real_start overflow to zero. |
| 992 | */ |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 993 | if (real_last - real_start < host_page_size) { |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 994 | prot = 0; |
Richard Henderson | 260561d | 2023-07-07 21:40:48 +0100 | [diff] [blame] | 995 | for (a = real_start; a < start; a += TARGET_PAGE_SIZE) { |
| 996 | prot |= page_get_flags(a); |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 997 | } |
Richard Henderson | 260561d | 2023-07-07 21:40:48 +0100 | [diff] [blame] | 998 | for (a = last; a < real_last; a += TARGET_PAGE_SIZE) { |
| 999 | prot |= page_get_flags(a + 1); |
| 1000 | } |
| 1001 | if (prot != 0) { |
Richard Henderson | 912ff69 | 2023-10-03 13:59:55 -0700 | [diff] [blame] | 1002 | return 0; |
Richard Henderson | 260561d | 2023-07-07 21:40:48 +0100 | [diff] [blame] | 1003 | } |
| 1004 | } else { |
| 1005 | for (prot = 0, a = real_start; a < start; a += TARGET_PAGE_SIZE) { |
| 1006 | prot |= page_get_flags(a); |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1007 | } |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 1008 | if (prot != 0) { |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 1009 | real_start += host_page_size; |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 1010 | } |
Richard Henderson | 260561d | 2023-07-07 21:40:48 +0100 | [diff] [blame] | 1011 | |
| 1012 | for (prot = 0, a = last; a < real_last; a += TARGET_PAGE_SIZE) { |
| 1013 | prot |= page_get_flags(a + 1); |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1014 | } |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 1015 | if (prot != 0) { |
Richard Henderson | 621ac47 | 2024-01-02 12:57:43 +1100 | [diff] [blame] | 1016 | real_last -= host_page_size; |
Richard Henderson | 260561d | 2023-07-07 21:40:48 +0100 | [diff] [blame] | 1017 | } |
| 1018 | |
| 1019 | if (real_last < real_start) { |
Richard Henderson | 912ff69 | 2023-10-03 13:59:55 -0700 | [diff] [blame] | 1020 | return 0; |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 1021 | } |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1022 | } |
Richard Henderson | 260561d | 2023-07-07 21:40:48 +0100 | [diff] [blame] | 1023 | |
| 1024 | real_len = real_last - real_start + 1; |
| 1025 | host_start = g2h_untagged(real_start); |
| 1026 | |
Richard Henderson | 2952b64 | 2024-02-13 10:20:27 -1000 | [diff] [blame] | 1027 | return do_munmap(host_start, real_len); |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1028 | } |
| 1029 | |
blueswir1 | 992f48a | 2007-10-14 16:27:31 +0000 | [diff] [blame] | 1030 | int target_munmap(abi_ulong start, abi_ulong len) |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 1031 | { |
Richard Henderson | 912ff69 | 2023-10-03 13:59:55 -0700 | [diff] [blame] | 1032 | int ret; |
| 1033 | |
Alex Bennée | b7b18d2 | 2019-12-05 12:25:16 +0000 | [diff] [blame] | 1034 | trace_target_munmap(start, len); |
| 1035 | |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 1036 | if (start & ~TARGET_PAGE_MASK) { |
Richard Henderson | 912ff69 | 2023-10-03 13:59:55 -0700 | [diff] [blame] | 1037 | errno = EINVAL; |
| 1038 | return -1; |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 1039 | } |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 1040 | len = TARGET_PAGE_ALIGN(len); |
Richard Henderson | 46b12f4 | 2021-02-12 10:48:46 -0800 | [diff] [blame] | 1041 | if (len == 0 || !guest_range_valid_untagged(start, len)) { |
Richard Henderson | 912ff69 | 2023-10-03 13:59:55 -0700 | [diff] [blame] | 1042 | errno = EINVAL; |
| 1043 | return -1; |
Max Filippov | ebf9a36 | 2018-03-07 13:50:10 -0800 | [diff] [blame] | 1044 | } |
| 1045 | |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 1046 | mmap_lock(); |
Richard Henderson | 912ff69 | 2023-10-03 13:59:55 -0700 | [diff] [blame] | 1047 | ret = mmap_reserve_or_unmap(start, len); |
| 1048 | if (likely(ret == 0)) { |
| 1049 | page_set_flags(start, start + len - 1, 0); |
| 1050 | shm_region_rm_complete(start, start + len - 1); |
| 1051 | } |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 1052 | mmap_unlock(); |
Richard Henderson | d7b0c5d | 2023-07-07 21:40:50 +0100 | [diff] [blame] | 1053 | |
Richard Henderson | 912ff69 | 2023-10-03 13:59:55 -0700 | [diff] [blame] | 1054 | return ret; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 1055 | } |
| 1056 | |
blueswir1 | 992f48a | 2007-10-14 16:27:31 +0000 | [diff] [blame] | 1057 | abi_long target_mremap(abi_ulong old_addr, abi_ulong old_size, |
| 1058 | abi_ulong new_size, unsigned long flags, |
| 1059 | abi_ulong new_addr) |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 1060 | { |
| 1061 | int prot; |
aurel32 | f19412a | 2008-12-08 18:12:40 +0000 | [diff] [blame] | 1062 | void *host_addr; |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 1063 | |
Richard Henderson | 46b12f4 | 2021-02-12 10:48:46 -0800 | [diff] [blame] | 1064 | if (!guest_range_valid_untagged(old_addr, old_size) || |
Max Filippov | ebf9a36 | 2018-03-07 13:50:10 -0800 | [diff] [blame] | 1065 | ((flags & MREMAP_FIXED) && |
Richard Henderson | 46b12f4 | 2021-02-12 10:48:46 -0800 | [diff] [blame] | 1066 | !guest_range_valid_untagged(new_addr, new_size)) || |
Richard Purdie | ccc5ccc | 2021-01-08 17:42:12 +0000 | [diff] [blame] | 1067 | ((flags & MREMAP_MAYMOVE) == 0 && |
Richard Henderson | 46b12f4 | 2021-02-12 10:48:46 -0800 | [diff] [blame] | 1068 | !guest_range_valid_untagged(old_addr, new_size))) { |
Max Filippov | ebf9a36 | 2018-03-07 13:50:10 -0800 | [diff] [blame] | 1069 | errno = ENOMEM; |
| 1070 | return -1; |
| 1071 | } |
| 1072 | |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 1073 | mmap_lock(); |
aurel32 | f19412a | 2008-12-08 18:12:40 +0000 | [diff] [blame] | 1074 | |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1075 | if (flags & MREMAP_FIXED) { |
Richard Henderson | 3e8f162 | 2021-02-12 10:48:43 -0800 | [diff] [blame] | 1076 | host_addr = mremap(g2h_untagged(old_addr), old_size, new_size, |
| 1077 | flags, g2h_untagged(new_addr)); |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1078 | |
Laurent Vivier | b76f21a | 2015-08-24 14:53:54 +0200 | [diff] [blame] | 1079 | if (reserved_va && host_addr != MAP_FAILED) { |
Richard Henderson | 2b730f7 | 2023-07-07 21:40:32 +0100 | [diff] [blame] | 1080 | /* |
| 1081 | * If new and old addresses overlap then the above mremap will |
| 1082 | * already have failed with EINVAL. |
| 1083 | */ |
Richard Henderson | 558a441 | 2023-07-07 21:40:49 +0100 | [diff] [blame] | 1084 | mmap_reserve_or_unmap(old_addr, old_size); |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1085 | } |
| 1086 | } else if (flags & MREMAP_MAYMOVE) { |
aurel32 | f19412a | 2008-12-08 18:12:40 +0000 | [diff] [blame] | 1087 | abi_ulong mmap_start; |
| 1088 | |
Richard Henderson | 30ab9ef | 2019-05-19 13:19:52 -0700 | [diff] [blame] | 1089 | mmap_start = mmap_find_vma(0, new_size, TARGET_PAGE_SIZE); |
aurel32 | f19412a | 2008-12-08 18:12:40 +0000 | [diff] [blame] | 1090 | |
| 1091 | if (mmap_start == -1) { |
| 1092 | errno = ENOMEM; |
| 1093 | host_addr = MAP_FAILED; |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1094 | } else { |
Richard Henderson | 3e8f162 | 2021-02-12 10:48:43 -0800 | [diff] [blame] | 1095 | host_addr = mremap(g2h_untagged(old_addr), old_size, new_size, |
| 1096 | flags | MREMAP_FIXED, |
| 1097 | g2h_untagged(mmap_start)); |
Laurent Vivier | b76f21a | 2015-08-24 14:53:54 +0200 | [diff] [blame] | 1098 | if (reserved_va) { |
Richard Henderson | 558a441 | 2023-07-07 21:40:49 +0100 | [diff] [blame] | 1099 | mmap_reserve_or_unmap(old_addr, old_size); |
amateur | c65ffe6 | 2010-09-14 13:22:34 +0800 | [diff] [blame] | 1100 | } |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1101 | } |
blueswir1 | 3af72a4 | 2008-12-15 17:58:49 +0000 | [diff] [blame] | 1102 | } else { |
Laurent Vivier | ea80003 | 2023-09-25 17:10:26 +0200 | [diff] [blame] | 1103 | int page_flags = 0; |
Laurent Vivier | b76f21a | 2015-08-24 14:53:54 +0200 | [diff] [blame] | 1104 | if (reserved_va && old_size < new_size) { |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1105 | abi_ulong addr; |
| 1106 | for (addr = old_addr + old_size; |
| 1107 | addr < old_addr + new_size; |
| 1108 | addr++) { |
Laurent Vivier | ea80003 | 2023-09-25 17:10:26 +0200 | [diff] [blame] | 1109 | page_flags |= page_get_flags(addr); |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1110 | } |
| 1111 | } |
Laurent Vivier | ea80003 | 2023-09-25 17:10:26 +0200 | [diff] [blame] | 1112 | if (page_flags == 0) { |
Richard Henderson | 3e8f162 | 2021-02-12 10:48:43 -0800 | [diff] [blame] | 1113 | host_addr = mremap(g2h_untagged(old_addr), |
| 1114 | old_size, new_size, flags); |
Tobias Koch | 56d1908 | 2020-10-28 22:38:33 +0100 | [diff] [blame] | 1115 | |
| 1116 | if (host_addr != MAP_FAILED) { |
| 1117 | /* Check if address fits target address space */ |
Richard Henderson | 46b12f4 | 2021-02-12 10:48:46 -0800 | [diff] [blame] | 1118 | if (!guest_range_valid_untagged(h2g(host_addr), new_size)) { |
Tobias Koch | 56d1908 | 2020-10-28 22:38:33 +0100 | [diff] [blame] | 1119 | /* Revert mremap() changes */ |
Richard Henderson | 3e8f162 | 2021-02-12 10:48:43 -0800 | [diff] [blame] | 1120 | host_addr = mremap(g2h_untagged(old_addr), |
| 1121 | new_size, old_size, flags); |
Tobias Koch | 56d1908 | 2020-10-28 22:38:33 +0100 | [diff] [blame] | 1122 | errno = ENOMEM; |
| 1123 | host_addr = MAP_FAILED; |
| 1124 | } else if (reserved_va && old_size > new_size) { |
Richard Henderson | 558a441 | 2023-07-07 21:40:49 +0100 | [diff] [blame] | 1125 | mmap_reserve_or_unmap(old_addr + old_size, |
| 1126 | old_size - new_size); |
Tobias Koch | 56d1908 | 2020-10-28 22:38:33 +0100 | [diff] [blame] | 1127 | } |
Paul Brook | 68a1c81 | 2010-05-29 02:27:35 +0100 | [diff] [blame] | 1128 | } |
| 1129 | } else { |
| 1130 | errno = ENOMEM; |
| 1131 | host_addr = MAP_FAILED; |
| 1132 | } |
aurel32 | f19412a | 2008-12-08 18:12:40 +0000 | [diff] [blame] | 1133 | } |
| 1134 | |
| 1135 | if (host_addr == MAP_FAILED) { |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 1136 | new_addr = -1; |
| 1137 | } else { |
| 1138 | new_addr = h2g(host_addr); |
| 1139 | prot = page_get_flags(old_addr); |
Richard Henderson | 49840a4 | 2023-03-06 01:51:09 +0300 | [diff] [blame] | 1140 | page_set_flags(old_addr, old_addr + old_size - 1, 0); |
Richard Henderson | 044e95c | 2023-08-20 13:39:37 -0700 | [diff] [blame] | 1141 | shm_region_rm_complete(old_addr, old_addr + old_size - 1); |
Richard Henderson | 49840a4 | 2023-03-06 01:51:09 +0300 | [diff] [blame] | 1142 | page_set_flags(new_addr, new_addr + new_size - 1, |
Richard Henderson | d9c5858 | 2021-02-12 10:48:32 -0800 | [diff] [blame] | 1143 | prot | PAGE_VALID | PAGE_RESET); |
Richard Henderson | 044e95c | 2023-08-20 13:39:37 -0700 | [diff] [blame] | 1144 | shm_region_rm_complete(new_addr, new_addr + new_size - 1); |
pbrook | c8a706f | 2008-06-02 16:16:42 +0000 | [diff] [blame] | 1145 | } |
| 1146 | mmap_unlock(); |
bellard | 5493600 | 2003-05-13 00:25:15 +0000 | [diff] [blame] | 1147 | return new_addr; |
| 1148 | } |
Ilya Leoshkevich | 892a4f6 | 2022-06-21 16:42:05 +0200 | [diff] [blame] | 1149 | |
Ilya Leoshkevich | 892a4f6 | 2022-06-21 16:42:05 +0200 | [diff] [blame] | 1150 | abi_long target_madvise(abi_ulong start, abi_ulong len_in, int advice) |
| 1151 | { |
Richard Henderson | e230ec0 | 2023-07-07 21:40:54 +0100 | [diff] [blame] | 1152 | abi_ulong len; |
Ilya Leoshkevich | 892a4f6 | 2022-06-21 16:42:05 +0200 | [diff] [blame] | 1153 | int ret = 0; |
| 1154 | |
| 1155 | if (start & ~TARGET_PAGE_MASK) { |
| 1156 | return -TARGET_EINVAL; |
| 1157 | } |
Richard Henderson | e230ec0 | 2023-07-07 21:40:54 +0100 | [diff] [blame] | 1158 | if (len_in == 0) { |
Ilya Leoshkevich | 892a4f6 | 2022-06-21 16:42:05 +0200 | [diff] [blame] | 1159 | return 0; |
| 1160 | } |
Richard Henderson | e230ec0 | 2023-07-07 21:40:54 +0100 | [diff] [blame] | 1161 | len = TARGET_PAGE_ALIGN(len_in); |
| 1162 | if (len == 0 || !guest_range_valid_untagged(start, len)) { |
Ilya Leoshkevich | 892a4f6 | 2022-06-21 16:42:05 +0200 | [diff] [blame] | 1163 | return -TARGET_EINVAL; |
| 1164 | } |
| 1165 | |
Helge Deller | 4530deb | 2022-12-13 18:03:09 +0100 | [diff] [blame] | 1166 | /* Translate for some architectures which have different MADV_xxx values */ |
| 1167 | switch (advice) { |
| 1168 | case TARGET_MADV_DONTNEED: /* alpha */ |
| 1169 | advice = MADV_DONTNEED; |
| 1170 | break; |
| 1171 | case TARGET_MADV_WIPEONFORK: /* parisc */ |
| 1172 | advice = MADV_WIPEONFORK; |
| 1173 | break; |
| 1174 | case TARGET_MADV_KEEPONFORK: /* parisc */ |
| 1175 | advice = MADV_KEEPONFORK; |
| 1176 | break; |
| 1177 | /* we do not care about the other MADV_xxx values yet */ |
| 1178 | } |
| 1179 | |
Ilya Leoshkevich | 892a4f6 | 2022-06-21 16:42:05 +0200 | [diff] [blame] | 1180 | /* |
Helge Deller | 4530deb | 2022-12-13 18:03:09 +0100 | [diff] [blame] | 1181 | * Most advice values are hints, so ignoring and returning success is ok. |
Ilya Leoshkevich | 892a4f6 | 2022-06-21 16:42:05 +0200 | [diff] [blame] | 1182 | * |
Helge Deller | 4530deb | 2022-12-13 18:03:09 +0100 | [diff] [blame] | 1183 | * However, some advice values such as MADV_DONTNEED, MADV_WIPEONFORK and |
| 1184 | * MADV_KEEPONFORK are not hints and need to be emulated. |
Ilya Leoshkevich | 892a4f6 | 2022-06-21 16:42:05 +0200 | [diff] [blame] | 1185 | * |
Helge Deller | 4530deb | 2022-12-13 18:03:09 +0100 | [diff] [blame] | 1186 | * A straight passthrough for those may not be safe because qemu sometimes |
| 1187 | * turns private file-backed mappings into anonymous mappings. |
Richard Henderson | ecb796d | 2023-07-07 21:40:53 +0100 | [diff] [blame] | 1188 | * If all guest pages have PAGE_PASSTHROUGH set, mappings have the |
| 1189 | * same semantics for the host as for the guest. |
Helge Deller | 4530deb | 2022-12-13 18:03:09 +0100 | [diff] [blame] | 1190 | * |
| 1191 | * We pass through MADV_WIPEONFORK and MADV_KEEPONFORK if possible and |
| 1192 | * return failure if not. |
| 1193 | * |
| 1194 | * MADV_DONTNEED is passed through as well, if possible. |
| 1195 | * If passthrough isn't possible, we nevertheless (wrongly!) return |
| 1196 | * success, which is broken but some userspace programs fail to work |
| 1197 | * otherwise. Completely implementing such emulation is quite complicated |
| 1198 | * though. |
Ilya Leoshkevich | 892a4f6 | 2022-06-21 16:42:05 +0200 | [diff] [blame] | 1199 | */ |
| 1200 | mmap_lock(); |
Helge Deller | 4530deb | 2022-12-13 18:03:09 +0100 | [diff] [blame] | 1201 | switch (advice) { |
| 1202 | case MADV_WIPEONFORK: |
| 1203 | case MADV_KEEPONFORK: |
| 1204 | ret = -EINVAL; |
| 1205 | /* fall through */ |
| 1206 | case MADV_DONTNEED: |
Richard Henderson | ecb796d | 2023-07-07 21:40:53 +0100 | [diff] [blame] | 1207 | if (page_check_range(start, len, PAGE_PASSTHROUGH)) { |
Helge Deller | 4530deb | 2022-12-13 18:03:09 +0100 | [diff] [blame] | 1208 | ret = get_errno(madvise(g2h_untagged(start), len, advice)); |
| 1209 | if ((advice == MADV_DONTNEED) && (ret == 0)) { |
Richard Henderson | 10310cb | 2023-03-06 02:03:13 +0300 | [diff] [blame] | 1210 | page_reset_target_data(start, start + len - 1); |
Helge Deller | 4530deb | 2022-12-13 18:03:09 +0100 | [diff] [blame] | 1211 | } |
Vitaly Buka | dbbf897 | 2022-07-11 15:00:28 -0700 | [diff] [blame] | 1212 | } |
Ilya Leoshkevich | 892a4f6 | 2022-06-21 16:42:05 +0200 | [diff] [blame] | 1213 | } |
| 1214 | mmap_unlock(); |
| 1215 | |
| 1216 | return ret; |
| 1217 | } |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1218 | |
| 1219 | #ifndef TARGET_FORCE_SHMLBA |
| 1220 | /* |
| 1221 | * For most architectures, SHMLBA is the same as the page size; |
| 1222 | * some architectures have larger values, in which case they should |
| 1223 | * define TARGET_FORCE_SHMLBA and provide a target_shmlba() function. |
| 1224 | * This corresponds to the kernel arch code defining __ARCH_FORCE_SHMLBA |
| 1225 | * and defining its own value for SHMLBA. |
| 1226 | * |
| 1227 | * The kernel also permits SHMLBA to be set by the architecture to a |
| 1228 | * value larger than the page size without setting __ARCH_FORCE_SHMLBA; |
| 1229 | * this means that addresses are rounded to the large size if |
| 1230 | * SHM_RND is set but addresses not aligned to that size are not rejected |
| 1231 | * as long as they are at least page-aligned. Since the only architecture |
| 1232 | * which uses this is ia64 this code doesn't provide for that oddity. |
| 1233 | */ |
| 1234 | static inline abi_ulong target_shmlba(CPUArchState *cpu_env) |
| 1235 | { |
| 1236 | return TARGET_PAGE_SIZE; |
| 1237 | } |
| 1238 | #endif |
| 1239 | |
/*
 * HOST_FORCE_SHMLBA is 1 when building for an arm, mips or sparc host
 * and 0 for every other host.
 */
#if !(defined(__arm__) || defined(__mips__) || defined(__sparc__))
#define HOST_FORCE_SHMLBA 0
#else
#define HOST_FORCE_SHMLBA 1
#endif
| 1245 | |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1246 | abi_ulong target_shmat(CPUArchState *cpu_env, int shmid, |
| 1247 | abi_ulong shmaddr, int shmflg) |
| 1248 | { |
| 1249 | CPUState *cpu = env_cpu(cpu_env); |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1250 | struct shmid_ds shm_info; |
Richard Henderson | 69fa270 | 2023-08-20 10:08:44 -0700 | [diff] [blame] | 1251 | int ret; |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1252 | int h_pagesize; |
| 1253 | int t_shmlba, h_shmlba, m_shmlba; |
| 1254 | size_t t_len, h_len, m_len; |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1255 | |
| 1256 | /* shmat pointers are always untagged */ |
| 1257 | |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1258 | /* |
| 1259 | * Because we can't use host shmat() unless the address is sufficiently |
| 1260 | * aligned for the host, we'll need to check both. |
| 1261 | * TODO: Could be fixed with softmmu. |
| 1262 | */ |
| 1263 | t_shmlba = target_shmlba(cpu_env); |
| 1264 | h_pagesize = qemu_real_host_page_size(); |
| 1265 | h_shmlba = (HOST_FORCE_SHMLBA ? SHMLBA : h_pagesize); |
| 1266 | m_shmlba = MAX(t_shmlba, h_shmlba); |
| 1267 | |
| 1268 | if (shmaddr) { |
| 1269 | if (shmaddr & (m_shmlba - 1)) { |
| 1270 | if (shmflg & SHM_RND) { |
| 1271 | /* |
| 1272 | * The guest is allowing the kernel to round the address. |
| 1273 | * Assume that the guest is ok with us rounding to the |
| 1274 | * host required alignment too. Anyway if we don't, we'll |
| 1275 | * get an error from the kernel. |
| 1276 | */ |
| 1277 | shmaddr &= ~(m_shmlba - 1); |
| 1278 | if (shmaddr == 0 && (shmflg & SHM_REMAP)) { |
| 1279 | return -TARGET_EINVAL; |
| 1280 | } |
| 1281 | } else { |
| 1282 | int require = TARGET_PAGE_SIZE; |
| 1283 | #ifdef TARGET_FORCE_SHMLBA |
| 1284 | require = t_shmlba; |
| 1285 | #endif |
| 1286 | /* |
| 1287 | * Include host required alignment, as otherwise we cannot |
| 1288 | * use host shmat at all. |
| 1289 | */ |
| 1290 | require = MAX(require, h_shmlba); |
| 1291 | if (shmaddr & (require - 1)) { |
| 1292 | return -TARGET_EINVAL; |
| 1293 | } |
| 1294 | } |
| 1295 | } |
| 1296 | } else { |
| 1297 | if (shmflg & SHM_REMAP) { |
| 1298 | return -TARGET_EINVAL; |
| 1299 | } |
| 1300 | } |
| 1301 | /* All rounding now manually concluded. */ |
| 1302 | shmflg &= ~SHM_RND; |
| 1303 | |
| 1304 | /* Find out the length of the shared memory segment. */ |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1305 | ret = get_errno(shmctl(shmid, IPC_STAT, &shm_info)); |
| 1306 | if (is_error(ret)) { |
| 1307 | /* can't get length, bail out */ |
| 1308 | return ret; |
| 1309 | } |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1310 | t_len = TARGET_PAGE_ALIGN(shm_info.shm_segsz); |
| 1311 | h_len = ROUND_UP(shm_info.shm_segsz, h_pagesize); |
| 1312 | m_len = MAX(t_len, h_len); |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1313 | |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1314 | if (!guest_range_valid_untagged(shmaddr, m_len)) { |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1315 | return -TARGET_EINVAL; |
| 1316 | } |
| 1317 | |
Richard Henderson | 69fa270 | 2023-08-20 10:08:44 -0700 | [diff] [blame] | 1318 | WITH_MMAP_LOCK_GUARD() { |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1319 | bool mapped = false; |
| 1320 | void *want, *test; |
Richard Henderson | 044e95c | 2023-08-20 13:39:37 -0700 | [diff] [blame] | 1321 | abi_ulong last; |
Richard Henderson | 69fa270 | 2023-08-20 10:08:44 -0700 | [diff] [blame] | 1322 | |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1323 | if (!shmaddr) { |
| 1324 | shmaddr = mmap_find_vma(0, m_len, m_shmlba); |
| 1325 | if (shmaddr == -1) { |
Richard Henderson | 69fa270 | 2023-08-20 10:08:44 -0700 | [diff] [blame] | 1326 | return -TARGET_ENOMEM; |
| 1327 | } |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1328 | mapped = !reserved_va; |
| 1329 | } else if (shmflg & SHM_REMAP) { |
| 1330 | /* |
| 1331 | * If host page size > target page size, the host shmat may map |
| 1332 | * more memory than the guest expects. Reject a mapping that |
| 1333 | * would replace memory in the unexpected gap. |
| 1334 | * TODO: Could be fixed with softmmu. |
| 1335 | */ |
| 1336 | if (t_len < h_len && |
| 1337 | !page_check_range_empty(shmaddr + t_len, |
| 1338 | shmaddr + h_len - 1)) { |
| 1339 | return -TARGET_EINVAL; |
| 1340 | } |
| 1341 | } else { |
| 1342 | if (!page_check_range_empty(shmaddr, shmaddr + m_len - 1)) { |
| 1343 | return -TARGET_EINVAL; |
| 1344 | } |
Richard Henderson | 69fa270 | 2023-08-20 10:08:44 -0700 | [diff] [blame] | 1345 | } |
| 1346 | |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1347 | /* All placement is now complete. */ |
| 1348 | want = (void *)g2h_untagged(shmaddr); |
Richard Henderson | 69fa270 | 2023-08-20 10:08:44 -0700 | [diff] [blame] | 1349 | |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1350 | /* |
| 1351 | * Map anonymous pages across the entire range, then remap with |
| 1352 | * the shared memory. This is required for a number of corner |
| 1353 | * cases for which host and guest page sizes differ. |
| 1354 | */ |
| 1355 | if (h_len != t_len) { |
| 1356 | int mmap_p = PROT_READ | (shmflg & SHM_RDONLY ? 0 : PROT_WRITE); |
| 1357 | int mmap_f = MAP_PRIVATE | MAP_ANONYMOUS |
Ilya Leoshkevich | fa527b4 | 2024-03-25 20:23:01 +0100 | [diff] [blame] | 1358 | | (reserved_va || mapped || (shmflg & SHM_REMAP) |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1359 | ? MAP_FIXED : MAP_FIXED_NOREPLACE); |
| 1360 | |
| 1361 | test = mmap(want, m_len, mmap_p, mmap_f, -1, 0); |
| 1362 | if (unlikely(test != want)) { |
| 1363 | /* shmat returns EINVAL not EEXIST like mmap. */ |
| 1364 | ret = (test == MAP_FAILED && errno != EEXIST |
| 1365 | ? get_errno(-1) : -TARGET_EINVAL); |
| 1366 | if (mapped) { |
| 1367 | do_munmap(want, m_len); |
| 1368 | } |
| 1369 | return ret; |
| 1370 | } |
| 1371 | mapped = true; |
| 1372 | } |
| 1373 | |
| 1374 | if (reserved_va || mapped) { |
| 1375 | shmflg |= SHM_REMAP; |
| 1376 | } |
| 1377 | test = shmat(shmid, want, shmflg); |
| 1378 | if (test == MAP_FAILED) { |
| 1379 | ret = get_errno(-1); |
| 1380 | if (mapped) { |
| 1381 | do_munmap(want, m_len); |
| 1382 | } |
| 1383 | return ret; |
| 1384 | } |
| 1385 | assert(test == want); |
| 1386 | |
| 1387 | last = shmaddr + m_len - 1; |
| 1388 | page_set_flags(shmaddr, last, |
Richard Henderson | 69fa270 | 2023-08-20 10:08:44 -0700 | [diff] [blame] | 1389 | PAGE_VALID | PAGE_RESET | PAGE_READ | |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1390 | (shmflg & SHM_RDONLY ? 0 : PAGE_WRITE) | |
| 1391 | (shmflg & SHM_EXEC ? PAGE_EXEC : 0)); |
Richard Henderson | 69fa270 | 2023-08-20 10:08:44 -0700 | [diff] [blame] | 1392 | |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1393 | shm_region_rm_complete(shmaddr, last); |
| 1394 | shm_region_add(shmaddr, last); |
Richard Henderson | 69fa270 | 2023-08-20 10:08:44 -0700 | [diff] [blame] | 1395 | } |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1396 | |
| 1397 | /* |
| 1398 | * We're mapping shared memory, so ensure we generate code for parallel |
| 1399 | * execution and flush old translations. This will work up to the level |
| 1400 | * supported by the host -- anything that requires EXCP_ATOMIC will not |
| 1401 | * be atomic with respect to an external process. |
| 1402 | */ |
Philippe Mathieu-Daudé | b254c34 | 2024-01-10 18:09:56 +0100 | [diff] [blame] | 1403 | if (!tcg_cflags_has(cpu, CF_PARALLEL)) { |
| 1404 | tcg_cflags_set(cpu, CF_PARALLEL); |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1405 | tb_flush(cpu); |
| 1406 | } |
| 1407 | |
Richard Henderson | 78bc8ed | 2024-02-22 13:24:38 -1000 | [diff] [blame] | 1408 | if (qemu_loglevel_mask(CPU_LOG_PAGE)) { |
| 1409 | FILE *f = qemu_log_trylock(); |
| 1410 | if (f) { |
| 1411 | fprintf(f, "page layout changed following shmat\n"); |
| 1412 | page_dump(f); |
| 1413 | qemu_log_unlock(f); |
| 1414 | } |
| 1415 | } |
| 1416 | return shmaddr; |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1417 | } |
| 1418 | |
| 1419 | abi_long target_shmdt(abi_ulong shmaddr) |
| 1420 | { |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1421 | abi_long rv; |
| 1422 | |
| 1423 | /* shmdt pointers are always untagged */ |
| 1424 | |
Richard Henderson | 69fa270 | 2023-08-20 10:08:44 -0700 | [diff] [blame] | 1425 | WITH_MMAP_LOCK_GUARD() { |
Richard Henderson | 044e95c | 2023-08-20 13:39:37 -0700 | [diff] [blame] | 1426 | abi_ulong last = shm_region_find(shmaddr); |
| 1427 | if (last == 0) { |
Richard Henderson | ceda568 | 2023-08-20 12:38:49 -0700 | [diff] [blame] | 1428 | return -TARGET_EINVAL; |
| 1429 | } |
| 1430 | |
Richard Henderson | 69fa270 | 2023-08-20 10:08:44 -0700 | [diff] [blame] | 1431 | rv = get_errno(shmdt(g2h_untagged(shmaddr))); |
Richard Henderson | ceda568 | 2023-08-20 12:38:49 -0700 | [diff] [blame] | 1432 | if (rv == 0) { |
Richard Henderson | 044e95c | 2023-08-20 13:39:37 -0700 | [diff] [blame] | 1433 | abi_ulong size = last - shmaddr + 1; |
Richard Henderson | ceda568 | 2023-08-20 12:38:49 -0700 | [diff] [blame] | 1434 | |
Richard Henderson | 044e95c | 2023-08-20 13:39:37 -0700 | [diff] [blame] | 1435 | page_set_flags(shmaddr, last, 0); |
| 1436 | shm_region_rm_complete(shmaddr, last); |
Richard Henderson | ceda568 | 2023-08-20 12:38:49 -0700 | [diff] [blame] | 1437 | mmap_reserve_or_unmap(shmaddr, size); |
| 1438 | } |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1439 | } |
Richard Henderson | 225a206 | 2023-08-20 09:24:14 -0700 | [diff] [blame] | 1440 | return rv; |
| 1441 | } |