blob: a2863c8e53aa83e4b744b18318a415b85400651f [file] [log] [blame]
bellardea888122004-02-16 22:12:40 +00001/*
2 * QEMU low level functions
ths5fafdf22007-09-16 21:08:06 +00003 *
bellardea888122004-02-16 22:12:40 +00004 * Copyright (c) 2003 Fabrice Bellard
ths5fafdf22007-09-16 21:08:06 +00005 *
bellardea888122004-02-16 22:12:40 +00006 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
Peter Maydellaafd7582016-01-29 17:49:55 +000024#include "qemu/osdep.h"
Paolo Bonzinif582af52010-02-02 20:33:11 +010025
26/* Needed early for CONFIG_BSD etc. */
Paolo Bonzinif582af52010-02-02 20:33:11 +010027
Juan Quinteladfe5fff2009-07-27 16:12:40 +020028#ifdef CONFIG_SOLARIS
ths605686c2007-01-17 23:31:19 +000029#include <sys/statvfs.h>
Andreas Färbere78815a2010-09-25 11:26:05 +000030/* See MySQL bug #7156 (http://bugs.mysql.com/bug.php?id=7156) for
31 discussion about Solaris header problems */
32extern int madvise(caddr_t, size_t, int);
ths605686c2007-01-17 23:31:19 +000033#endif
bellardea888122004-02-16 22:12:40 +000034
blueswir1511d2b12009-03-07 15:32:56 +000035#include "qemu-common.h"
Veronia Bahaaf348b6d2016-03-20 19:16:19 +020036#include "qemu/cutils.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010037#include "qemu/sockets.h"
Markus Armbrusterd49b6832015-03-17 18:29:20 +010038#include "qemu/error-report.h"
Paolo Bonzini83c90892012-12-17 18:19:49 +010039#include "monitor/monitor.h"
aliguori03ff3ca2008-09-15 15:51:35 +000040
Fam Zhenge8c10942017-05-03 00:35:55 +080041#ifdef F_OFD_SETLK
42#define QEMU_SETLK F_OFD_SETLK
43#define QEMU_GETLK F_OFD_GETLK
44#else
45#define QEMU_SETLK F_SETLK
46#define QEMU_GETLK F_GETLK
47#endif
48
Paul Moore0f669982012-08-03 14:39:21 -040049static bool fips_enabled = false;
50
Eduardo Habkostd4943522016-04-09 16:42:44 -030051static const char *hw_version = QEMU_HW_VERSION;
Crístian Viana93bfef42012-05-30 00:35:51 -030052
/*
 * Set the TCP_CORK socket option on @fd to @v.
 *
 * When SOL_TCP or TCP_CORK is not defined this is a no-op that
 * returns 0; otherwise the result of qemu_setsockopt() is returned.
 */
int socket_set_cork(int fd, int v)
{
#if !defined(SOL_TCP) || !defined(TCP_CORK)
    return 0;
#else
    return qemu_setsockopt(fd, SOL_TCP, TCP_CORK, &v, sizeof(v));
#endif
}
61
/*
 * Turn on TCP_NODELAY for socket @fd.
 *
 * Returns whatever qemu_setsockopt() returns.
 */
int socket_set_nodelay(int fd)
{
    int enable = 1;

    return qemu_setsockopt(fd, IPPROTO_TCP, TCP_NODELAY,
                           &enable, sizeof(enable));
}
67
Andreas Färbere78815a2010-09-25 11:26:05 +000068int qemu_madvise(void *addr, size_t len, int advice)
69{
70 if (advice == QEMU_MADV_INVALID) {
71 errno = EINVAL;
72 return -1;
73 }
74#if defined(CONFIG_MADVISE)
75 return madvise(addr, len, advice);
76#elif defined(CONFIG_POSIX_MADVISE)
77 return posix_madvise(addr, len, advice);
78#else
79 errno = EINVAL;
80 return -1;
81#endif
82}
83
Corey Bryantadb696f2012-08-14 16:43:47 -040084#ifndef _WIN32
/*
 * Duplicate @fd with qemu_dup() and apply @flags to the duplicate.
 *
 * The O_SYNC setting of the duplicate must already match @flags,
 * otherwise the call fails with EINVAL.  The remaining flags are applied
 * with F_SETFL, and the file is truncated to zero length when @flags has
 * O_TRUNC or both O_CREAT and O_EXCL set.
 *
 * Returns the new descriptor, or -1 with errno set; on failure the
 * duplicate is closed and the errno of the failing step is preserved.
 */
static int qemu_dup_flags(int fd, int flags)
{
    const int creat_excl = O_CREAT | O_EXCL;
    int saved_errno;
    int cur_flags;
    int newfd = qemu_dup(fd);

    if (newfd == -1) {
        /* Nothing to clean up; errno comes from qemu_dup() */
        return -1;
    }

    cur_flags = fcntl(newfd, F_GETFL);
    if (cur_flags == -1) {
        goto fail;
    }

    /* The O_SYNC bits must be the same on both sides */
    if ((flags ^ cur_flags) & O_SYNC) {
        errno = EINVAL;
        goto fail;
    }

    /* Set/unset the flags that fcntl is able to change */
    if (fcntl(newfd, F_SETFL, flags) == -1) {
        goto fail;
    }

    /* Truncate in the same cases where open() would have truncated */
    if ((flags & O_TRUNC) || (flags & creat_excl) == creat_excl) {
        if (ftruncate(newfd, 0) == -1) {
            goto fail;
        }
    }

    return newfd;

fail:
    /* close() may overwrite errno, so keep the original value around */
    saved_errno = errno;
    close(newfd);
    errno = saved_errno;
    return -1;
}
Paolo Bonzini0100fbb2012-10-29 15:19:18 +0100132
/*
 * Duplicate @fd so that the copy is close-on-exec.
 *
 * Uses F_DUPFD_CLOEXEC when it is defined; otherwise falls back to dup()
 * followed by qemu_set_cloexec().  Returns the new descriptor or -1.
 */
int qemu_dup(int fd)
{
#ifdef F_DUPFD_CLOEXEC
    return fcntl(fd, F_DUPFD_CLOEXEC, 0);
#else
    int newfd = dup(fd);

    if (newfd != -1) {
        qemu_set_cloexec(newfd);
    }
    return newfd;
#endif
}
146
/* Parse the fd set id in @param by delegating to qemu_parse_fd(). */
static int qemu_parse_fdset(const char *param)
{
    int id = qemu_parse_fd(param);

    return id;
}
Fam Zheng13461fd2017-05-03 00:35:54 +0800151
152static int qemu_lock_fcntl(int fd, int64_t start, int64_t len, int fl_type)
153{
Fam Zheng13461fd2017-05-03 00:35:54 +0800154 int ret;
155 struct flock fl = {
156 .l_whence = SEEK_SET,
157 .l_start = start,
158 .l_len = len,
159 .l_type = fl_type,
160 };
Fam Zhenge8c10942017-05-03 00:35:55 +0800161 ret = fcntl(fd, QEMU_SETLK, &fl);
Fam Zheng13461fd2017-05-03 00:35:54 +0800162 return ret == -1 ? -errno : 0;
Fam Zheng13461fd2017-05-03 00:35:54 +0800163}
164
/*
 * Lock the byte range of @fd described by @start and @len: a write lock
 * when @exclusive is true, a read lock otherwise.
 *
 * Returns 0 on success or a negative errno value.
 */
int qemu_lock_fd(int fd, int64_t start, int64_t len, bool exclusive)
{
    int lock_type = F_RDLCK;

    if (exclusive) {
        lock_type = F_WRLCK;
    }
    return qemu_lock_fcntl(fd, start, len, lock_type);
}
169
/*
 * Release the lock on the byte range of @fd described by @start and @len.
 *
 * Returns 0 on success or a negative errno value.
 */
int qemu_unlock_fd(int fd, int64_t start, int64_t len)
{
    int rc = qemu_lock_fcntl(fd, start, len, F_UNLCK);

    return rc;
}
174
175int qemu_lock_fd_test(int fd, int64_t start, int64_t len, bool exclusive)
176{
Fam Zheng13461fd2017-05-03 00:35:54 +0800177 int ret;
178 struct flock fl = {
179 .l_whence = SEEK_SET,
180 .l_start = start,
181 .l_len = len,
182 .l_type = exclusive ? F_WRLCK : F_RDLCK,
183 };
Fam Zhenge8c10942017-05-03 00:35:55 +0800184 ret = fcntl(fd, QEMU_GETLK, &fl);
Fam Zheng13461fd2017-05-03 00:35:54 +0800185 if (ret == -1) {
186 return -errno;
187 } else {
188 return fl.l_type == F_UNLCK ? 0 : -EAGAIN;
189 }
Fam Zheng13461fd2017-05-03 00:35:54 +0800190}
Corey Bryantadb696f2012-08-14 16:43:47 -0400191#endif
aliguori03ff3ca2008-09-15 15:51:35 +0000192
/*
 * Open @name with @flags and make the descriptor close-on-exec.
 *
 * A third (mode) argument is read only when @flags contains O_CREAT.
 *
 * On non-Windows builds a @name of the form "/dev/fdset/<id>" is not
 * opened from the file system: a descriptor is looked up in monitor fd
 * set <id>, duplicated with qemu_dup_flags(), and the duplicate is
 * registered with that fd set before being returned.
 *
 * Returns the descriptor, or -1 with errno set.
 */
int qemu_open(const char *name, int flags, ...)
{
    int fd;
    int mode = 0;

#ifndef _WIN32
    const char *id_str;

    /* Names under /dev/fdset/ are served from a monitor fd set */
    if (strstart(name, "/dev/fdset/", &id_str)) {
        int64_t set_id = qemu_parse_fdset(id_str);
        int src_fd;
        int new_fd;

        if (set_id == -1) {
            errno = EINVAL;
            return -1;
        }

        src_fd = monitor_fdset_get_fd(set_id, flags);
        if (src_fd == -1) {
            return -1;
        }

        new_fd = qemu_dup_flags(src_fd, flags);
        if (new_fd == -1) {
            return -1;
        }

        if (monitor_fdset_dup_fd_add(set_id, new_fd) == -1) {
            close(new_fd);
            errno = EINVAL;
            return -1;
        }

        return new_fd;
    }
#endif

    /* The mode argument is only present when a file may be created */
    if (flags & O_CREAT) {
        va_list args;

        va_start(args, flags);
        mode = va_arg(args, int);
        va_end(args);
    }

#ifdef O_CLOEXEC
    fd = open(name, flags | O_CLOEXEC, mode);
#else
    fd = open(name, flags, mode);
    if (fd >= 0) {
        qemu_set_cloexec(fd);
    }
#endif

#ifdef O_DIRECT
    if ((flags & O_DIRECT) && fd == -1 && errno == EINVAL) {
        error_report("file system may not support O_DIRECT");
        errno = EINVAL; /* in case it was clobbered */
    }
#endif /* O_DIRECT */

    return fd;
}
262
/*
 * Close @fd.
 *
 * When monitor_fdset_dup_fd_find() reports that @fd was dup'd from an fd
 * set, the descriptor is also removed from that set after a successful
 * close().  Returns the result of close().
 */
int qemu_close(int fd)
{
    int rc;

    if (monitor_fdset_dup_fd_find(fd) == -1) {
        /* Not tracked by any fd set: plain close */
        return close(fd);
    }

    rc = close(fd);
    if (rc == 0) {
        monitor_fdset_dup_fd_remove(fd);
    }
    return rc;
}
282
/*
 * A variant of write(2) which handles partial writes.
 *
 * Return the number of bytes transferred.
 * Set errno if fewer than `count' bytes are written.
 *
 * This function doesn't work with non-blocking fds.
 * Any of the possibilities with non-blocking fds is bad:
 *   - return a short write (then the name is wrong)
 *   - busy wait adding (errno == EAGAIN) to the loop
 */
ssize_t qemu_write_full(int fd, const void *buf, size_t count)
{
    /* Byte-typed cursor: arithmetic on void * is a GNU extension, not ISO C */
    const char *cursor = buf;
    ssize_t total = 0;

    while (count) {
        ssize_t ret = write(fd, cursor, count);

        if (ret < 0) {
            if (errno == EINTR) {
                /* Interrupted before anything was written: retry */
                continue;
            }
            /* Real error: report what was written so far, errno is set */
            break;
        }

        count -= ret;
        cursor += ret;
        total += ret;
    }

    return total;
}
314
/*
 * Create a socket that is close-on-exec.
 *
 * When SOCK_CLOEXEC is defined it is tried first; only if that attempt
 * fails with EINVAL is the socket created without it and marked with
 * qemu_set_cloexec() afterwards.  Returns the descriptor or -1.
 */
int qemu_socket(int domain, int type, int protocol)
{
    int sock;

#ifdef SOCK_CLOEXEC
    sock = socket(domain, type | SOCK_CLOEXEC, protocol);
    if (!(sock == -1 && errno == EINVAL)) {
        return sock;
    }
#endif
    sock = socket(domain, type, protocol);
    if (sock >= 0) {
        qemu_set_cloexec(sock);
    }

    return sock;
}
335
/*
 * Accept a connection on @s and make the new descriptor close-on-exec.
 *
 * With CONFIG_ACCEPT4, accept4(SOCK_CLOEXEC) is tried first; only when
 * it fails with ENOSYS does the code fall back to accept() followed by
 * qemu_set_cloexec().  Returns the descriptor or -1.
 */
int qemu_accept(int s, struct sockaddr *addr, socklen_t *addrlen)
{
    int conn;

#ifdef CONFIG_ACCEPT4
    conn = accept4(s, addr, addrlen, SOCK_CLOEXEC);
    if (!(conn == -1 && errno == ENOSYS)) {
        return conn;
    }
#endif
    conn = accept(s, addr, addrlen);
    if (conn >= 0) {
        qemu_set_cloexec(conn);
    }

    return conn;
}
Paolo Bonzini993295f2011-09-17 16:27:59 +0200356
Eduardo Habkost35c2c8d2015-10-30 17:36:08 -0200357void qemu_set_hw_version(const char *version)
Crístian Viana93bfef42012-05-30 00:35:51 -0300358{
Eduardo Habkost35c2c8d2015-10-30 17:36:08 -0200359 hw_version = version;
Crístian Viana93bfef42012-05-30 00:35:51 -0300360}
361
Eduardo Habkost35c2c8d2015-10-30 17:36:08 -0200362const char *qemu_hw_version(void)
Crístian Viana93bfef42012-05-30 00:35:51 -0300363{
Eduardo Habkost35c2c8d2015-10-30 17:36:08 -0200364 return hw_version;
Crístian Viana93bfef42012-05-30 00:35:51 -0300365}
Paul Moore0f669982012-08-03 14:39:21 -0400366
367void fips_set_state(bool requested)
368{
369#ifdef __linux__
370 if (requested) {
371 FILE *fds = fopen("/proc/sys/crypto/fips_enabled", "r");
372 if (fds != NULL) {
373 fips_enabled = (fgetc(fds) == '1');
374 fclose(fds);
375 }
376 }
377#else
378 fips_enabled = false;
379#endif /* __linux__ */
380
381#ifdef _FIPS_DEBUG
382 fprintf(stderr, "FIPS mode %s (requested %s)\n",
383 (fips_enabled ? "enabled" : "disabled"),
384 (requested ? "enabled" : "disabled"));
385#endif
386}
387
388bool fips_get_state(void)
389{
390 return fips_enabled;
391}
Paolo Bonzini0100fbb2012-10-29 15:19:18 +0100392
#ifdef _WIN32
/* atexit() handler registered by socket_init(): shuts Winsock down. */
static void socket_cleanup(void)
{
    WSACleanup();
}
#endif

/*
 * Initialise the socket layer.
 *
 * On Windows this starts Winsock 2.2 and registers socket_cleanup() to
 * run at exit; on other hosts there is nothing to do.
 *
 * Returns 0 on success, -1 if WSAStartup() fails.
 */
int socket_init(void)
{
#ifdef _WIN32
    WSADATA Data;
    int ret;

    ret = WSAStartup(MAKEWORD(2, 2), &Data);
    if (ret != 0) {
        /*
         * WSAStartup() returns the error code itself; WSAGetLastError()
         * must not be used when startup has failed.
         */
        fprintf(stderr, "WSAStartup: %d\n", ret);
        return -1;
    }
    atexit(socket_cleanup);
#endif
    return 0;
}
Paolo Bonzini9adea5f2013-04-21 12:01:06 +0200416
Michael Tokarevf33cc842014-05-02 18:35:55 +0400417#if !GLIB_CHECK_VERSION(2, 31, 0)
418/* Ensure that glib is running in multi-threaded mode
419 * Old versions of glib require explicit initialization. Failure to do
420 * this results in the single-threaded code paths being taken inside
421 * glib. For example, the g_slice allocator will not be thread-safe
422 * and cause crashes.
423 */
Stefan Hajnocziae2990c2013-10-08 11:58:31 +0200424static void __attribute__((constructor)) thread_init(void)
425{
426 if (!g_thread_supported()) {
Michael Tokarevf33cc842014-05-02 18:35:55 +0400427 g_thread_init(NULL);
Stefan Hajnocziae2990c2013-10-08 11:58:31 +0200428 }
429}
Michael Tokarevf33cc842014-05-02 18:35:55 +0400430#endif
Stefan Hajnocziae2990c2013-10-08 11:58:31 +0200431
#ifndef CONFIG_IOVEC
/*
 * Helper for the readv()/writev() fallbacks below (used by
 * iov_send_recv()): transfers the buffers of @iov one at a time with
 * read() or write(), depending on @do_write.
 *
 * Returns the number of bytes transferred, or -1 with errno set if an
 * error occurred before any data was processed.  A negative @iov_cnt
 * fails with EINVAL.  Processing stops at the first short transfer, so
 * the bytes counted always form one contiguous run and a read never
 * blocks waiting to fill a later buffer.  Zero-length entries are
 * skipped.
 */
static ssize_t
readv_writev(int fd, const struct iovec *iov, int iov_cnt, bool do_write)
{
    ssize_t ret = 0;
    int i = 0;

    if (iov_cnt < 0) {
        errno = EINVAL;
        return -1;
    }

    while (i < iov_cnt) {
        ssize_t r = do_write
            ? write(fd, iov[i].iov_base, iov[i].iov_len)
            : read(fd, iov[i].iov_base, iov[i].iov_len);

        if (r < 0) {
            if (errno == EINTR) {
                /* Interrupted: retry the same entry */
                continue;
            }
            /* Some "other" error: only report it if no data was processed */
            if (ret == 0) {
                ret = -1;
            }
            break;
        }

        ret += r;
        if ((size_t)r < iov[i].iov_len) {
            /* Short transfer or end of file: this area is incomplete */
            break;
        }
        i++;
    }
    return ret;
}

/* Fallback readv() for hosts without CONFIG_IOVEC. */
ssize_t
readv(int fd, const struct iovec *iov, int iov_cnt)
{
    return readv_writev(fd, iov, iov_cnt, false);
}

/* Fallback writev() for hosts without CONFIG_IOVEC. */
ssize_t
writev(int fd, const struct iovec *iov, int iov_cnt)
{
    return readv_writev(fd, iov, iov_cnt, true);
}
#endif
473#endif