xref: /qemu/util/osdep.c (revision 7a4e543d)
1 /*
2  * QEMU low level functions
3  *
4  * Copyright (c) 2003 Fabrice Bellard
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a copy
7  * of this software and associated documentation files (the "Software"), to deal
8  * in the Software without restriction, including without limitation the rights
9  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10  * copies of the Software, and to permit persons to whom the Software is
11  * furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in
14  * all copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22  * THE SOFTWARE.
23  */
24 #include "qemu/osdep.h"
25 
26 /* Needed early for CONFIG_BSD etc. */
27 
28 #if defined(CONFIG_MADVISE) || defined(CONFIG_POSIX_MADVISE)
29 #include <sys/mman.h>
30 #endif
31 
32 #ifdef CONFIG_SOLARIS
33 #include <sys/statvfs.h>
34 /* See MySQL bug #7156 (http://bugs.mysql.com/bug.php?id=7156) for
35    discussion about Solaris header problems */
36 extern int madvise(caddr_t, size_t, int);
37 #endif
38 
39 #include "qemu-common.h"
40 #include "qemu/sockets.h"
41 #include "qemu/error-report.h"
42 #include "monitor/monitor.h"
43 
/* Cached FIPS state: written by fips_set_state(), read by fips_get_state(). */
static bool fips_enabled;

/*
 * Since QEMU 2.5, qemu_hw_version() reports "2.5+" by default rather
 * than QEMU_VERSION, so a MachineClass is no longer required to set
 * hw_version.
 *
 * Do NOT change this string: doing so breaks compatibility for every
 * machine class that does not set hw_version itself.
 */
static const char *hw_version = "2.5+";
54 
/*
 * Set the TCP_CORK socket option on @fd to @v.
 *
 * When SOL_TCP or TCP_CORK is not defined at build time this does
 * nothing and reports success (0).  Otherwise the result of
 * qemu_setsockopt() is returned.
 */
int socket_set_cork(int fd, int v)
{
#if !defined(SOL_TCP) || !defined(TCP_CORK)
    return 0;
#else
    return qemu_setsockopt(fd, SOL_TCP, TCP_CORK, &v, sizeof(v));
#endif
}
63 
/*
 * Turn on TCP_NODELAY for the socket @fd.
 *
 * Returns whatever qemu_setsockopt() returns.
 */
int socket_set_nodelay(int fd)
{
    int enable = 1;
    int rc;

    rc = qemu_setsockopt(fd, IPPROTO_TCP, TCP_NODELAY,
                         &enable, sizeof(enable));
    return rc;
}
69 
70 int qemu_madvise(void *addr, size_t len, int advice)
71 {
72     if (advice == QEMU_MADV_INVALID) {
73         errno = EINVAL;
74         return -1;
75     }
76 #if defined(CONFIG_MADVISE)
77     return madvise(addr, len, advice);
78 #elif defined(CONFIG_POSIX_MADVISE)
79     return posix_madvise(addr, len, advice);
80 #else
81     errno = EINVAL;
82     return -1;
83 #endif
84 }
85 
86 #ifndef _WIN32
/*
 * Duplicate @fd with close-on-exec set, then make the duplicate look as
 * if it had been opened with @flags.
 *
 * Returns the new descriptor, or -1 with errno set.  The duplicate is
 * closed again on any failure after it was created.
 */
static int qemu_dup_flags(int fd, int flags)
{
    int newfd;
    int cur_flags;
    int saved_errno;
    bool truncate_like_open;

#ifdef F_DUPFD_CLOEXEC
    newfd = fcntl(fd, F_DUPFD_CLOEXEC, 0);
#else
    newfd = dup(fd);
    if (newfd != -1) {
        qemu_set_cloexec(newfd);
    }
#endif
    if (newfd == -1) {
        /* nothing to clean up; errno is as the failing call left it */
        return -1;
    }

    cur_flags = fcntl(newfd, F_GETFL);
    if (cur_flags == -1) {
        goto close_and_fail;
    }

    /*
     * A mismatch in O_SYNC between the request and the descriptor is
     * rejected (presumably because F_SETFL cannot change it).
     */
    if ((cur_flags & O_SYNC) != (flags & O_SYNC)) {
        errno = EINVAL;
        goto close_and_fail;
    }

    /* Apply whichever of the requested flags fcntl() is able to set */
    if (fcntl(newfd, F_SETFL, flags) == -1) {
        goto close_and_fail;
    }

    /* Truncate in the same cases in which open() would have truncated */
    truncate_like_open =
        (flags & O_TRUNC) ||
        (flags & (O_CREAT | O_EXCL)) == (O_CREAT | O_EXCL);
    if (truncate_like_open && ftruncate(newfd, 0) == -1) {
        goto close_and_fail;
    }

    return newfd;

close_and_fail:
    /* close() may overwrite errno; keep the original failure reason */
    saved_errno = errno;
    close(newfd);
    errno = saved_errno;
    return -1;
}
141 
/*
 * Parse the fd set id given in @param.  Thin wrapper that forwards to
 * qemu_parse_fd() and hands back its result unchanged.
 */
static int qemu_parse_fdset(const char *param)
{
    int id = qemu_parse_fd(param);

    return id;
}
146 #endif
147 
/*
 * Open @name with FD_CLOEXEC set on the resulting descriptor.
 *
 * On non-Windows hosts a name of the form "/dev/fdset/<id>" is not
 * opened from the file system: a descriptor is fetched from the
 * monitor fd set <id>, duplicated with @flags applied, and the
 * duplicate is registered with the fd set before being returned.
 *
 * The optional third argument is the creation mode; it is only read
 * when @flags contains O_CREAT.
 *
 * Returns the descriptor, or -1 with errno set.
 */
int qemu_open(const char *name, int flags, ...)
{
    int fd;
    int mode = 0;

#ifndef _WIN32
    const char *id_str;

    /* Names under /dev/fdset/ are served by dup'ing an fd from an fd set */
    if (strstart(name, "/dev/fdset/", &id_str)) {
        int64_t set_id = qemu_parse_fdset(id_str);
        int set_fd, new_fd;

        if (set_id == -1) {
            errno = EINVAL;
            return -1;
        }

        set_fd = monitor_fdset_get_fd(set_id, flags);
        if (set_fd == -1) {
            return -1;
        }

        new_fd = qemu_dup_flags(set_fd, flags);
        if (new_fd == -1) {
            return -1;
        }

        if (monitor_fdset_dup_fd_add(set_id, new_fd) == -1) {
            close(new_fd);
            errno = EINVAL;
            return -1;
        }

        return new_fd;
    }
#endif

    /* The mode argument is only present (and only read) with O_CREAT */
    if (flags & O_CREAT) {
        va_list args;

        va_start(args, flags);
        mode = va_arg(args, int);
        va_end(args);
    }

#ifdef O_CLOEXEC
    fd = open(name, flags | O_CLOEXEC, mode);
#else
    fd = open(name, flags, mode);
    if (fd >= 0) {
        qemu_set_cloexec(fd);
    }
#endif

#ifdef O_DIRECT
    if ((flags & O_DIRECT) && fd == -1 && errno == EINVAL) {
        error_report("file system may not support O_DIRECT");
        errno = EINVAL; /* in case it was clobbered */
    }
#endif /* O_DIRECT */

    return fd;
}
217 
/*
 * Close @fd.
 *
 * If monitor_fdset_dup_fd_find() reports that @fd was dup'd from an fd
 * set, the duplicate is also removed from that bookkeeping, but only
 * once close() has succeeded.
 *
 * Returns the result of close().
 */
int qemu_close(int fd)
{
    /* The lookup has to happen while the descriptor is still open */
    int64_t set_id = monitor_fdset_dup_fd_find(fd);
    int rc = close(fd);

    if (set_id != -1 && rc == 0) {
        monitor_fdset_dup_fd_remove(fd);
    }

    return rc;
}
237 
/*
 * A variant of write(2) which handles partial writes.
 *
 * Keeps calling write() until all @count bytes of @buf have been
 * written or a write() fails with something other than EINTR.
 *
 * Returns the number of bytes transferred.  If that is fewer than
 * @count, errno is the one left by the failing write().
 *
 * This function does not work with non-blocking fds.  Either way of
 * handling them would be bad:
 *   - returning a short write (then the name is wrong)
 *   - busy-waiting by adding (errno == EAGAIN) to the loop
 */
ssize_t qemu_write_full(int fd, const void *buf, size_t count)
{
    /* Walk the buffer as bytes: arithmetic on void * is not ISO C */
    const char *cursor = buf;
    ssize_t total = 0;

    while (count) {
        ssize_t ret = write(fd, cursor, count);

        if (ret < 0) {
            if (errno == EINTR) {
                continue;
            }
            break;
        }

        count -= ret;
        cursor += ret;
        total += ret;
    }

    return total;
}
269 
/*
 * Create a socket whose descriptor has FD_CLOEXEC set.
 *
 * Where SOCK_CLOEXEC exists at build time it is tried first.  Only an
 * EINVAL failure of that attempt falls through to a plain socket()
 * followed by qemu_set_cloexec().
 *
 * Returns the descriptor, or the failing socket() result.
 */
int qemu_socket(int domain, int type, int protocol)
{
    int sock;

#ifdef SOCK_CLOEXEC
    sock = socket(domain, type | SOCK_CLOEXEC, protocol);
    if (!(sock == -1 && errno == EINVAL)) {
        return sock;
    }
    /* EINVAL: presumably the flag was rejected at run time; retry without */
#endif
    sock = socket(domain, type, protocol);
    if (sock < 0) {
        return sock;
    }

    qemu_set_cloexec(sock);
    return sock;
}
290 
/*
 * Accept a connection on @s and set FD_CLOEXEC on the new descriptor.
 *
 * With CONFIG_ACCEPT4, accept4(SOCK_CLOEXEC) is tried first.  Only an
 * ENOSYS failure of that attempt falls through to accept() followed by
 * qemu_set_cloexec().
 *
 * Returns the new descriptor, or the failing accept call's result.
 */
int qemu_accept(int s, struct sockaddr *addr, socklen_t *addrlen)
{
    int conn;

#ifdef CONFIG_ACCEPT4
    conn = accept4(s, addr, addrlen, SOCK_CLOEXEC);
    if (!(conn == -1 && errno == ENOSYS)) {
        return conn;
    }
    /* ENOSYS: accept4() is not available at run time; use accept() */
#endif
    conn = accept(s, addr, addrlen);
    if (conn < 0) {
        return conn;
    }

    qemu_set_cloexec(conn);
    return conn;
}
311 
312 void qemu_set_hw_version(const char *version)
313 {
314     hw_version = version;
315 }
316 
317 const char *qemu_hw_version(void)
318 {
319     return hw_version;
320 }
321 
322 void fips_set_state(bool requested)
323 {
324 #ifdef __linux__
325     if (requested) {
326         FILE *fds = fopen("/proc/sys/crypto/fips_enabled", "r");
327         if (fds != NULL) {
328             fips_enabled = (fgetc(fds) == '1');
329             fclose(fds);
330         }
331     }
332 #else
333     fips_enabled = false;
334 #endif /* __linux__ */
335 
336 #ifdef _FIPS_DEBUG
337     fprintf(stderr, "FIPS mode %s (requested %s)\n",
338 	    (fips_enabled ? "enabled" : "disabled"),
339 	    (requested ? "enabled" : "disabled"));
340 #endif
341 }
342 
343 bool fips_get_state(void)
344 {
345     return fips_enabled;
346 }
347 
348 #ifdef _WIN32
/* atexit() handler registered by socket_init(): shuts Winsock down. */
static void socket_cleanup(void)
{
    /* The result is deliberately ignored; nothing can act on it at exit */
    (void)WSACleanup();
}
353 #endif
354 
/*
 * One-time initialisation of the socket layer.
 *
 * On Windows this starts Winsock 2.2 and registers socket_cleanup() to
 * run at exit.  On all other hosts there is nothing to do.
 *
 * Returns 0 on success, or -1 if WSAStartup() failed (the error code is
 * printed to stderr).
 */
int socket_init(void)
{
#ifdef _WIN32
    WSADATA Data;
    int ret;

    ret = WSAStartup(MAKEWORD(2, 2), &Data);
    if (ret != 0) {
        /*
         * WSAStartup() hands back the error code as its return value.
         * WSAGetLastError() must not be consulted here, since Winsock
         * has not been initialised when the call fails.
         */
        fprintf(stderr, "WSAStartup: %d\n", ret);
        return -1;
    }
    atexit(socket_cleanup);
#endif
    return 0;
}
371 
372 #if !GLIB_CHECK_VERSION(2, 31, 0)
373 /* Ensure that glib is running in multi-threaded mode
374  * Old versions of glib require explicit initialization.  Failure to do
375  * this results in the single-threaded code paths being taken inside
376  * glib.  For example, the g_slice allocator will not be thread-safe
377  * and cause crashes.
378  */
379 static void __attribute__((constructor)) thread_init(void)
380 {
381     if (!g_thread_supported()) {
382        g_thread_init(NULL);
383     }
384 }
385 #endif
386 
387 #ifndef CONFIG_IOVEC
/*
 * Helper for iov_send_recv(): emulate readv()/writev() with one
 * read()/write() per iovec entry.
 *
 * @fd:       descriptor to transfer on
 * @iov:      array of @iov_cnt buffers, processed in order
 * @iov_cnt:  number of entries in @iov
 * @do_write: true to write() the buffers, false to read() into them
 *
 * Returns the total number of bytes transferred, which may be less
 * than the sum of the buffer lengths.  Returns -1 with errno set if an
 * error occurred before any byte was transferred, or if @iov_cnt is
 * negative (EINVAL).
 *
 * The transferred bytes always form a contiguous prefix of the
 * scatter/gather list: processing stops at the first entry that could
 * not be transferred in full.
 */
static ssize_t
readv_writev(int fd, const struct iovec *iov, int iov_cnt, bool do_write)
{
    ssize_t total = 0;
    int i = 0;

    /* A negative count must not be allowed to turn into a huge bound */
    if (iov_cnt < 0) {
        errno = EINVAL;
        return -1;
    }

    while (i < iov_cnt) {
        size_t len = iov[i].iov_len;
        ssize_t r;

        if (len == 0) {
            /* Nothing to move; a 0 result here would be mistaken for EOF */
            i++;
            continue;
        }

        r = do_write
            ? write(fd, iov[i].iov_base, len)
            : read(fd, iov[i].iov_base, len);
        if (r < 0) {
            if (errno == EINTR) {
                continue;
            }
            /* Some "other" error: only report it if no data was processed */
            if (total == 0) {
                total = -1;
            }
            break;
        }

        total += r;
        if ((size_t)r < len) {
            /*
             * EOF or short transfer.  Moving on to the next entry would
             * leave a hole in this one that the byte count returned to
             * the caller cannot describe, so stop here.
             */
            break;
        }
        i++;
    }
    return total;
}
416 
/*
 * Replacement readv() for builds without CONFIG_IOVEC; implemented on
 * top of readv_writev() in read mode.
 */
ssize_t
readv(int fd, const struct iovec *iov, int iov_cnt)
{
    const bool do_write = false;

    return readv_writev(fd, iov, iov_cnt, do_write);
}
422 
/*
 * Replacement writev() for builds without CONFIG_IOVEC; implemented on
 * top of readv_writev() in write mode.
 */
ssize_t
writev(int fd, const struct iovec *iov, int iov_cnt)
{
    const bool do_write = true;

    return readv_writev(fd, iov, iov_cnt, do_write);
}
428 #endif
429