| 
									
										
										
										
											2015-10-09 17:17:19 +02:00
										 |  |  | /*
 | 
					
						
							|  |  |  |  * memfd.c | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Copyright (c) 2015 Red Hat, Inc. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * QEMU library functions on POSIX which are shared between QEMU and | 
					
						
							|  |  |  |  * the QEMU tools. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Permission is hereby granted, free of charge, to any person obtaining a copy | 
					
						
							|  |  |  |  * of this software and associated documentation files (the "Software"), to deal | 
					
						
							|  |  |  |  * in the Software without restriction, including without limitation the rights | 
					
						
							|  |  |  |  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell | 
					
						
							|  |  |  |  * copies of the Software, and to permit persons to whom the Software is | 
					
						
							|  |  |  |  * furnished to do so, subject to the following conditions: | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * The above copyright notice and this permission notice shall be included in | 
					
						
							|  |  |  |  * all copies or substantial portions of the Software. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR | 
					
						
							|  |  |  |  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, | 
					
						
							|  |  |  |  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL | 
					
						
							|  |  |  |  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER | 
					
						
							|  |  |  |  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, | 
					
						
							|  |  |  |  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN | 
					
						
							|  |  |  |  * THE SOFTWARE. | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include "qemu/osdep.h"
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  | #include "qapi/error.h"
 | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:19 +02:00
										 |  |  | #include "qemu/memfd.h"
 | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:53 +01:00
										 |  |  | #include "qemu/host-utils.h"
 | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:19 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-11-28 11:51:27 +01:00
										 |  |  | #if defined CONFIG_LINUX && !defined CONFIG_MEMFD
 | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:19 +02:00
										 |  |  | #include <sys/syscall.h>
 | 
					
						
							|  |  |  | #include <asm/unistd.h>
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-08-19 11:09:47 -07:00
										 |  |  | int memfd_create(const char *name, unsigned int flags) | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:19 +02:00
										 |  |  | { | 
					
						
							|  |  |  | #ifdef __NR_memfd_create
 | 
					
						
							|  |  |  |     return syscall(__NR_memfd_create, name, flags); | 
					
						
							|  |  |  | #else
 | 
					
						
							| 
									
										
										
										
											2019-03-11 16:58:49 +03:00
										 |  |  |     errno = ENOSYS; | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:19 +02:00
										 |  |  |     return -1; | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:52 +01:00
										 |  |  | int qemu_memfd_create(const char *name, size_t size, bool hugetlb, | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:53 +01:00
										 |  |  |                       uint64_t hugetlbsize, unsigned int seals, Error **errp) | 
					
						
							| 
									
										
										
										
											2017-10-23 15:18:07 +01:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:53 +01:00
										 |  |  |     int htsize = hugetlbsize ? ctz64(hugetlbsize) : 0; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-05-15 18:27:29 +01:00
										 |  |  |     if (htsize && 1ULL << htsize != hugetlbsize) { | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:53 +01:00
										 |  |  |         error_setg(errp, "Hugepage size must be a power of 2"); | 
					
						
							|  |  |  |         return -1; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     htsize = htsize << MFD_HUGE_SHIFT; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-10-23 15:18:07 +01:00
										 |  |  | #ifdef CONFIG_LINUX
 | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  |     int mfd = -1; | 
					
						
							| 
									
										
										
										
											2017-10-23 15:18:07 +01:00
										 |  |  |     unsigned int flags = MFD_CLOEXEC; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (seals) { | 
					
						
							|  |  |  |         flags |= MFD_ALLOW_SEALING; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:52 +01:00
										 |  |  |     if (hugetlb) { | 
					
						
							|  |  |  |         flags |= MFD_HUGETLB; | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:53 +01:00
										 |  |  |         flags |= htsize; | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:52 +01:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2017-10-23 15:18:07 +01:00
										 |  |  |     mfd = memfd_create(name, flags); | 
					
						
							|  |  |  |     if (mfd < 0) { | 
					
						
							| 
									
										
										
										
											2019-03-11 16:58:50 +03:00
										 |  |  |         error_setg_errno(errp, errno, | 
					
						
							|  |  |  |                          "failed to create memfd with flags 0x%x", flags); | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  |         goto err; | 
					
						
							| 
									
										
										
										
											2017-10-23 15:18:07 +01:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (ftruncate(mfd, size) == -1) { | 
					
						
							| 
									
										
										
										
											2019-03-11 16:58:50 +03:00
										 |  |  |         error_setg_errno(errp, errno, "failed to resize memfd to %zu", size); | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  |         goto err; | 
					
						
							| 
									
										
										
										
											2017-10-23 15:18:07 +01:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (seals && fcntl(mfd, F_ADD_SEALS, seals) == -1) { | 
					
						
							| 
									
										
										
										
											2019-03-11 16:58:50 +03:00
										 |  |  |         error_setg_errno(errp, errno, "failed to add seals 0x%x", seals); | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  |         goto err; | 
					
						
							| 
									
										
										
										
											2017-10-23 15:18:07 +01:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return mfd; | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  | err: | 
					
						
							|  |  |  |     if (mfd >= 0) { | 
					
						
							|  |  |  |         close(mfd); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2019-03-11 16:58:50 +03:00
										 |  |  | #else
 | 
					
						
							|  |  |  |     error_setg_errno(errp, ENOSYS, "failed to create memfd"); | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  | #endif
 | 
					
						
							|  |  |  |     return -1; | 
					
						
							| 
									
										
										
										
											2017-10-23 15:18:07 +01:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:20 +02:00
										 |  |  | /*
 | 
					
						
							|  |  |  |  * This is a best-effort helper for shared memory allocation, with | 
					
						
							|  |  |  |  * optional sealing. The helper will do his best to allocate using | 
					
						
							|  |  |  |  * memfd with sealing, but may fallback on other methods without | 
					
						
							|  |  |  |  * sealing. | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | void *qemu_memfd_alloc(const char *name, size_t size, unsigned int seals, | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  |                        int *fd, Error **errp) | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:20 +02:00
										 |  |  | { | 
					
						
							|  |  |  |     void *ptr; | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:53 +01:00
										 |  |  |     int mfd = qemu_memfd_create(name, size, false, 0, seals, NULL); | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:20 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-10-23 15:18:07 +01:00
										 |  |  |     /* some systems have memfd without sealing */ | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:20 +02:00
										 |  |  |     if (mfd == -1) { | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:53 +01:00
										 |  |  |         mfd = qemu_memfd_create(name, size, false, 0, 0, NULL); | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:20 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-10-23 15:18:07 +01:00
										 |  |  |     if (mfd == -1) { | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:21 +02:00
										 |  |  |         const char *tmpdir = g_get_tmp_dir(); | 
					
						
							|  |  |  |         gchar *fname; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         fname = g_strdup_printf("%s/memfd-XXXXXX", tmpdir); | 
					
						
							|  |  |  |         mfd = mkstemp(fname); | 
					
						
							|  |  |  |         unlink(fname); | 
					
						
							|  |  |  |         g_free(fname); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  |         if (mfd == -1 || | 
					
						
							|  |  |  |             ftruncate(mfd, size) == -1) { | 
					
						
							|  |  |  |             goto err; | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:21 +02:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:20 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     ptr = mmap(0, size, PROT_READ | PROT_WRITE, MAP_SHARED, mfd, 0); | 
					
						
							|  |  |  |     if (ptr == MAP_FAILED) { | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  |         goto err; | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:20 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     *fd = mfd; | 
					
						
							|  |  |  |     return ptr; | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  | err: | 
					
						
							|  |  |  |     error_setg_errno(errp, errno, "failed to allocate shared memory"); | 
					
						
							|  |  |  |     if (mfd >= 0) { | 
					
						
							|  |  |  |         close(mfd); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     return NULL; | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:20 +02:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void qemu_memfd_free(void *ptr, size_t size, int fd) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     if (ptr) { | 
					
						
							|  |  |  |         munmap(ptr, size); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (fd != -1) { | 
					
						
							|  |  |  |         close(fd); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | } | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:34 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | enum { | 
					
						
							|  |  |  |     MEMFD_KO, | 
					
						
							|  |  |  |     MEMFD_OK, | 
					
						
							|  |  |  |     MEMFD_TODO | 
					
						
							|  |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-03-28 14:18:04 +02:00
										 |  |  | /**
 | 
					
						
							|  |  |  |  * qemu_memfd_alloc_check(): | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Check if qemu_memfd_alloc() can allocate, including using a | 
					
						
							|  |  |  |  * fallback implementation when host doesn't support memfd. | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | bool qemu_memfd_alloc_check(void) | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:34 +02:00
										 |  |  | { | 
					
						
							|  |  |  |     static int memfd_check = MEMFD_TODO; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (memfd_check == MEMFD_TODO) { | 
					
						
							|  |  |  |         int fd; | 
					
						
							|  |  |  |         void *ptr; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-06-13 11:19:54 +03:00
										 |  |  |         fd = -1; | 
					
						
							| 
									
										
										
										
											2018-02-01 14:27:51 +01:00
										 |  |  |         ptr = qemu_memfd_alloc("test", 4096, 0, &fd, NULL); | 
					
						
							| 
									
										
										
										
											2015-10-09 17:17:34 +02:00
										 |  |  |         memfd_check = ptr ? MEMFD_OK : MEMFD_KO; | 
					
						
							|  |  |  |         qemu_memfd_free(ptr, 4096, fd); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return memfd_check == MEMFD_OK; | 
					
						
							|  |  |  | } | 
					
						
							| 
									
										
										
										
											2018-03-28 14:18:04 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | /**
 | 
					
						
							|  |  |  |  * qemu_memfd_check(): | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Check if host supports memfd. | 
					
						
							|  |  |  |  */ | 
					
						
							| 
									
										
										
										
											2018-09-06 20:14:15 +04:00
										 |  |  | bool qemu_memfd_check(unsigned int flags) | 
					
						
							| 
									
										
										
										
											2018-03-28 14:18:04 +02:00
										 |  |  | { | 
					
						
							|  |  |  | #ifdef CONFIG_LINUX
 | 
					
						
							| 
									
										
										
										
											2019-03-11 16:58:48 +03:00
										 |  |  |     int mfd = memfd_create("test", flags | MFD_CLOEXEC); | 
					
						
							| 
									
										
										
										
											2018-03-28 14:18:04 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-09-06 20:14:15 +04:00
										 |  |  |     if (mfd >= 0) { | 
					
						
							|  |  |  |         close(mfd); | 
					
						
							|  |  |  |         return true; | 
					
						
							| 
									
										
										
										
											2018-03-28 14:18:04 +02:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2018-09-06 20:14:15 +04:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2018-03-28 14:18:04 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     return false; | 
					
						
							|  |  |  | } |