/*
 * memfd.c
 *
 * Copyright (c) 2015 Red Hat, Inc.
 *
 * QEMU library functions on POSIX which are shared between QEMU and
 * the QEMU tools.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
|
|
|
|
|
|
|
|
#include "qemu/osdep.h"
|
|
|
|
|
2018-02-01 14:27:51 +01:00
|
|
|
#include "qapi/error.h"
|
2015-10-09 17:17:19 +02:00
|
|
|
#include "qemu/memfd.h"
|
2018-02-01 14:27:53 +01:00
|
|
|
#include "qemu/host-utils.h"
|
2015-10-09 17:17:19 +02:00
|
|
|
|
2017-11-28 11:51:27 +01:00
|
|
|
#if defined CONFIG_LINUX && !defined CONFIG_MEMFD
|
2015-10-09 17:17:19 +02:00
|
|
|
#include <sys/syscall.h>
|
|
|
|
#include <asm/unistd.h>
|
|
|
|
|
2015-10-09 17:17:20 +02:00
|
|
|
/*
 * Local memfd_create() wrapper, compiled only when CONFIG_LINUX is defined
 * and CONFIG_MEMFD is not.
 *
 * @name:  name passed through to the memfd_create system call
 * @flags: MFD_* flags passed through to the system call
 *
 * Returns the value of the raw system call when __NR_memfd_create is known
 * at build time. Otherwise returns -1 with errno set to ENOSYS, so that
 * callers which report errno never see a stale, unrelated value.
 */
static int memfd_create(const char *name, unsigned int flags)
{
#ifdef __NR_memfd_create
    return syscall(__NR_memfd_create, name, flags);
#else
    errno = ENOSYS;
    return -1;
#endif
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/*
 * Fallback definitions for the memfd_create() flag constants.  Each one is
 * only defined here when the headers included above did not provide it.
 */
#if !defined(MFD_CLOEXEC)
# define MFD_CLOEXEC 0x0001U
#endif

#if !defined(MFD_ALLOW_SEALING)
# define MFD_ALLOW_SEALING 0x0002U
#endif

#if !defined(MFD_HUGETLB)
# define MFD_HUGETLB 0x0004U
#endif

/* Bit offset at which the log2 of the huge page size is placed in the flags */
#if !defined(MFD_HUGE_SHIFT)
# define MFD_HUGE_SHIFT 26
#endif
|
|
|
|
|
2018-02-01 14:27:52 +01:00
|
|
|
/**
 * qemu_memfd_create():
 * @name:        name handed to memfd_create()
 * @size:        size the new file is truncated to
 * @hugetlb:     when true, request MFD_HUGETLB and encode @hugetlbsize
 * @hugetlbsize: huge page size in bytes; must be a power of 2 (0 leaves
 *               the size bits of the flags clear)
 * @seals:       seals applied with fcntl(F_ADD_SEALS); when non-zero the
 *               memfd is created with MFD_ALLOW_SEALING
 * @errp:        set on failure
 *
 * Returns the new file descriptor on success, or -1 with @errp set.
 * On builds without CONFIG_LINUX this always fails with ENOSYS.
 */
int qemu_memfd_create(const char *name, size_t size, bool hugetlb,
                      uint64_t hugetlbsize, unsigned int seals, Error **errp)
{
    /*
     * log2 of the huge page size.  Kept unsigned: values of 32 and above
     * shifted by MFD_HUGE_SHIFT would overflow a signed int.
     */
    unsigned int htsize = hugetlbsize ? ctz64(hugetlbsize) : 0;
    int saved_errno;

    if (htsize && 1ULL << htsize != hugetlbsize) {
        error_setg(errp, "Hugepage size must be a power of 2");
        return -1;
    }

    htsize = htsize << MFD_HUGE_SHIFT;

#ifdef CONFIG_LINUX
    int mfd = -1;
    unsigned int flags = MFD_CLOEXEC;

    if (seals) {
        flags |= MFD_ALLOW_SEALING;
    }
    if (hugetlb) {
        flags |= MFD_HUGETLB;
        flags |= htsize;
    }

    mfd = memfd_create(name, flags);
    if (mfd < 0) {
        goto err;
    }

    if (ftruncate(mfd, size) == -1) {
        goto err;
    }

    if (seals && fcntl(mfd, F_ADD_SEALS, seals) == -1) {
        goto err;
    }

    return mfd;

err:
    /* Capture errno before close() gets a chance to overwrite it. */
    saved_errno = errno;
    if (mfd >= 0) {
        close(mfd);
    }
#else
    /* No memfd support was compiled in; do not report a stale errno. */
    saved_errno = ENOSYS;
#endif
    error_setg_errno(errp, saved_errno, "failed to create memfd");
    return -1;
}
|
|
|
|
|
2015-10-09 17:17:20 +02:00
|
|
|
/*
|
|
|
|
* This is a best-effort helper for shared memory allocation, with
|
|
|
|
* optional sealing. The helper will do his best to allocate using
|
|
|
|
* memfd with sealing, but may fallback on other methods without
|
|
|
|
* sealing.
|
|
|
|
*/
|
|
|
|
void *qemu_memfd_alloc(const char *name, size_t size, unsigned int seals,
|
2018-02-01 14:27:51 +01:00
|
|
|
int *fd, Error **errp)
|
2015-10-09 17:17:20 +02:00
|
|
|
{
|
|
|
|
void *ptr;
|
2018-02-01 14:27:53 +01:00
|
|
|
int mfd = qemu_memfd_create(name, size, false, 0, seals, NULL);
|
2015-10-09 17:17:20 +02:00
|
|
|
|
2017-10-23 15:18:07 +01:00
|
|
|
/* some systems have memfd without sealing */
|
2015-10-09 17:17:20 +02:00
|
|
|
if (mfd == -1) {
|
2018-02-01 14:27:53 +01:00
|
|
|
mfd = qemu_memfd_create(name, size, false, 0, 0, NULL);
|
2015-10-09 17:17:20 +02:00
|
|
|
}
|
|
|
|
|
2017-10-23 15:18:07 +01:00
|
|
|
if (mfd == -1) {
|
2015-10-09 17:17:21 +02:00
|
|
|
const char *tmpdir = g_get_tmp_dir();
|
|
|
|
gchar *fname;
|
|
|
|
|
|
|
|
fname = g_strdup_printf("%s/memfd-XXXXXX", tmpdir);
|
|
|
|
mfd = mkstemp(fname);
|
|
|
|
unlink(fname);
|
|
|
|
g_free(fname);
|
|
|
|
|
2018-02-01 14:27:51 +01:00
|
|
|
if (mfd == -1 ||
|
|
|
|
ftruncate(mfd, size) == -1) {
|
|
|
|
goto err;
|
2015-10-09 17:17:21 +02:00
|
|
|
}
|
2015-10-09 17:17:20 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
ptr = mmap(0, size, PROT_READ | PROT_WRITE, MAP_SHARED, mfd, 0);
|
|
|
|
if (ptr == MAP_FAILED) {
|
2018-02-01 14:27:51 +01:00
|
|
|
goto err;
|
2015-10-09 17:17:20 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
*fd = mfd;
|
|
|
|
return ptr;
|
2018-02-01 14:27:51 +01:00
|
|
|
|
|
|
|
err:
|
|
|
|
error_setg_errno(errp, errno, "failed to allocate shared memory");
|
|
|
|
if (mfd >= 0) {
|
|
|
|
close(mfd);
|
|
|
|
}
|
|
|
|
return NULL;
|
2015-10-09 17:17:20 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Release what qemu_memfd_alloc() handed out.
 *
 * @ptr:  mapping to unmap; skipped when NULL
 * @size: length of the mapping passed to munmap()
 * @fd:   descriptor to close; skipped when -1
 */
void qemu_memfd_free(void *ptr, size_t size, int fd)
{
    if (ptr != NULL) {
        munmap(ptr, size);
    }

    if (fd == -1) {
        return;
    }

    close(fd);
}
|
2015-10-09 17:17:34 +02:00
|
|
|
|
|
|
|
/* Cached outcome of a memfd probe, as stored by the *_check() helpers. */
enum {
    MEMFD_KO = 0,   /* probe ran and failed */
    MEMFD_OK = 1,   /* probe ran and succeeded */
    MEMFD_TODO = 2  /* probe has not run yet */
};
|
|
|
|
|
2018-03-28 14:18:04 +02:00
|
|
|
/**
|
|
|
|
* qemu_memfd_alloc_check():
|
|
|
|
*
|
|
|
|
* Check if qemu_memfd_alloc() can allocate, including using a
|
|
|
|
* fallback implementation when host doesn't support memfd.
|
|
|
|
*/
|
|
|
|
bool qemu_memfd_alloc_check(void)
|
2015-10-09 17:17:34 +02:00
|
|
|
{
|
|
|
|
static int memfd_check = MEMFD_TODO;
|
|
|
|
|
|
|
|
if (memfd_check == MEMFD_TODO) {
|
|
|
|
int fd;
|
|
|
|
void *ptr;
|
|
|
|
|
2018-02-01 14:27:51 +01:00
|
|
|
ptr = qemu_memfd_alloc("test", 4096, 0, &fd, NULL);
|
2015-10-09 17:17:34 +02:00
|
|
|
memfd_check = ptr ? MEMFD_OK : MEMFD_KO;
|
|
|
|
qemu_memfd_free(ptr, 4096, fd);
|
|
|
|
}
|
|
|
|
|
|
|
|
return memfd_check == MEMFD_OK;
|
|
|
|
}
|
2018-03-28 14:18:04 +02:00
|
|
|
|
|
|
|
/**
 * qemu_memfd_check():
 *
 * Check if host supports memfd.
 *
 * With CONFIG_LINUX the answer comes from one trial memfd_create() call
 * whose outcome is remembered in a function-local static; without it the
 * function always returns false.
 */
bool qemu_memfd_check(void)
{
#ifdef CONFIG_LINUX
    static int cached = MEMFD_TODO;
    int probe_fd;

    /* Already probed: answer from the cache. */
    if (cached != MEMFD_TODO) {
        return cached == MEMFD_OK;
    }

    probe_fd = memfd_create("test", 0);
    if (probe_fd < 0) {
        cached = MEMFD_KO;
        return cached == MEMFD_OK;
    }

    cached = MEMFD_OK;
    close(probe_fd);
    return cached == MEMFD_OK;
#else
    return false;
#endif
}
|