qemu/util/memfd.c
<<
>>
Prefs
   1/*
   2 * memfd.c
   3 *
   4 * Copyright (c) 2015 Red Hat, Inc.
   5 *
   6 * QEMU library functions on POSIX which are shared between QEMU and
   7 * the QEMU tools.
   8 *
   9 * Permission is hereby granted, free of charge, to any person obtaining a copy
  10 * of this software and associated documentation files (the "Software"), to deal
  11 * in the Software without restriction, including without limitation the rights
  12 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  13 * copies of the Software, and to permit persons to whom the Software is
  14 * furnished to do so, subject to the following conditions:
  15 *
  16 * The above copyright notice and this permission notice shall be included in
  17 * all copies or substantial portions of the Software.
  18 *
  19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  20 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  22 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  23 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  24 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
  25 * THE SOFTWARE.
  26 */
  27
  28#include "qemu/osdep.h"
  29
  30#include "qapi/error.h"
  31#include "qemu/memfd.h"
  32#include "qemu/host-utils.h"
  33
  34#if defined CONFIG_LINUX && !defined CONFIG_MEMFD
  35#include <sys/syscall.h>
  36#include <asm/unistd.h>
  37
  38static int memfd_create(const char *name, unsigned int flags)
  39{
  40#ifdef __NR_memfd_create
  41    return syscall(__NR_memfd_create, name, flags);
  42#else
  43    errno = ENOSYS;
  44    return -1;
  45#endif
  46}
  47#endif
  48
  49int qemu_memfd_create(const char *name, size_t size, bool hugetlb,
  50                      uint64_t hugetlbsize, unsigned int seals, Error **errp)
  51{
  52    int htsize = hugetlbsize ? ctz64(hugetlbsize) : 0;
  53
  54    if (htsize && 1ULL << htsize != hugetlbsize) {
  55        error_setg(errp, "Hugepage size must be a power of 2");
  56        return -1;
  57    }
  58
  59    htsize = htsize << MFD_HUGE_SHIFT;
  60
  61#ifdef CONFIG_LINUX
  62    int mfd = -1;
  63    unsigned int flags = MFD_CLOEXEC;
  64
  65    if (seals) {
  66        flags |= MFD_ALLOW_SEALING;
  67    }
  68    if (hugetlb) {
  69        flags |= MFD_HUGETLB;
  70        flags |= htsize;
  71    }
  72    mfd = memfd_create(name, flags);
  73    if (mfd < 0) {
  74        error_setg_errno(errp, errno,
  75                         "failed to create memfd with flags 0x%x", flags);
  76        goto err;
  77    }
  78
  79    if (ftruncate(mfd, size) == -1) {
  80        error_setg_errno(errp, errno, "failed to resize memfd to %zu", size);
  81        goto err;
  82    }
  83
  84    if (seals && fcntl(mfd, F_ADD_SEALS, seals) == -1) {
  85        error_setg_errno(errp, errno, "failed to add seals 0x%x", seals);
  86        goto err;
  87    }
  88
  89    return mfd;
  90
  91err:
  92    if (mfd >= 0) {
  93        close(mfd);
  94    }
  95#else
  96    error_setg_errno(errp, ENOSYS, "failed to create memfd");
  97#endif
  98    return -1;
  99}
 100
 101/*
 102 * This is a best-effort helper for shared memory allocation, with
 103 * optional sealing. The helper will do his best to allocate using
 104 * memfd with sealing, but may fallback on other methods without
 105 * sealing.
 106 */
 107void *qemu_memfd_alloc(const char *name, size_t size, unsigned int seals,
 108                       int *fd, Error **errp)
 109{
 110    void *ptr;
 111    int mfd = qemu_memfd_create(name, size, false, 0, seals, NULL);
 112
 113    /* some systems have memfd without sealing */
 114    if (mfd == -1) {
 115        mfd = qemu_memfd_create(name, size, false, 0, 0, NULL);
 116    }
 117
 118    if (mfd == -1) {
 119        const char *tmpdir = g_get_tmp_dir();
 120        gchar *fname;
 121
 122        fname = g_strdup_printf("%s/memfd-XXXXXX", tmpdir);
 123        mfd = mkstemp(fname);
 124        unlink(fname);
 125        g_free(fname);
 126
 127        if (mfd == -1 ||
 128            ftruncate(mfd, size) == -1) {
 129            goto err;
 130        }
 131    }
 132
 133    ptr = mmap(0, size, PROT_READ | PROT_WRITE, MAP_SHARED, mfd, 0);
 134    if (ptr == MAP_FAILED) {
 135        goto err;
 136    }
 137
 138    *fd = mfd;
 139    return ptr;
 140
 141err:
 142    error_setg_errno(errp, errno, "failed to allocate shared memory");
 143    if (mfd >= 0) {
 144        close(mfd);
 145    }
 146    return NULL;
 147}
 148
 149void qemu_memfd_free(void *ptr, size_t size, int fd)
 150{
 151    if (ptr) {
 152        munmap(ptr, size);
 153    }
 154
 155    if (fd != -1) {
 156        close(fd);
 157    }
 158}
 159
 160enum {
 161    MEMFD_KO,
 162    MEMFD_OK,
 163    MEMFD_TODO
 164};
 165
 166/**
 167 * qemu_memfd_alloc_check():
 168 *
 169 * Check if qemu_memfd_alloc() can allocate, including using a
 170 * fallback implementation when host doesn't support memfd.
 171 */
 172bool qemu_memfd_alloc_check(void)
 173{
 174    static int memfd_check = MEMFD_TODO;
 175
 176    if (memfd_check == MEMFD_TODO) {
 177        int fd;
 178        void *ptr;
 179
 180        fd = -1;
 181        ptr = qemu_memfd_alloc("test", 4096, 0, &fd, NULL);
 182        memfd_check = ptr ? MEMFD_OK : MEMFD_KO;
 183        qemu_memfd_free(ptr, 4096, fd);
 184    }
 185
 186    return memfd_check == MEMFD_OK;
 187}
 188
 189/**
 190 * qemu_memfd_check():
 191 *
 192 * Check if host supports memfd.
 193 */
 194bool qemu_memfd_check(unsigned int flags)
 195{
 196#ifdef CONFIG_LINUX
 197    int mfd = memfd_create("test", flags | MFD_CLOEXEC);
 198
 199    if (mfd >= 0) {
 200        close(mfd);
 201        return true;
 202    }
 203#endif
 204
 205    return false;
 206}
 207