2020-07-20 16:18:57 +02:00
|
|
|
/*
|
|
|
|
* qemu_namespace.c: QEMU domain namespace helpers
|
|
|
|
*
|
|
|
|
* Copyright (C) 2006-2020 Red Hat, Inc.
|
|
|
|
* Copyright (C) 2006 Daniel P. Berrange
|
|
|
|
*
|
|
|
|
* This library is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This library is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Lesser General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
|
|
* License along with this library. If not, see
|
|
|
|
* <http://www.gnu.org/licenses/>.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <config.h>
|
|
|
|
|
|
|
|
#ifdef __linux__
|
|
|
|
# include <sys/sysmacros.h>
|
|
|
|
#endif
|
2020-09-01 13:27:44 +02:00
|
|
|
#if defined(WITH_SYS_MOUNT_H)
|
2020-07-20 16:18:57 +02:00
|
|
|
# include <sys/mount.h>
|
|
|
|
#endif
|
|
|
|
#ifdef WITH_SELINUX
|
|
|
|
# include <selinux/selinux.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include "qemu_namespace.h"
|
|
|
|
#include "qemu_domain.h"
|
|
|
|
#include "qemu_cgroup.h"
|
|
|
|
#include "qemu_security.h"
|
|
|
|
#include "qemu_hostdev.h"
|
|
|
|
#include "viralloc.h"
|
|
|
|
#include "virlog.h"
|
|
|
|
#include "virdevmapper.h"
|
2021-02-04 14:10:42 +01:00
|
|
|
#include "virglibutil.h"
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
#define VIR_FROM_THIS VIR_FROM_QEMU
|
|
|
|
|
|
|
|
VIR_LOG_INIT("qemu.qemu_domain");
|
|
|
|
|
|
|
|
|
|
|
|
VIR_ENUM_IMPL(qemuDomainNamespace,
|
|
|
|
QEMU_DOMAIN_NS_LAST,
|
|
|
|
"mount",
|
|
|
|
);
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* qemuDomainGetPreservedMountPath:
|
|
|
|
* @cfg: driver configuration data
|
|
|
|
* @vm: domain object
|
|
|
|
* @mountpoint: mount point path to convert
|
|
|
|
*
|
|
|
|
* For given @mountpoint return new path where the mount point
|
|
|
|
* should be moved temporarily whilst building the namespace.
|
|
|
|
*
|
|
|
|
* Returns: allocated string on success which the caller must free,
|
|
|
|
* NULL on failure.
|
|
|
|
*/
|
|
|
|
static char *
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainGetPreservedMountPath(virQEMUDriverConfig *cfg,
|
|
|
|
virDomainObj *vm,
|
2020-07-20 16:18:57 +02:00
|
|
|
const char *mountpoint)
|
|
|
|
{
|
|
|
|
char *path = NULL;
|
|
|
|
char *tmp;
|
|
|
|
const char *suffix = mountpoint + strlen(QEMU_DEVPREFIX);
|
|
|
|
g_autofree char *domname = virDomainDefGetShortName(vm->def);
|
|
|
|
size_t off;
|
|
|
|
|
|
|
|
if (!domname)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
if (STREQ(mountpoint, "/dev"))
|
|
|
|
suffix = "dev";
|
|
|
|
|
|
|
|
path = g_strdup_printf("%s/%s.%s", cfg->stateDir, domname, suffix);
|
|
|
|
|
|
|
|
/* Now consider that @mountpoint is "/dev/blah/blah2".
|
|
|
|
* @suffix then points to "blah/blah2". However, caller
|
|
|
|
* expects all the @paths to be the same depth. The
|
|
|
|
* caller doesn't always do `mkdir -p` but sometimes bare
|
|
|
|
* `touch`. Therefore fix all the suffixes. */
|
|
|
|
off = strlen(path) - strlen(suffix);
|
|
|
|
|
|
|
|
tmp = path + off;
|
|
|
|
while (*tmp) {
|
|
|
|
if (*tmp == '/')
|
|
|
|
*tmp = '.';
|
|
|
|
tmp++;
|
|
|
|
}
|
|
|
|
|
|
|
|
return path;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* qemuDomainGetPreservedMounts:
|
|
|
|
*
|
|
|
|
* Process list of mounted filesystems and:
|
|
|
|
* a) save all FSs mounted under /dev to @devPath
|
|
|
|
* b) generate backup path for all the entries in a)
|
|
|
|
*
|
2021-02-04 15:09:57 +01:00
|
|
|
* Any of the return pointers can be NULL. Both arrays are NULL-terminated.
|
qemu_namespace: Fix a corner case in qemuDomainGetPreservedMounts()
When setting up namespace for QEMU we look at mount points under
/dev (like /dev/pts, /dev/mqueue/, etc.) because we want to
preserve those (which is done by moving them to a temp location,
unshare(), and then moving them back). We have a convenience
helper - qemuDomainGetPreservedMounts() - that processes the
mount table and (optionally) moves the other filesystems too.
This helper is also used when attempting to create a path in NS,
because the path, while starting with "/dev/" prefix, may
actually lead to one of those filesystems that we preserved.
And here comes the corner case: while we require the parent mount
table to be in shared mode (equivalent of `mount --make-rshared /'),
these mount events propagate iff the target path exist inside the
slave mount table (= QEMU's private namespace). And since we
create only a subset of /dev nodes, well, that assumption is not
always the case.
For instance, assume that a domain is already running, no
hugepages were configured for it nor any hugetlbfs is mounted.
Now, when a hugetlbfs is mounted into '/dev/hugepages', this is
propagated into the QEMU's namespace, but since the target dir
does not exist in the private /dev, the FS is not mounted in the
namespace.
Fortunately, this difference between namespaces is visible when
comparing /proc/mounts and /proc/$PID/mounts (where PID is the
QEMU's PID). Therefore, if possible we should look at the latter.
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Martin Kletzander <mkletzan@redhat.com>
2022-09-06 13:43:22 +02:00
|
|
|
* Get the mount table either from @vm's PID (if running), or from the
|
|
|
|
* namespace we're in (if @vm's not running).
|
2020-07-20 16:18:57 +02:00
|
|
|
*
|
|
|
|
* Returns 0 on success, -1 otherwise (with error reported)
|
|
|
|
*/
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainGetPreservedMounts(virQEMUDriverConfig *cfg,
|
|
|
|
virDomainObj *vm,
|
2020-07-20 16:18:57 +02:00
|
|
|
char ***devPath,
|
|
|
|
char ***devSavePath,
|
|
|
|
size_t *ndevPath)
|
|
|
|
{
|
2021-02-04 15:09:57 +01:00
|
|
|
g_auto(GStrv) mounts = NULL;
|
|
|
|
size_t nmounts = 0;
|
|
|
|
g_auto(GStrv) paths = NULL;
|
|
|
|
g_auto(GStrv) savePaths = NULL;
|
qemu_namespace: Fix a corner case in qemuDomainGetPreservedMounts()
When setting up namespace for QEMU we look at mount points under
/dev (like /dev/pts, /dev/mqueue/, etc.) because we want to
preserve those (which is done by moving them to a temp location,
unshare(), and then moving them back). We have a convenience
helper - qemuDomainGetPreservedMounts() - that processes the
mount table and (optionally) moves the other filesystems too.
This helper is also used when attempting to create a path in NS,
because the path, while starting with "/dev/" prefix, may
actually lead to one of those filesystems that we preserved.
And here comes the corner case: while we require the parent mount
table to be in shared mode (equivalent of `mount --make-rshared /'),
these mount events propagate iff the target path exist inside the
slave mount table (= QEMU's private namespace). And since we
create only a subset of /dev nodes, well, that assumption is not
always the case.
For instance, assume that a domain is already running, no
hugepages were configured for it nor any hugetlbfs is mounted.
Now, when a hugetlbfs is mounted into '/dev/hugepages', this is
propagated into the QEMU's namespace, but since the target dir
does not exist in the private /dev, the FS is not mounted in the
namespace.
Fortunately, this difference between namespaces is visible when
comparing /proc/mounts and /proc/$PID/mounts (where PID is the
QEMU's PID). Therefore, if possible we should look at the latter.
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Martin Kletzander <mkletzan@redhat.com>
2022-09-06 13:43:22 +02:00
|
|
|
g_autofree char *mountsPath = NULL;
|
2021-02-04 15:09:57 +01:00
|
|
|
size_t i;
|
|
|
|
|
|
|
|
if (ndevPath)
|
|
|
|
*ndevPath = 0;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
qemu_namespace: Fix a corner case in qemuDomainGetPreservedMounts()
When setting up namespace for QEMU we look at mount points under
/dev (like /dev/pts, /dev/mqueue/, etc.) because we want to
preserve those (which is done by moving them to a temp location,
unshare(), and then moving them back). We have a convenience
helper - qemuDomainGetPreservedMounts() - that processes the
mount table and (optionally) moves the other filesystems too.
This helper is also used when attempting to create a path in NS,
because the path, while starting with "/dev/" prefix, may
actually lead to one of those filesystems that we preserved.
And here comes the corner case: while we require the parent mount
table to be in shared mode (equivalent of `mount --make-rshared /'),
these mount events propagate iff the target path exist inside the
slave mount table (= QEMU's private namespace). And since we
create only a subset of /dev nodes, well, that assumption is not
always the case.
For instance, assume that a domain is already running, no
hugepages were configured for it nor any hugetlbfs is mounted.
Now, when a hugetlbfs is mounted into '/dev/hugepages', this is
propagated into the QEMU's namespace, but since the target dir
does not exist in the private /dev, the FS is not mounted in the
namespace.
Fortunately, this difference between namespaces is visible when
comparing /proc/mounts and /proc/$PID/mounts (where PID is the
QEMU's PID). Therefore, if possible we should look at the latter.
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Martin Kletzander <mkletzan@redhat.com>
2022-09-06 13:43:22 +02:00
|
|
|
if (vm->pid > 0)
|
|
|
|
mountsPath = g_strdup_printf("/proc/%lld/mounts", (long long) vm->pid);
|
|
|
|
else
|
|
|
|
mountsPath = g_strdup(QEMU_PROC_MOUNTS);
|
|
|
|
|
|
|
|
if (virFileGetMountSubtree(mountsPath, "/dev", &mounts, &nmounts) < 0)
|
2021-02-04 15:09:57 +01:00
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-02-04 15:09:57 +01:00
|
|
|
if (nmounts == 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return 0;
|
|
|
|
|
|
|
|
/* There can be nested mount points. For instance
|
|
|
|
* /dev/shm/blah can be a mount point and /dev/shm too. It
|
|
|
|
* doesn't make much sense to return the former path because
|
|
|
|
* caller preserves the latter (and with that the former
|
|
|
|
* too). Therefore prune nested mount points.
|
|
|
|
* NB mounts[0] is "/dev". Should we start the outer loop
|
|
|
|
* from the beginning of the array all we'd be left with is
|
|
|
|
* just the first element. Think about it.
|
|
|
|
*/
|
|
|
|
for (i = 1; i < nmounts; i++) {
|
2021-02-04 15:09:57 +01:00
|
|
|
size_t j = i + 1;
|
|
|
|
|
2022-10-31 16:26:17 +01:00
|
|
|
/* If we looked into mount table of already running VM,
|
|
|
|
* we might have found /dev twice. Remove the other
|
|
|
|
* occurrence as it would jeopardize the rest of the prune
|
|
|
|
* algorithm.
|
|
|
|
*/
|
|
|
|
if (STREQ(mounts[i], "/dev")) {
|
|
|
|
VIR_FREE(mounts[i]);
|
|
|
|
VIR_DELETE_ELEMENT_INPLACE(mounts, i, nmounts);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2020-07-20 16:18:57 +02:00
|
|
|
while (j < nmounts) {
|
|
|
|
char *c = STRSKIP(mounts[j], mounts[i]);
|
|
|
|
|
|
|
|
if (c && (*c == '/' || *c == '\0')) {
|
|
|
|
VIR_DEBUG("Dropping path %s because of %s", mounts[j], mounts[i]);
|
2022-10-31 15:38:13 +01:00
|
|
|
VIR_FREE(mounts[j]);
|
|
|
|
VIR_DELETE_ELEMENT_INPLACE(mounts, j, nmounts);
|
2020-07-20 16:18:57 +02:00
|
|
|
} else {
|
|
|
|
j++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-02-04 15:09:57 +01:00
|
|
|
/* mounts may not be NULL-terminated at this point, but we convert it into
|
|
|
|
* 'paths' which is NULL-terminated */
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-02-04 15:09:57 +01:00
|
|
|
paths = g_new0(char *, nmounts + 1);
|
|
|
|
|
|
|
|
for (i = 0; i < nmounts; i++)
|
|
|
|
paths[i] = g_steal_pointer(&mounts[i]);
|
|
|
|
|
|
|
|
if (devSavePath) {
|
|
|
|
savePaths = g_new0(char *, nmounts + 1);
|
|
|
|
|
|
|
|
for (i = 0; i < nmounts; i++) {
|
|
|
|
if (!(savePaths[i] = qemuDomainGetPreservedMountPath(cfg, vm, paths[i])))
|
|
|
|
return -1;
|
|
|
|
}
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
if (devPath)
|
2021-02-04 15:09:57 +01:00
|
|
|
*devPath = g_steal_pointer(&paths);
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
if (devSavePath)
|
2021-02-04 15:09:57 +01:00
|
|
|
*devSavePath = g_steal_pointer(&savePaths);
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
if (ndevPath)
|
|
|
|
*ndevPath = nmounts;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainPopulateDevices(virQEMUDriverConfig *cfg,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
const char *const *devices = (const char *const *) cfg->cgroupDeviceACL;
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
if (!devices)
|
|
|
|
devices = defaultDeviceACL;
|
|
|
|
|
|
|
|
for (i = 0; devices[i]; i++) {
|
2021-02-04 14:10:42 +01:00
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(devices[i]));
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupDev(virSecurityManager *mgr,
|
|
|
|
virDomainObj *vm,
|
2020-07-21 17:13:11 +02:00
|
|
|
const char *path)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
g_autofree char *mount_options = NULL;
|
|
|
|
g_autofree char *opts = NULL;
|
|
|
|
|
|
|
|
VIR_DEBUG("Setting up /dev/ for domain %s", vm->def->name);
|
|
|
|
|
|
|
|
mount_options = qemuSecurityGetMountOptions(mgr, vm->def);
|
|
|
|
|
|
|
|
if (!mount_options)
|
|
|
|
mount_options = g_strdup("");
|
|
|
|
|
|
|
|
/*
|
|
|
|
* tmpfs is limited to 64kb, since we only have device nodes in there
|
|
|
|
* and don't want to DOS the entire OS RAM usage
|
|
|
|
*/
|
|
|
|
opts = g_strdup_printf("mode=755,size=65536%s", mount_options);
|
|
|
|
|
2020-07-21 17:13:11 +02:00
|
|
|
if (virFileSetupDev(path, opts) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupDisk(virStorageSource *src,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-03-11 08:16:13 +01:00
|
|
|
virStorageSource *next;
|
2020-07-20 16:18:57 +02:00
|
|
|
bool hasNVMe = false;
|
|
|
|
|
2020-07-21 13:32:32 +02:00
|
|
|
for (next = src; virStorageSourceIsBacking(next); next = next->backingStore) {
|
2020-07-21 14:11:41 +02:00
|
|
|
g_autofree char *tmpPath = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
if (next->type == VIR_STORAGE_TYPE_NVME) {
|
|
|
|
hasNVMe = true;
|
|
|
|
|
2020-07-21 14:11:41 +02:00
|
|
|
if (!(tmpPath = virPCIDeviceAddressGetIOMMUGroupDev(&next->nvme->pciAddr)))
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
} else {
|
2022-01-25 17:49:00 +01:00
|
|
|
GSList *targetPaths = NULL;
|
2020-07-21 14:11:41 +02:00
|
|
|
|
|
|
|
if (virStorageSourceIsEmpty(next) ||
|
|
|
|
!virStorageSourceIsLocalStorage(next)) {
|
2020-07-20 16:18:57 +02:00
|
|
|
/* Not creating device. Just continue. */
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2020-07-21 14:11:41 +02:00
|
|
|
tmpPath = g_strdup(next->path);
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
if (virDevMapperGetTargets(next->path, &targetPaths) < 0 &&
|
|
|
|
errno != ENOSYS) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to get devmapper targets for %s"),
|
|
|
|
next->path);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
2021-09-20 14:30:59 +02:00
|
|
|
if (targetPaths)
|
|
|
|
*paths = g_slist_concat(g_slist_reverse(targetPaths), *paths);
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
2020-07-21 14:11:41 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
*paths = g_slist_prepend(*paths, g_steal_pointer(&tmpPath));
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/* qemu-pr-helper might require access to /dev/mapper/control. */
|
2021-02-04 14:10:42 +01:00
|
|
|
if (src->pr)
|
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(QEMU_DEVICE_MAPPER_CONTROL_PATH));
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (hasNVMe)
|
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(QEMU_DEV_VFIO));
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupAllDisks(virDomainObj *vm,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
size_t i;
|
2020-07-21 14:11:41 +02:00
|
|
|
|
2020-07-20 16:18:57 +02:00
|
|
|
VIR_DEBUG("Setting up disks");
|
|
|
|
|
|
|
|
for (i = 0; i < vm->def->ndisks; i++) {
|
2020-07-21 13:32:32 +02:00
|
|
|
if (qemuDomainSetupDisk(vm->def->disks[i]->src,
|
2020-07-21 14:11:41 +02:00
|
|
|
paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
VIR_DEBUG("Setup all disks");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupHostdev(virDomainObj *vm,
|
|
|
|
virDomainHostdevDef *hostdev,
|
2020-07-21 14:18:59 +02:00
|
|
|
bool hotplug,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
g_autofree char *path = NULL;
|
|
|
|
|
2020-07-21 14:18:59 +02:00
|
|
|
if (qemuDomainGetHostdevPath(hostdev, &path, NULL) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (path)
|
|
|
|
*paths = g_slist_prepend(*paths, g_steal_pointer(&path));
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-21 14:18:59 +02:00
|
|
|
if (qemuHostdevNeedsVFIO(hostdev) &&
|
2021-02-04 14:10:42 +01:00
|
|
|
(!hotplug || !qemuDomainNeedsVFIO(vm->def)))
|
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(QEMU_DEV_VFIO));
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupAllHostdevs(virDomainObj *vm,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
VIR_DEBUG("Setting up hostdevs");
|
|
|
|
for (i = 0; i < vm->def->nhostdevs; i++) {
|
2020-07-21 14:18:59 +02:00
|
|
|
if (qemuDomainSetupHostdev(vm,
|
|
|
|
vm->def->hostdevs[i],
|
|
|
|
false,
|
|
|
|
paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
VIR_DEBUG("Setup all hostdevs");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupMemory(virDomainMemoryDef *mem,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2022-11-10 17:21:25 -08:00
|
|
|
switch (mem->model) {
|
|
|
|
case VIR_DOMAIN_MEMORY_MODEL_NVDIMM:
|
|
|
|
case VIR_DOMAIN_MEMORY_MODEL_VIRTIO_PMEM:
|
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(mem->nvdimmPath));
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VIR_DOMAIN_MEMORY_MODEL_SGX_EPC:
|
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(QEMU_DEV_SGX_VEPVC));
|
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(QEMU_DEV_SGX_PROVISION));
|
|
|
|
break;
|
|
|
|
|
|
|
|
case VIR_DOMAIN_MEMORY_MODEL_NONE:
|
|
|
|
case VIR_DOMAIN_MEMORY_MODEL_DIMM:
|
|
|
|
case VIR_DOMAIN_MEMORY_MODEL_VIRTIO_MEM:
|
|
|
|
case VIR_DOMAIN_MEMORY_MODEL_LAST:
|
|
|
|
break;
|
|
|
|
}
|
2021-02-04 14:10:42 +01:00
|
|
|
|
|
|
|
return 0;
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupAllMemories(virDomainObj *vm,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
VIR_DEBUG("Setting up memories");
|
|
|
|
for (i = 0; i < vm->def->nmems; i++) {
|
2020-07-21 12:57:49 +02:00
|
|
|
if (qemuDomainSetupMemory(vm->def->mems[i],
|
2020-07-21 13:30:31 +02:00
|
|
|
paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
VIR_DEBUG("Setup all memories");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupChardev(virDomainDef *def G_GNUC_UNUSED,
|
|
|
|
virDomainChrDef *dev,
|
2020-07-20 16:18:57 +02:00
|
|
|
void *opaque)
|
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths = opaque;
|
2020-07-20 16:18:57 +02:00
|
|
|
const char *path = NULL;
|
|
|
|
|
|
|
|
if (!(path = virDomainChrSourceDefGetPath(dev->source)))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
/* Socket created by qemu. It doesn't exist upfront. */
|
|
|
|
if (dev->source->type == VIR_DOMAIN_CHR_TYPE_UNIX &&
|
|
|
|
dev->source->data.nix.listen)
|
|
|
|
return 0;
|
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(path));
|
|
|
|
return 0;
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupAllChardevs(virDomainObj *vm,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
VIR_DEBUG("Setting up chardevs");
|
|
|
|
|
|
|
|
if (virDomainChrDefForeach(vm->def,
|
|
|
|
true,
|
|
|
|
qemuDomainSetupChardev,
|
2020-07-21 14:26:49 +02:00
|
|
|
paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
VIR_DEBUG("Setup all chardevs");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupTPM(virDomainTPMDef *dev,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
switch (dev->type) {
|
|
|
|
case VIR_DOMAIN_TPM_TYPE_PASSTHROUGH:
|
2021-11-05 16:51:22 +01:00
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(dev->data.passthrough.source->data.file.path));
|
2020-07-20 16:18:57 +02:00
|
|
|
break;
|
|
|
|
|
|
|
|
case VIR_DOMAIN_TPM_TYPE_EMULATOR:
|
2022-10-17 15:20:24 +02:00
|
|
|
case VIR_DOMAIN_TPM_TYPE_EXTERNAL:
|
2020-07-20 16:18:57 +02:00
|
|
|
case VIR_DOMAIN_TPM_TYPE_LAST:
|
|
|
|
/* nada */
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupAllTPMs(virDomainObj *vm,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
VIR_DEBUG("Setting up TPMs");
|
|
|
|
|
|
|
|
for (i = 0; i < vm->def->ntpms; i++) {
|
2020-07-21 14:29:09 +02:00
|
|
|
if (qemuDomainSetupTPM(vm->def->tpms[i], paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
VIR_DEBUG("Setup all TPMs");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupGraphics(virDomainGraphicsDef *gfx,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
const char *rendernode = virDomainGraphicsGetRenderNode(gfx);
|
|
|
|
|
|
|
|
if (!rendernode)
|
|
|
|
return 0;
|
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(rendernode));
|
|
|
|
return 0;
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupAllGraphics(virDomainObj *vm,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
VIR_DEBUG("Setting up graphics");
|
|
|
|
for (i = 0; i < vm->def->ngraphics; i++) {
|
2020-07-21 12:57:49 +02:00
|
|
|
if (qemuDomainSetupGraphics(vm->def->graphics[i],
|
2020-07-21 14:30:44 +02:00
|
|
|
paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
VIR_DEBUG("Setup all graphics");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupInput(virDomainInputDef *input,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
const char *path = virDomainInputDefGetPath(input);
|
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (!path)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(path));
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupAllInputs(virDomainObj *vm,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
VIR_DEBUG("Setting up inputs");
|
|
|
|
for (i = 0; i < vm->def->ninputs; i++) {
|
2020-07-21 12:57:49 +02:00
|
|
|
if (qemuDomainSetupInput(vm->def->inputs[i],
|
2020-07-21 14:34:22 +02:00
|
|
|
paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
VIR_DEBUG("Setup all inputs");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupRNG(virDomainRNGDef *rng,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
switch ((virDomainRNGBackend) rng->backend) {
|
|
|
|
case VIR_DOMAIN_RNG_BACKEND_RANDOM:
|
2021-02-04 14:10:42 +01:00
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(rng->source.file));
|
2020-07-20 16:18:57 +02:00
|
|
|
break;
|
|
|
|
|
|
|
|
case VIR_DOMAIN_RNG_BACKEND_EGD:
|
|
|
|
case VIR_DOMAIN_RNG_BACKEND_BUILTIN:
|
|
|
|
case VIR_DOMAIN_RNG_BACKEND_LAST:
|
|
|
|
/* nada */
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupAllRNGs(virDomainObj *vm,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
VIR_DEBUG("Setting up RNGs");
|
|
|
|
for (i = 0; i < vm->def->nrngs; i++) {
|
2020-07-21 12:57:49 +02:00
|
|
|
if (qemuDomainSetupRNG(vm->def->rngs[i],
|
2020-07-21 14:37:22 +02:00
|
|
|
paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
VIR_DEBUG("Setup all RNGs");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupLoader(virDomainObj *vm,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-03-11 08:16:13 +01:00
|
|
|
virDomainLoaderDef *loader = vm->def->os.loader;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
VIR_DEBUG("Setting up loader");
|
|
|
|
|
|
|
|
if (loader) {
|
|
|
|
switch ((virDomainLoader) loader->type) {
|
|
|
|
case VIR_DOMAIN_LOADER_TYPE_ROM:
|
2021-02-04 14:10:42 +01:00
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(loader->path));
|
2020-07-20 16:18:57 +02:00
|
|
|
break;
|
|
|
|
|
|
|
|
case VIR_DOMAIN_LOADER_TYPE_PFLASH:
|
2021-02-04 14:10:42 +01:00
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(loader->path));
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2022-05-04 09:51:11 -07:00
|
|
|
if (loader->nvram &&
|
2022-06-03 13:11:08 +02:00
|
|
|
qemuDomainSetupDisk(loader->nvram, paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2020-07-20 16:18:57 +02:00
|
|
|
break;
|
|
|
|
|
|
|
|
case VIR_DOMAIN_LOADER_TYPE_NONE:
|
|
|
|
case VIR_DOMAIN_LOADER_TYPE_LAST:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
VIR_DEBUG("Setup loader");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainSetupLaunchSecurity(virDomainObj *vm,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList **paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-07-21 13:07:51 +02:00
|
|
|
virDomainSecDef *sec = vm->def->sec;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-07-21 13:07:51 +02:00
|
|
|
if (!sec)
|
2020-07-20 16:18:57 +02:00
|
|
|
return 0;
|
|
|
|
|
2021-07-21 13:07:51 +02:00
|
|
|
switch ((virDomainLaunchSecurity) sec->sectype) {
|
|
|
|
case VIR_DOMAIN_LAUNCH_SECURITY_SEV:
|
|
|
|
VIR_DEBUG("Setting up launch security for SEV");
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-07-21 13:07:51 +02:00
|
|
|
*paths = g_slist_prepend(*paths, g_strdup(QEMU_DEV_SEV));
|
|
|
|
|
|
|
|
VIR_DEBUG("Set up launch security for SEV");
|
|
|
|
break;
|
2021-07-21 13:17:40 +02:00
|
|
|
case VIR_DOMAIN_LAUNCH_SECURITY_PV:
|
|
|
|
break;
|
2021-07-21 13:07:51 +02:00
|
|
|
case VIR_DOMAIN_LAUNCH_SECURITY_NONE:
|
|
|
|
case VIR_DOMAIN_LAUNCH_SECURITY_LAST:
|
|
|
|
virReportEnumRangeError(virDomainLaunchSecurity, sec->sectype);
|
|
|
|
return -1;
|
|
|
|
}
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
qemu_domain_namespace: Repurpose qemuDomainBuildNamespace()
Okay, here is the deal. Currently, the way we build namespace is
very fragile. It is done from pre-exec hook when starting a
domain, after we mass closed all FDs and before we drop
privileges and exec() QEMU. This fact poses some limitations onto
the namespace build code, e.g. it has to make sure not to keep
any FD opened (not even through a library call), because it would
be leaked to QEMU. Also, it has to call only async signal safe
functions. These requirements are hard to meet - in fact as of my
commit v6.2.0-rc1~235 we are leaking a FD into QEMU by calling
libdevmapper functions.
To solve this issue and avoid similar problems in the future, we
should change our paradigm. We already have functions which can
populate domain's namespace with nodes from the daemon context.
If we use them to populate the namespace and keep only the bare
minimum in the pre-exec hook, we've mitigated the risk.
Therefore, the old qemuDomainBuildNamespace() is renamed to
qemuDomainUnshareNamespace() and new qemuDomainBuildNamespace()
function is introduced. So far, the new function is basically a
NOP and domain's namespace is still populated from the pre-exec
hook - next patches will fix it.
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Ján Tomko <jtomko@redhat.com>
2020-07-21 18:12:26 +02:00
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespaceMknodPaths(virDomainObj *vm,
|
2021-07-14 16:46:54 +02:00
|
|
|
GSList *paths,
|
|
|
|
bool *created);
|
qemu_domain_namespace: Repurpose qemuDomainBuildNamespace()
Okay, here is the deal. Currently, the way we build namespace is
very fragile. It is done from pre-exec hook when starting a
domain, after we mass closed all FDs and before we drop
privileges and exec() QEMU. This fact poses some limitations onto
the namespace build code, e.g. it has to make sure not to keep
any FD opened (not even through a library call), because it would
be leaked to QEMU. Also, it has to call only async signal safe
functions. These requirements are hard to meet - in fact as of my
commit v6.2.0-rc1~235 we are leaking a FD into QEMU by calling
libdevmapper functions.
To solve this issue and avoid similar problems in the future, we
should change our paradigm. We already have functions which can
populate domain's namespace with nodes from the daemon context.
If we use them to populate the namespace and keep only the bare
minimum in the pre-exec hook, we've mitigated the risk.
Therefore, the old qemuDomainBuildNamespace() is renamed to
qemuDomainUnshareNamespace() and new qemuDomainBuildNamespace()
function is introduced. So far, the new function is basically a
NOP and domain's namespace is still populated from the pre-exec
hook - next patches will fix it.
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Ján Tomko <jtomko@redhat.com>
2020-07-21 18:12:26 +02:00
|
|
|
|
|
|
|
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainBuildNamespace(virQEMUDriverConfig *cfg,
|
|
|
|
virDomainObj *vm)
|
qemu_domain_namespace: Repurpose qemuDomainBuildNamespace()
Okay, here is the deal. Currently, the way we build namespace is
very fragile. It is done from pre-exec hook when starting a
domain, after we mass closed all FDs and before we drop
privileges and exec() QEMU. This fact poses some limitations onto
the namespace build code, e.g. it has to make sure not to keep
any FD opened (not even through a library call), because it would
be leaked to QEMU. Also, it has to call only async signal safe
functions. These requirements are hard to meet - in fact as of my
commit v6.2.0-rc1~235 we are leaking a FD into QEMU by calling
libdevmapper functions.
To solve this issue and avoid similar problems in the future, we
should change our paradigm. We already have functions which can
populate domain's namespace with nodes from the daemon context.
If we use them to populate the namespace and keep only the bare
minimum in the pre-exec hook, we've mitigated the risk.
Therefore, the old qemuDomainBuildNamespace() is renamed to
qemuDomainUnshareNamespace() and new qemuDomainBuildNamespace()
function is introduced. So far, the new function is basically a
NOP and domain's namespace is still populated from the pre-exec
hook - next patches will fix it.
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Ján Tomko <jtomko@redhat.com>
2020-07-21 18:12:26 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
qemu_domain_namespace: Repurpose qemuDomainBuildNamespace()
Okay, here is the deal. Currently, the way we build namespace is
very fragile. It is done from pre-exec hook when starting a
domain, after we mass closed all FDs and before we drop
privileges and exec() QEMU. This fact poses some limitations onto
the namespace build code, e.g. it has to make sure not to keep
any FD opened (not even through a library call), because it would
be leaked to QEMU. Also, it has to call only async signal safe
functions. These requirements are hard to meet - in fact as of my
commit v6.2.0-rc1~235 we are leaking a FD into QEMU by calling
libdevmapper functions.
To solve this issue and avoid similar problems in the future, we
should change our paradigm. We already have functions which can
populate domain's namespace with nodes from the daemon context.
If we use them to populate the namespace and keep only the bare
minimum in the pre-exec hook, we've mitigated the risk.
Therefore, the old qemuDomainBuildNamespace() is renamed to
qemuDomainUnshareNamespace() and new qemuDomainBuildNamespace()
function is introduced. So far, the new function is basically a
NOP and domain's namespace is still populated from the pre-exec
hook - next patches will fix it.
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Ján Tomko <jtomko@redhat.com>
2020-07-21 18:12:26 +02:00
|
|
|
|
2020-08-21 15:49:29 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT)) {
|
|
|
|
VIR_DEBUG("namespaces disabled for domain %s", vm->def->name);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2020-07-21 17:13:11 +02:00
|
|
|
if (qemuDomainPopulateDevices(cfg, &paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2020-07-21 14:11:41 +02:00
|
|
|
if (qemuDomainSetupAllDisks(vm, &paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2020-07-21 14:18:59 +02:00
|
|
|
if (qemuDomainSetupAllHostdevs(vm, &paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2020-07-21 13:30:31 +02:00
|
|
|
if (qemuDomainSetupAllMemories(vm, &paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2020-07-21 14:26:49 +02:00
|
|
|
if (qemuDomainSetupAllChardevs(vm, &paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2020-07-21 14:29:09 +02:00
|
|
|
if (qemuDomainSetupAllTPMs(vm, &paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2020-07-21 14:30:44 +02:00
|
|
|
if (qemuDomainSetupAllGraphics(vm, &paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2020-07-21 14:34:22 +02:00
|
|
|
if (qemuDomainSetupAllInputs(vm, &paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2020-07-21 14:37:22 +02:00
|
|
|
if (qemuDomainSetupAllRNGs(vm, &paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2020-07-21 14:49:42 +02:00
|
|
|
if (qemuDomainSetupLoader(vm, &paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2020-07-21 14:51:13 +02:00
|
|
|
if (qemuDomainSetupLaunchSecurity(vm, &paths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2021-07-14 16:46:54 +02:00
|
|
|
if (qemuNamespaceMknodPaths(vm, paths, NULL) < 0)
|
qemu_domain_namespace: Repurpose qemuDomainBuildNamespace()
Okay, here is the deal. Currently, the way we build namespace is
very fragile. It is done from pre-exec hook when starting a
domain, after we mass closed all FDs and before we drop
privileges and exec() QEMU. This fact poses some limitations onto
the namespace build code, e.g. it has to make sure not to keep
any FD opened (not even through a library call), because it would
be leaked to QEMU. Also, it has to call only async signal safe
functions. These requirements are hard to meet - in fact as of my
commit v6.2.0-rc1~235 we are leaking a FD into QEMU by calling
libdevmapper functions.
To solve this issue and avoid similar problems in the future, we
should change our paradigm. We already have functions which can
populate domain's namespace with nodes from the daemon context.
If we use them to populate the namespace and keep only the bare
minimum in the pre-exec hook, we've mitigated the risk.
Therefore, the old qemuDomainBuildNamespace() is renamed to
qemuDomainUnshareNamespace() and new qemuDomainBuildNamespace()
function is introduced. So far, the new function is basically a
NOP and domain's namespace is still populated from the pre-exec
hook - next patches will fix it.
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Ján Tomko <jtomko@redhat.com>
2020-07-21 18:12:26 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2020-07-20 16:18:57 +02:00
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainUnshareNamespace(virQEMUDriverConfig *cfg,
|
|
|
|
virSecurityManager *mgr,
|
|
|
|
virDomainObj *vm)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
const char *devPath = NULL;
|
2021-08-03 13:01:04 +02:00
|
|
|
g_auto(GStrv) devMountsPath = NULL;
|
|
|
|
g_auto(GStrv) devMountsSavePath = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
size_t ndevMountsPath = 0, i;
|
|
|
|
int ret = -1;
|
|
|
|
|
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT)) {
|
|
|
|
ret = 0;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (qemuDomainGetPreservedMounts(cfg, vm,
|
|
|
|
&devMountsPath, &devMountsSavePath,
|
|
|
|
&ndevMountsPath) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
for (i = 0; i < ndevMountsPath; i++) {
|
|
|
|
if (STREQ(devMountsPath[i], "/dev")) {
|
|
|
|
devPath = devMountsSavePath[i];
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!devPath) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
|
|
|
|
_("Unable to find any /dev mount"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (virProcessSetupPrivateMountNS() < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
2020-07-21 17:13:11 +02:00
|
|
|
if (qemuDomainSetupDev(mgr, vm, devPath) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
/* Save some mount points because we want to share them with the host */
|
|
|
|
for (i = 0; i < ndevMountsPath; i++) {
|
|
|
|
struct stat sb;
|
|
|
|
|
|
|
|
if (devMountsSavePath[i] == devPath)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
if (stat(devMountsPath[i], &sb) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to stat: %s"),
|
|
|
|
devMountsPath[i]);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* At this point, devMountsPath is either:
|
|
|
|
* a file (regular or special), or
|
|
|
|
* a directory. */
|
2021-02-26 09:37:10 +01:00
|
|
|
if ((S_ISDIR(sb.st_mode) && g_mkdir_with_parents(devMountsSavePath[i], 0777) < 0) ||
|
2020-07-20 16:18:57 +02:00
|
|
|
(!S_ISDIR(sb.st_mode) && virFileTouch(devMountsSavePath[i], sb.st_mode) < 0)) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Failed to create %s"),
|
|
|
|
devMountsSavePath[i]);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (virFileMoveMount(devMountsPath[i], devMountsSavePath[i]) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (virFileMoveMount(devPath, "/dev") < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
for (i = 0; i < ndevMountsPath; i++) {
|
|
|
|
struct stat sb;
|
|
|
|
|
|
|
|
if (devMountsSavePath[i] == devPath)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
if (stat(devMountsSavePath[i], &sb) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to stat: %s"),
|
|
|
|
devMountsSavePath[i]);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (S_ISDIR(sb.st_mode)) {
|
2021-02-26 09:37:10 +01:00
|
|
|
if (g_mkdir_with_parents(devMountsPath[i], 0777) < 0) {
|
2020-07-20 16:18:57 +02:00
|
|
|
virReportSystemError(errno, _("Cannot create %s"),
|
|
|
|
devMountsPath[i]);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if (virFileMakeParentPath(devMountsPath[i]) < 0 ||
|
|
|
|
virFileTouch(devMountsPath[i], sb.st_mode) < 0) {
|
|
|
|
virReportSystemError(errno, _("Cannot create %s"),
|
|
|
|
devMountsPath[i]);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (virFileMoveMount(devMountsSavePath[i], devMountsPath[i]) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = 0;
|
|
|
|
cleanup:
|
|
|
|
for (i = 0; i < ndevMountsPath; i++) {
|
|
|
|
#if defined(__linux__)
|
|
|
|
umount(devMountsSavePath[i]);
|
|
|
|
#endif /* defined(__linux__) */
|
|
|
|
/* The path can be either a regular file or a dir. */
|
|
|
|
if (virFileIsDir(devMountsSavePath[i]))
|
|
|
|
virFileDeleteTree(devMountsSavePath[i]);
|
|
|
|
else
|
|
|
|
unlink(devMountsSavePath[i]);
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceEnabled(virDomainObj *vm,
|
2020-07-20 16:18:57 +02:00
|
|
|
qemuDomainNamespace ns)
|
|
|
|
{
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainObjPrivate *priv = vm->privateData;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
return priv->namespaces &&
|
|
|
|
virBitmapIsBitSet(priv->namespaces, ns);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainEnableNamespace(virDomainObj *vm,
|
2020-07-20 16:18:57 +02:00
|
|
|
qemuDomainNamespace ns)
|
|
|
|
{
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainObjPrivate *priv = vm->privateData;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-10-01 17:42:11 +02:00
|
|
|
if (!priv->namespaces)
|
|
|
|
priv->namespaces = virBitmapNew(QEMU_DOMAIN_NS_LAST);
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
if (virBitmapSetBit(priv->namespaces, ns) < 0) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("Unable to enable namespace: %s"),
|
|
|
|
qemuDomainNamespaceTypeToString(ns));
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static void
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainDisableNamespace(virDomainObj *vm,
|
2020-07-20 16:18:57 +02:00
|
|
|
qemuDomainNamespace ns)
|
|
|
|
{
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainObjPrivate *priv = vm->privateData;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
if (priv->namespaces) {
|
|
|
|
ignore_value(virBitmapClearBit(priv->namespaces, ns));
|
|
|
|
if (virBitmapIsAllClear(priv->namespaces)) {
|
2022-01-28 18:42:45 +01:00
|
|
|
g_clear_pointer(&priv->namespaces, virBitmapFree);
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainDestroyNamespace(virQEMUDriver *driver G_GNUC_UNUSED,
|
|
|
|
virDomainObj *vm)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
if (qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
qemuDomainDisableNamespace(vm, QEMU_DOMAIN_NS_MOUNT);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
|
|
|
qemuDomainNamespaceAvailable(qemuDomainNamespace ns G_GNUC_UNUSED)
|
|
|
|
{
|
|
|
|
#if !defined(__linux__)
|
|
|
|
/* Namespaces are Linux specific. */
|
|
|
|
return false;
|
|
|
|
|
|
|
|
#else /* defined(__linux__) */
|
|
|
|
|
|
|
|
switch (ns) {
|
|
|
|
case QEMU_DOMAIN_NS_MOUNT:
|
2021-05-26 18:42:40 +02:00
|
|
|
# if !defined(WITH_LIBACL) || !defined(WITH_SELINUX)
|
2020-07-20 16:18:57 +02:00
|
|
|
/* We can't create the exact copy of paths if either of
|
|
|
|
* these is not available. */
|
|
|
|
return false;
|
|
|
|
# else
|
|
|
|
if (virProcessNamespaceAvailable(VIR_PROCESS_NAMESPACE_MNT) < 0)
|
|
|
|
return false;
|
|
|
|
# endif
|
|
|
|
break;
|
|
|
|
case QEMU_DOMAIN_NS_LAST:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
#endif /* defined(__linux__) */
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
typedef struct _qemuNamespaceMknodItem qemuNamespaceMknodItem;
|
|
|
|
struct _qemuNamespaceMknodItem {
|
2020-09-07 13:35:50 +02:00
|
|
|
char *file;
|
2020-07-20 18:54:34 +02:00
|
|
|
char *target;
|
2020-07-20 20:00:19 +02:00
|
|
|
bool bindmounted;
|
2020-07-20 16:18:57 +02:00
|
|
|
GStatBuf sb;
|
|
|
|
void *acl;
|
|
|
|
char *tcon;
|
|
|
|
};
|
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
typedef struct _qemuNamespaceMknodData qemuNamespaceMknodData;
|
|
|
|
struct _qemuNamespaceMknodData {
|
2021-03-11 08:16:13 +01:00
|
|
|
virQEMUDriver *driver;
|
|
|
|
virDomainObj *vm;
|
|
|
|
qemuNamespaceMknodItem *items;
|
2020-07-20 20:00:19 +02:00
|
|
|
size_t nitems;
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
static void
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespaceMknodItemClear(qemuNamespaceMknodItem *item)
|
2020-07-20 20:00:19 +02:00
|
|
|
{
|
2020-09-07 13:35:50 +02:00
|
|
|
VIR_FREE(item->file);
|
2020-07-20 20:00:19 +02:00
|
|
|
VIR_FREE(item->target);
|
|
|
|
virFileFreeACLs(&item->acl);
|
|
|
|
#ifdef WITH_SELINUX
|
|
|
|
freecon(item->tcon);
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2020-09-07 13:35:50 +02:00
|
|
|
G_DEFINE_AUTO_CLEANUP_CLEAR_FUNC(qemuNamespaceMknodItem, qemuNamespaceMknodItemClear);
|
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
static void
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespaceMknodDataClear(qemuNamespaceMknodData *data)
|
2020-07-20 20:00:19 +02:00
|
|
|
{
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
for (i = 0; i < data->nitems; i++) {
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespaceMknodItem *item = &data->items[i];
|
2020-07-20 20:00:19 +02:00
|
|
|
|
|
|
|
qemuNamespaceMknodItemClear(item);
|
|
|
|
}
|
|
|
|
|
|
|
|
VIR_FREE(data->items);
|
|
|
|
}
|
|
|
|
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
/* Our way of creating devices is highly linux specific */
|
|
|
|
#if defined(__linux__)
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespaceMknodOne(qemuNamespaceMknodItem *data)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
int ret = -1;
|
|
|
|
bool delDevice = false;
|
|
|
|
bool isLink = S_ISLNK(data->sb.st_mode);
|
|
|
|
bool isDev = S_ISCHR(data->sb.st_mode) || S_ISBLK(data->sb.st_mode);
|
|
|
|
bool isReg = S_ISREG(data->sb.st_mode) || S_ISFIFO(data->sb.st_mode) || S_ISSOCK(data->sb.st_mode);
|
|
|
|
bool isDir = S_ISDIR(data->sb.st_mode);
|
2021-07-14 16:46:52 +02:00
|
|
|
bool exists = false;
|
|
|
|
|
|
|
|
if (virFileExists(data->file))
|
|
|
|
exists = true;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
if (virFileMakeParentPath(data->file) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to create %s"), data->file);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (isLink) {
|
2022-03-14 13:35:15 +01:00
|
|
|
g_autofree char *target = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2022-09-28 09:53:47 +02:00
|
|
|
if ((target = g_file_read_link(data->file, NULL)) &&
|
2022-03-14 13:35:15 +01:00
|
|
|
STREQ(target, data->target)) {
|
|
|
|
VIR_DEBUG("Skipping symlink %s -> %s which exists and points to correct target",
|
|
|
|
data->file, data->target);
|
2020-07-20 16:18:57 +02:00
|
|
|
} else {
|
2022-03-14 13:35:15 +01:00
|
|
|
VIR_DEBUG("Creating symlink %s -> %s", data->file, data->target);
|
|
|
|
|
|
|
|
/* First, unlink the symlink target. Symlinks change and
|
|
|
|
* therefore we have no guarantees that pre-existing
|
|
|
|
* symlink is still valid. */
|
|
|
|
if (unlink(data->file) < 0 &&
|
|
|
|
errno != ENOENT) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to remove symlink %s"),
|
|
|
|
data->file);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (symlink(data->target, data->file) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to create symlink %s (pointing to %s)"),
|
|
|
|
data->file, data->target);
|
|
|
|
goto cleanup;
|
|
|
|
} else {
|
|
|
|
delDevice = true;
|
|
|
|
}
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
} else if (isDev) {
|
2022-03-14 13:35:15 +01:00
|
|
|
GStatBuf sb;
|
|
|
|
|
|
|
|
if (g_lstat(data->file, &sb) >= 0 &&
|
|
|
|
sb.st_rdev == data->sb.st_rdev) {
|
|
|
|
VIR_DEBUG("Skipping dev %s (%d,%d) which exists and has correct MAJ:MIN",
|
|
|
|
data->file, major(data->sb.st_rdev), minor(data->sb.st_rdev));
|
2020-07-20 16:18:57 +02:00
|
|
|
} else {
|
2022-03-14 13:35:15 +01:00
|
|
|
VIR_DEBUG("Creating dev %s (%d,%d)",
|
|
|
|
data->file, major(data->sb.st_rdev), minor(data->sb.st_rdev));
|
|
|
|
unlink(data->file);
|
|
|
|
if (mknod(data->file, data->sb.st_mode, data->sb.st_rdev) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to create device %s"),
|
|
|
|
data->file);
|
|
|
|
goto cleanup;
|
|
|
|
} else {
|
|
|
|
delDevice = true;
|
|
|
|
}
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
} else if (isReg || isDir) {
|
|
|
|
/* We are not cleaning up disks on virDomainDetachDevice
|
|
|
|
* because disk might be still in use by different disk
|
|
|
|
* as its backing chain. This might however clash here.
|
|
|
|
* Therefore do the cleanup here. */
|
|
|
|
if (umount(data->file) < 0 &&
|
|
|
|
errno != ENOENT && errno != EINVAL) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to umount %s"),
|
|
|
|
data->file);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
if ((isReg && virFileTouch(data->file, data->sb.st_mode) < 0) ||
|
2021-02-26 09:17:30 +01:00
|
|
|
(isDir && g_mkdir_with_parents(data->file, data->sb.st_mode) < 0))
|
2020-07-20 16:18:57 +02:00
|
|
|
goto cleanup;
|
|
|
|
delDevice = true;
|
|
|
|
/* Just create the file here so that code below sets
|
|
|
|
* proper owner and mode. Move the mount only after that. */
|
|
|
|
} else {
|
|
|
|
virReportError(VIR_ERR_OPERATION_UNSUPPORTED,
|
|
|
|
_("unsupported device type %s 0%o"),
|
|
|
|
data->file, data->sb.st_mode);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (lchown(data->file, data->sb.st_uid, data->sb.st_gid) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Failed to chown device %s"),
|
|
|
|
data->file);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Symlinks don't have mode */
|
|
|
|
if (!isLink &&
|
|
|
|
chmod(data->file, data->sb.st_mode) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Failed to set permissions for device %s"),
|
|
|
|
data->file);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
2022-09-06 13:37:23 +02:00
|
|
|
if (data->acl &&
|
2020-07-20 16:18:57 +02:00
|
|
|
virFileSetACLs(data->file, data->acl) < 0 &&
|
|
|
|
errno != ENOTSUP) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to set ACLs on %s"), data->file);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
# ifdef WITH_SELINUX
|
|
|
|
if (data->tcon &&
|
|
|
|
lsetfilecon_raw(data->file, (const char *)data->tcon) < 0) {
|
|
|
|
VIR_WARNINGS_NO_WLOGICALOP_EQUAL_EXPR
|
|
|
|
if (errno != EOPNOTSUPP && errno != ENOTSUP) {
|
|
|
|
VIR_WARNINGS_RESET
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to set SELinux label on %s"),
|
|
|
|
data->file);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
# endif
|
|
|
|
|
|
|
|
/* Finish mount process started earlier. */
|
|
|
|
if ((isReg || isDir) &&
|
|
|
|
virFileMoveMount(data->target, data->file) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
2021-07-14 16:46:52 +02:00
|
|
|
ret = exists;
|
2020-07-20 16:18:57 +02:00
|
|
|
cleanup:
|
|
|
|
if (ret < 0 && delDevice) {
|
|
|
|
if (isDir)
|
|
|
|
virFileDeleteTree(data->file);
|
|
|
|
else
|
|
|
|
unlink(data->file);
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2020-07-21 09:44:36 +02:00
|
|
|
/**
 * qemuNamespaceMknodItemNeedsBindMount:
 * @st_mode: file mode as found in a stat buffer
 *
 * Returns: true for directories, regular files, FIFOs and sockets;
 *          false for everything else. Block and character devices are
 *          deliberately excluded: they are created with mknod()
 *          rather than passed in through bind mounting.
 */
static bool
qemuNamespaceMknodItemNeedsBindMount(mode_t st_mode)
{
    if (S_ISDIR(st_mode))
        return true;

    if (S_ISREG(st_mode))
        return true;

    if (S_ISFIFO(st_mode))
        return true;

    return S_ISSOCK(st_mode);
}
|
|
|
|
|
|
|
|
|
2020-07-20 16:18:57 +02:00
|
|
|
static int
|
2020-07-20 20:00:19 +02:00
|
|
|
qemuNamespaceMknodHelper(pid_t pid G_GNUC_UNUSED,
|
|
|
|
void *opaque)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespaceMknodData *data = opaque;
|
2020-07-20 20:00:19 +02:00
|
|
|
size_t i;
|
2020-07-20 16:18:57 +02:00
|
|
|
int ret = -1;
|
2021-07-14 16:46:52 +02:00
|
|
|
bool exists = false;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
qemuSecurityPostFork(data->driver->securityManager);
|
|
|
|
|
|
|
|
for (i = 0; i < data->nitems; i++) {
|
2021-07-14 16:46:52 +02:00
|
|
|
int rc = 0;
|
|
|
|
|
|
|
|
if ((rc = qemuNamespaceMknodOne(&data->items[i])) < 0)
|
2020-07-20 20:00:19 +02:00
|
|
|
goto cleanup;
|
2021-07-14 16:46:52 +02:00
|
|
|
|
|
|
|
if (rc > 0)
|
|
|
|
exists = true;
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
2021-07-14 16:46:52 +02:00
|
|
|
ret = exists;
|
2020-07-20 20:00:19 +02:00
|
|
|
cleanup:
|
|
|
|
qemuNamespaceMknodDataClear(data);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespaceMknodItemInit(qemuNamespaceMknodItem *item,
|
|
|
|
virQEMUDriverConfig *cfg,
|
|
|
|
virDomainObj *vm,
|
2020-07-20 20:00:19 +02:00
|
|
|
const char *file)
|
|
|
|
{
|
|
|
|
g_autofree char *target = NULL;
|
|
|
|
bool isLink;
|
|
|
|
bool needsBindMount;
|
|
|
|
|
2020-09-07 13:35:50 +02:00
|
|
|
item->file = g_strdup(file);
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
if (g_lstat(file, &item->sb) < 0) {
|
qemu_namespace: Be tolerant to non-existent files when populating /dev
In 6.7.0 release I've changed how domain namespace is built and
populated. Previously it used to be done from a pre-exec hook
(ran in the forked off child, just before dropping all privileges
and exec()-ing QEMU), which not only meant we had to have two
different code paths for creating a node in domain's namespace
(one for this pre-exec hook, the other for hotplug ran from the
daemon), it also proved problematic because it was leaking FDs
into QEMU process.
To mitigate this problem, we've not only ditched libdevmapper
from the NS population process, I've also dropped the pre-exec
code and let the NS be populated from the daemon (using the
hotplug code). But, I was not careful when doing so, because the
pre-exec code was tolerant to files that doesn't exist, while
this new code isn't. For instance, the very first thing that is
done when the new NS is created is it's populated with
@defaultDeviceACL which contain files like /dev/null, /dev/zero,
/dev/random and /dev/kvm (and others). While the rest will
probably exist every time, /dev/kvm might not and thus the new
code I wrote has to be tolerant to that.
Of course, users can override the @defaultDeviceACL (by setting
cgroup_device_acl in qemu.conf) and remove /dev/kvm (which is
acceptable workaround), but we definitely want libvirt to work
out of the box even on hosts without KVM.
Fixes: 9048dc4e627ddf33996084167bece7b5fb83b0bc
Reported-by: Daniel P. Berrangé <berrange@redhat.com>
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Daniel P. Berrangé <berrange@redhat.com>
Reviewed-by: Ján Tomko <jtomko@redhat.com>
2020-09-03 18:07:43 +02:00
|
|
|
if (errno == ENOENT)
|
|
|
|
return -2;
|
|
|
|
|
2020-07-20 16:18:57 +02:00
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to access %s"), file);
|
2020-07-20 20:00:19 +02:00
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
isLink = S_ISLNK(item->sb.st_mode);
|
|
|
|
needsBindMount = qemuNamespaceMknodItemNeedsBindMount(item->sb.st_mode);
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-21 09:44:36 +02:00
|
|
|
if (needsBindMount && STRPREFIX(file, QEMU_DEVPREFIX)) {
|
2020-07-20 16:18:57 +02:00
|
|
|
if (!(target = qemuDomainGetPreservedMountPath(cfg, vm, file)))
|
2020-07-20 20:00:19 +02:00
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
item->target = g_steal_pointer(&target);
|
2020-07-20 16:18:57 +02:00
|
|
|
} else if (isLink) {
|
|
|
|
g_autoptr(GError) gerr = NULL;
|
|
|
|
|
|
|
|
if (!(target = g_file_read_link(file, &gerr))) {
|
|
|
|
virReportError(VIR_ERR_SYSTEM_ERROR,
|
|
|
|
_("failed to resolve symlink %s: %s"), file, gerr->message);
|
2020-07-20 20:00:19 +02:00
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
if (!g_path_is_absolute(target)) {
|
|
|
|
g_autofree char *fileTmp = g_strdup(file);
|
2020-07-20 20:00:19 +02:00
|
|
|
char *c = NULL;
|
|
|
|
char *tmp = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
|
|
|
if ((c = strrchr(fileTmp, '/')))
|
|
|
|
*(c + 1) = '\0';
|
|
|
|
|
|
|
|
tmp = g_strdup_printf("%s%s", fileTmp, target);
|
|
|
|
VIR_FREE(target);
|
|
|
|
target = g_steal_pointer(&tmp);
|
|
|
|
}
|
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
item->target = g_steal_pointer(&target);
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Symlinks don't have ACLs. */
|
|
|
|
if (!isLink &&
|
2020-07-20 20:00:19 +02:00
|
|
|
virFileGetACLs(file, &item->acl) < 0 &&
|
2020-07-20 16:18:57 +02:00
|
|
|
errno != ENOTSUP) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to get ACLs on %s"), file);
|
2020-07-20 20:00:19 +02:00
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
# ifdef WITH_SELINUX
|
2020-07-20 20:00:19 +02:00
|
|
|
if (lgetfilecon_raw(file, &item->tcon) < 0 &&
|
2020-07-20 16:18:57 +02:00
|
|
|
(errno != ENOTSUP && errno != ENODATA)) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to get SELinux label from %s"), file);
|
2020-07-20 20:00:19 +02:00
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
# endif
|
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
return 0;
|
|
|
|
}
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespacePrepareOneItem(qemuNamespaceMknodData *data,
|
|
|
|
virQEMUDriverConfig *cfg,
|
|
|
|
virDomainObj *vm,
|
2020-07-21 10:58:41 +02:00
|
|
|
const char *file,
|
2021-08-03 12:43:19 +02:00
|
|
|
GStrv devMountsPath)
|
2020-07-20 20:00:19 +02:00
|
|
|
{
|
|
|
|
long ttl = sysconf(_SC_SYMLOOP_MAX);
|
2020-09-07 13:35:50 +02:00
|
|
|
g_autofree char *next = g_strdup(file);
|
2020-07-20 20:00:19 +02:00
|
|
|
|
|
|
|
while (1) {
|
2020-09-07 13:35:50 +02:00
|
|
|
g_auto(qemuNamespaceMknodItem) item = { 0 };
|
|
|
|
bool isLink;
|
qemu_namespace: Be tolerant to non-existent files when populating /dev
In 6.7.0 release I've changed how domain namespace is built and
populated. Previously it used to be done from a pre-exec hook
(ran in the forked off child, just before dropping all privileges
and exec()-ing QEMU), which not only meant we had to have two
different code paths for creating a node in domain's namespace
(one for this pre-exec hook, the other for hotplug ran from the
daemon), it also proved problematic because it was leaking FDs
into QEMU process.
To mitigate this problem, we've not only ditched libdevmapper
from the NS population process, I've also dropped the pre-exec
code and let the NS be populated from the daemon (using the
hotplug code). But, I was not careful when doing so, because the
pre-exec code was tolerant to files that doesn't exist, while
this new code isn't. For instance, the very first thing that is
done when the new NS is created is it's populated with
@defaultDeviceACL which contain files like /dev/null, /dev/zero,
/dev/random and /dev/kvm (and others). While the rest will
probably exist every time, /dev/kvm might not and thus the new
code I wrote has to be tolerant to that.
Of course, users can override the @defaultDeviceACL (by setting
cgroup_device_acl in qemu.conf) and remove /dev/kvm (which is
acceptable workaround), but we definitely want libvirt to work
out of the box even on hosts without KVM.
Fixes: 9048dc4e627ddf33996084167bece7b5fb83b0bc
Reported-by: Daniel P. Berrangé <berrange@redhat.com>
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Daniel P. Berrangé <berrange@redhat.com>
Reviewed-by: Ján Tomko <jtomko@redhat.com>
2020-09-03 18:07:43 +02:00
|
|
|
int rc;
|
2020-07-20 20:00:19 +02:00
|
|
|
|
qemu_namespace: Be tolerant to non-existent files when populating /dev
In 6.7.0 release I've changed how domain namespace is built and
populated. Previously it used to be done from a pre-exec hook
(ran in the forked off child, just before dropping all privileges
and exec()-ing QEMU), which not only meant we had to have two
different code paths for creating a node in domain's namespace
(one for this pre-exec hook, the other for hotplug ran from the
daemon), it also proved problematic because it was leaking FDs
into QEMU process.
To mitigate this problem, we've not only ditched libdevmapper
from the NS population process, I've also dropped the pre-exec
code and let the NS be populated from the daemon (using the
hotplug code). But, I was not careful when doing so, because the
pre-exec code was tolerant to files that doesn't exist, while
this new code isn't. For instance, the very first thing that is
done when the new NS is created is it's populated with
@defaultDeviceACL which contain files like /dev/null, /dev/zero,
/dev/random and /dev/kvm (and others). While the rest will
probably exist every time, /dev/kvm might not and thus the new
code I wrote has to be tolerant to that.
Of course, users can override the @defaultDeviceACL (by setting
cgroup_device_acl in qemu.conf) and remove /dev/kvm (which is
acceptable workaround), but we definitely want libvirt to work
out of the box even on hosts without KVM.
Fixes: 9048dc4e627ddf33996084167bece7b5fb83b0bc
Reported-by: Daniel P. Berrangé <berrange@redhat.com>
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Daniel P. Berrangé <berrange@redhat.com>
Reviewed-by: Ján Tomko <jtomko@redhat.com>
2020-09-03 18:07:43 +02:00
|
|
|
rc = qemuNamespaceMknodItemInit(&item, cfg, vm, next);
|
|
|
|
if (rc == -2) {
|
|
|
|
/* @file doesn't exist. We can break here. */
|
|
|
|
break;
|
|
|
|
} else if (rc < 0) {
|
|
|
|
/* Some other (critical) error. */
|
2020-07-20 20:00:19 +02:00
|
|
|
return -1;
|
qemu_namespace: Be tolerant to non-existent files when populating /dev
In 6.7.0 release I've changed how domain namespace is built and
populated. Previously it used to be done from a pre-exec hook
(ran in the forked off child, just before dropping all privileges
and exec()-ing QEMU), which not only meant we had to have two
different code paths for creating a node in domain's namespace
(one for this pre-exec hook, the other for hotplug ran from the
daemon), it also proved problematic because it was leaking FDs
into QEMU process.
To mitigate this problem, we've not only ditched libdevmapper
from the NS population process, I've also dropped the pre-exec
code and let the NS be populated from the daemon (using the
hotplug code). But, I was not careful when doing so, because the
pre-exec code was tolerant to files that doesn't exist, while
this new code isn't. For instance, the very first thing that is
done when the new NS is created is it's populated with
@defaultDeviceACL which contain files like /dev/null, /dev/zero,
/dev/random and /dev/kvm (and others). While the rest will
probably exist every time, /dev/kvm might not and thus the new
code I wrote has to be tolerant to that.
Of course, users can override the @defaultDeviceACL (by setting
cgroup_device_acl in qemu.conf) and remove /dev/kvm (which is
acceptable workaround), but we definitely want libvirt to work
out of the box even on hosts without KVM.
Fixes: 9048dc4e627ddf33996084167bece7b5fb83b0bc
Reported-by: Daniel P. Berrangé <berrange@redhat.com>
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
Reviewed-by: Daniel P. Berrangé <berrange@redhat.com>
Reviewed-by: Ján Tomko <jtomko@redhat.com>
2020-09-03 18:07:43 +02:00
|
|
|
}
|
2020-07-20 20:00:19 +02:00
|
|
|
|
2020-09-07 13:35:50 +02:00
|
|
|
isLink = S_ISLNK(item.sb.st_mode);
|
2021-08-05 17:00:45 +02:00
|
|
|
g_free(next);
|
|
|
|
next = g_strdup(item.target);
|
2020-09-07 13:35:50 +02:00
|
|
|
|
2021-08-05 17:00:45 +02:00
|
|
|
if (STRPREFIX(item.file, QEMU_DEVPREFIX)) {
|
2021-08-03 12:43:19 +02:00
|
|
|
GStrv n;
|
|
|
|
bool found = false;
|
|
|
|
|
|
|
|
for (n = devMountsPath; n && *n; n++) {
|
|
|
|
if (STREQ(*n, "/dev"))
|
2020-07-20 20:00:19 +02:00
|
|
|
continue;
|
2021-08-03 12:43:19 +02:00
|
|
|
if (STRPREFIX(item.file, *n)) {
|
|
|
|
found = true;
|
2020-07-20 20:00:19 +02:00
|
|
|
break;
|
2021-08-03 12:43:19 +02:00
|
|
|
}
|
2020-07-20 20:00:19 +02:00
|
|
|
}
|
|
|
|
|
2021-08-03 12:43:19 +02:00
|
|
|
if (!found)
|
2021-08-05 17:00:45 +02:00
|
|
|
VIR_APPEND_ELEMENT(data->items, data->nitems, item);
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
2020-09-07 13:35:50 +02:00
|
|
|
if (!isLink)
|
2020-07-20 20:00:19 +02:00
|
|
|
break;
|
|
|
|
|
|
|
|
if (ttl-- == 0) {
|
|
|
|
virReportSystemError(ELOOP,
|
|
|
|
_("Too many levels of symbolic links: %s"),
|
|
|
|
next);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespaceMknodPaths(virDomainObj *vm,
|
2021-07-14 16:46:54 +02:00
|
|
|
GSList *paths,
|
|
|
|
bool *created)
|
2020-07-20 20:00:19 +02:00
|
|
|
{
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainObjPrivate *priv = vm->privateData;
|
|
|
|
virQEMUDriver *driver = priv->driver;
|
2020-07-21 10:58:41 +02:00
|
|
|
g_autoptr(virQEMUDriverConfig) cfg = NULL;
|
2021-08-03 12:45:37 +02:00
|
|
|
g_auto(GStrv) devMountsPath = NULL;
|
2020-07-20 20:00:19 +02:00
|
|
|
qemuNamespaceMknodData data = { 0 };
|
|
|
|
size_t i;
|
|
|
|
int ret = -1;
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList *next;
|
2020-07-20 20:00:19 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (!paths)
|
2020-07-21 10:58:41 +02:00
|
|
|
return 0;
|
|
|
|
|
|
|
|
cfg = virQEMUDriverGetConfig(driver);
|
2021-08-03 12:45:37 +02:00
|
|
|
if (qemuDomainGetPreservedMounts(cfg, vm, &devMountsPath, NULL, NULL) < 0)
|
2020-07-21 10:58:41 +02:00
|
|
|
return -1;
|
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
data.driver = driver;
|
|
|
|
data.vm = vm;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
for (next = paths; next; next = next->next) {
|
|
|
|
const char *path = next->data;
|
|
|
|
|
2021-08-03 12:43:19 +02:00
|
|
|
if (qemuNamespacePrepareOneItem(&data, cfg, vm, path, devMountsPath) < 0)
|
2020-07-21 10:58:41 +02:00
|
|
|
goto cleanup;
|
|
|
|
}
|
2020-07-20 20:00:19 +02:00
|
|
|
|
2022-09-28 09:47:37 +02:00
|
|
|
if (data.nitems == 0)
|
|
|
|
return 0;
|
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
for (i = 0; i < data.nitems; i++) {
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespaceMknodItem *item = &data.items[i];
|
2020-07-20 20:00:19 +02:00
|
|
|
if (item->target &&
|
|
|
|
qemuNamespaceMknodItemNeedsBindMount(item->sb.st_mode)) {
|
|
|
|
if (virFileBindMountDevice(item->file, item->target) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
goto cleanup;
|
2020-07-20 20:00:19 +02:00
|
|
|
item->bindmounted = true;
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-07-20 20:00:19 +02:00
|
|
|
if (qemuSecurityPreFork(driver->securityManager) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
2021-07-14 16:46:54 +02:00
|
|
|
ret = virProcessRunInMountNamespace(vm->pid, qemuNamespaceMknodHelper,
|
|
|
|
&data);
|
2020-07-20 20:00:19 +02:00
|
|
|
qemuSecurityPostFork(driver->securityManager);
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-07-14 16:46:54 +02:00
|
|
|
if (ret == 0 && created != NULL)
|
|
|
|
*created = true;
|
|
|
|
|
2020-07-20 16:18:57 +02:00
|
|
|
cleanup:
|
2020-07-20 20:00:19 +02:00
|
|
|
for (i = 0; i < data.nitems; i++) {
|
|
|
|
if (data.items[i].bindmounted &&
|
|
|
|
umount(data.items[i].target) < 0) {
|
|
|
|
VIR_WARN("Unable to unmount %s", data.items[i].target);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
qemuNamespaceMknodDataClear(&data);
|
2020-07-20 16:18:57 +02:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
#else /* !defined(__linux__) */
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespaceMknodPaths(virDomainObj *vm G_GNUC_UNUSED,
|
2021-07-14 16:46:54 +02:00
|
|
|
GSList *paths G_GNUC_UNUSED,
|
|
|
|
bool *created G_GNUC_UNUSED)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
virReportSystemError(ENOSYS, "%s",
|
|
|
|
_("Namespaces are not supported on this platform."));
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
#endif /* !defined(__linux__) */
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2020-07-21 15:04:38 +02:00
|
|
|
qemuNamespaceUnlinkHelper(pid_t pid G_GNUC_UNUSED,
|
|
|
|
void *opaque)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = opaque;
|
|
|
|
GSList *next;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
for (next = paths; next; next = next->next) {
|
|
|
|
const char *path = next->data;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-21 15:04:38 +02:00
|
|
|
VIR_DEBUG("Unlinking %s", path);
|
|
|
|
if (unlink(path) < 0 && errno != ENOENT) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Unable to remove device %s"), path);
|
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuNamespaceUnlinkPaths(virDomainObj *vm,
|
2021-02-04 14:10:42 +01:00
|
|
|
GSList *paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainObjPrivate *priv = vm->privateData;
|
|
|
|
virQEMUDriver *driver = priv->driver;
|
2020-07-20 16:18:57 +02:00
|
|
|
g_autoptr(virQEMUDriverConfig) cfg = NULL;
|
2021-02-04 15:12:57 +01:00
|
|
|
g_auto(GStrv) devMountsPath = NULL;
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) unlinkPaths = NULL;
|
|
|
|
GSList *next;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (!paths)
|
2020-07-20 16:18:57 +02:00
|
|
|
return 0;
|
|
|
|
|
|
|
|
cfg = virQEMUDriverGetConfig(driver);
|
|
|
|
|
2021-02-04 15:12:57 +01:00
|
|
|
if (qemuDomainGetPreservedMounts(cfg, vm, &devMountsPath, NULL, NULL) < 0)
|
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
for (next = paths; next; next = next->next) {
|
|
|
|
const char *path = next->data;
|
2020-07-21 15:04:38 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (STRPREFIX(path, QEMU_DEVPREFIX)) {
|
2021-02-04 14:27:19 +01:00
|
|
|
GStrv mount;
|
|
|
|
bool inSubmount = false;
|
2022-03-14 15:05:11 +01:00
|
|
|
const char *const *devices = (const char *const *)cfg->cgroupDeviceACL;
|
2021-02-04 14:27:19 +01:00
|
|
|
|
|
|
|
for (mount = devMountsPath; *mount; mount++) {
|
|
|
|
if (STREQ(*mount, "/dev"))
|
2020-07-21 15:04:38 +02:00
|
|
|
continue;
|
2021-02-04 14:27:19 +01:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (STRPREFIX(path, *mount)) {
|
2021-02-04 14:27:19 +01:00
|
|
|
inSubmount = true;
|
2020-07-21 15:04:38 +02:00
|
|
|
break;
|
2021-02-04 14:27:19 +01:00
|
|
|
}
|
2020-07-21 15:04:38 +02:00
|
|
|
}
|
|
|
|
|
2022-03-14 15:05:11 +01:00
|
|
|
if (inSubmount)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
if (!devices)
|
|
|
|
devices = defaultDeviceACL;
|
|
|
|
|
|
|
|
if (g_strv_contains(devices, path))
|
|
|
|
continue;
|
|
|
|
|
|
|
|
unlinkPaths = g_slist_prepend(unlinkPaths, g_strdup(path));
|
2020-07-21 15:04:38 +02:00
|
|
|
}
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
2020-07-21 15:04:38 +02:00
|
|
|
if (unlinkPaths &&
|
|
|
|
virProcessRunInMountNamespace(vm->pid,
|
|
|
|
qemuNamespaceUnlinkHelper,
|
|
|
|
unlinkPaths) < 0)
|
|
|
|
return -1;
|
|
|
|
|
2021-02-04 15:12:57 +01:00
|
|
|
return 0;
|
2020-07-20 16:18:57 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2022-09-06 13:43:58 +02:00
|
|
|
int
|
|
|
|
qemuDomainNamespaceSetupPath(virDomainObj *vm,
|
|
|
|
const char *path,
|
|
|
|
bool *created)
|
|
|
|
{
|
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
|
|
|
|
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
paths = g_slist_prepend(paths, g_strdup(path));
|
|
|
|
|
|
|
|
if (qemuNamespaceMknodPaths(vm, paths, created) < 0)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2020-07-20 16:18:57 +02:00
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceSetupDisk(virDomainObj *vm,
|
2021-07-14 16:46:54 +02:00
|
|
|
virStorageSource *src,
|
|
|
|
bool *created)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 18:01:16 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
2020-07-21 14:11:41 +02:00
|
|
|
if (qemuDomainSetupDisk(src, &paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
2021-07-14 16:46:54 +02:00
|
|
|
if (qemuNamespaceMknodPaths(vm, paths, created) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceTeardownDisk(virDomainObj *vm G_GNUC_UNUSED,
|
|
|
|
virStorageSource *src G_GNUC_UNUSED)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
|
|
|
/* While in hotplug case we create the whole backing chain,
|
|
|
|
* here we must limit ourselves. The disk we want to remove
|
|
|
|
* might be a part of backing chain of another disk.
|
|
|
|
* If you are reading these lines and have some spare time
|
|
|
|
* you can come up with and algorithm that checks for that.
|
|
|
|
* I don't, therefore: */
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* qemuDomainNamespaceSetupHostdev:
|
|
|
|
* @vm: domain object
|
|
|
|
* @hostdev: hostdev to create in @vm's namespace
|
|
|
|
*
|
|
|
|
* For given @hostdev, create its devfs representation (if it has one) in
|
|
|
|
* domain namespace. Note, @hostdev must not be in @vm's definition.
|
|
|
|
*
|
|
|
|
* Returns: 0 on success,
|
|
|
|
* -1 otherwise.
|
|
|
|
*/
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceSetupHostdev(virDomainObj *vm,
|
2021-07-14 16:46:54 +02:00
|
|
|
virDomainHostdevDef *hostdev,
|
|
|
|
bool *created)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 18:01:16 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
2020-07-21 14:18:59 +02:00
|
|
|
if (qemuDomainSetupHostdev(vm,
|
|
|
|
hostdev,
|
|
|
|
true,
|
|
|
|
&paths) < 0)
|
2020-07-21 12:14:02 +02:00
|
|
|
return -1;
|
|
|
|
|
2021-07-14 16:46:54 +02:00
|
|
|
if (qemuNamespaceMknodPaths(vm, paths, created) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* qemuDomainNamespaceTeardownHostdev:
|
|
|
|
* @vm: domain object
|
|
|
|
* @hostdev: hostdev to remove in @vm's namespace
|
|
|
|
*
|
|
|
|
* For given @hostdev, remove its devfs representation (if it has one) in
|
|
|
|
* domain namespace. Note, @hostdev must not be in @vm's definition.
|
|
|
|
*
|
|
|
|
* Returns: 0 on success,
|
|
|
|
* -1 otherwise.
|
|
|
|
*/
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceTeardownHostdev(virDomainObj *vm,
|
|
|
|
virDomainHostdevDef *hostdev)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 18:01:16 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
2020-07-21 15:08:13 +02:00
|
|
|
if (qemuDomainSetupHostdev(vm,
|
|
|
|
hostdev,
|
|
|
|
true,
|
|
|
|
&paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (qemuNamespaceUnlinkPaths(vm, paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceSetupMemory(virDomainObj *vm,
|
2021-07-14 16:46:54 +02:00
|
|
|
virDomainMemoryDef *mem,
|
|
|
|
bool *created)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
2020-07-21 13:30:31 +02:00
|
|
|
|
2020-07-20 18:01:16 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
2020-07-21 13:30:31 +02:00
|
|
|
if (qemuDomainSetupMemory(mem, &paths) < 0)
|
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-07-14 16:46:54 +02:00
|
|
|
if (qemuNamespaceMknodPaths(vm, paths, created) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceTeardownMemory(virDomainObj *vm,
|
|
|
|
virDomainMemoryDef *mem)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
2020-07-21 15:09:30 +02:00
|
|
|
|
2020-07-20 18:01:16 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
2020-07-21 15:09:30 +02:00
|
|
|
if (qemuDomainSetupMemory(mem, &paths) < 0)
|
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (qemuNamespaceUnlinkPaths(vm, paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceSetupChardev(virDomainObj *vm,
|
2021-07-14 16:46:54 +02:00
|
|
|
virDomainChrDef *chr,
|
|
|
|
bool *created)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 18:01:16 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
2020-07-21 14:26:49 +02:00
|
|
|
if (qemuDomainSetupChardev(vm->def, chr, &paths) < 0)
|
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-07-14 16:46:54 +02:00
|
|
|
if (qemuNamespaceMknodPaths(vm, paths, created) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceTeardownChardev(virDomainObj *vm,
|
|
|
|
virDomainChrDef *chr)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 18:01:16 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
2020-07-21 16:25:44 +02:00
|
|
|
if (qemuDomainSetupChardev(vm->def, chr, &paths) < 0)
|
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (qemuNamespaceUnlinkPaths(vm, paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceSetupRNG(virDomainObj *vm,
|
2021-07-14 16:46:54 +02:00
|
|
|
virDomainRNGDef *rng,
|
|
|
|
bool *created)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 18:01:16 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
2020-07-21 14:37:22 +02:00
|
|
|
if (qemuDomainSetupRNG(rng, &paths) < 0)
|
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-07-14 16:46:54 +02:00
|
|
|
if (qemuNamespaceMknodPaths(vm, paths, created) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceTeardownRNG(virDomainObj *vm,
|
|
|
|
virDomainRNGDef *rng)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 18:01:16 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
2020-07-21 16:26:48 +02:00
|
|
|
if (qemuDomainSetupRNG(rng, &paths) < 0)
|
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (qemuNamespaceUnlinkPaths(vm, paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceSetupInput(virDomainObj *vm,
|
2021-07-14 16:46:54 +02:00
|
|
|
virDomainInputDef *input,
|
|
|
|
bool *created)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
2021-07-14 16:46:54 +02:00
|
|
|
int ret = 0;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 18:01:16 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
2020-07-21 14:34:22 +02:00
|
|
|
if (qemuDomainSetupInput(input, &paths) < 0)
|
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-07-14 16:46:54 +02:00
|
|
|
if ((ret = qemuNamespaceMknodPaths(vm, paths, created)) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
2021-07-14 16:46:54 +02:00
|
|
|
|
2020-07-20 16:18:57 +02:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2021-03-11 08:16:13 +01:00
|
|
|
qemuDomainNamespaceTeardownInput(virDomainObj *vm,
|
|
|
|
virDomainInputDef *input)
|
2020-07-20 16:18:57 +02:00
|
|
|
{
|
2021-02-04 14:10:42 +01:00
|
|
|
g_autoptr(virGSListString) paths = NULL;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2020-07-20 18:01:16 +02:00
|
|
|
if (!qemuDomainNamespaceEnabled(vm, QEMU_DOMAIN_NS_MOUNT))
|
|
|
|
return 0;
|
|
|
|
|
2020-07-21 16:27:52 +02:00
|
|
|
if (qemuDomainSetupInput(input, &paths) < 0)
|
|
|
|
return -1;
|
2020-07-20 16:18:57 +02:00
|
|
|
|
2021-02-04 14:10:42 +01:00
|
|
|
if (qemuNamespaceUnlinkPaths(vm, paths) < 0)
|
2020-07-20 16:18:57 +02:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|