Don't create dirs in cgroup controllers we don't want to use

Currently when getting an instance of virCgroupPtr we will
create the path in all cgroup controllers. Only at the virt
driver layer are we attempting to filter controllers. This
is bad because the mere act of creating the dirs in the
controllers can have a functional impact on the kernel,
particularly for performance.

Update the virCgroupForDriver() method to accept a bitmask
of controllers to use. Only create dirs in the controllers
that are requested. When creating cgroups for domains,
respect the active controller list from the parent cgroup

Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
This commit is contained in:
Daniel P. Berrange 2013-03-21 13:27:13 +00:00
parent 804a809a06
commit 56f27b3bbc
7 changed files with 115 additions and 107 deletions

View File

@ -530,7 +530,7 @@ virCgroupPtr virLXCCgroupCreate(virDomainDefPtr def)
int ret = -1; int ret = -1;
int rc; int rc;
rc = virCgroupForDriver("lxc", &driver, 1, 0); rc = virCgroupForDriver("lxc", &driver, 1, 0, -1);
if (rc != 0) { if (rc != 0) {
virReportSystemError(-rc, "%s", virReportSystemError(-rc, "%s",
_("Unable to get cgroup for driver")); _("Unable to get cgroup for driver"));

View File

@ -1459,7 +1459,7 @@ static int lxcStartup(bool privileged,
lxc_driver->log_libvirtd = 0; /* by default log to container logfile */ lxc_driver->log_libvirtd = 0; /* by default log to container logfile */
lxc_driver->have_netns = lxcCheckNetNsSupport(); lxc_driver->have_netns = lxcCheckNetNsSupport();
rc = virCgroupForDriver("lxc", &lxc_driver->cgroup, privileged, 1); rc = virCgroupForDriver("lxc", &lxc_driver->cgroup, privileged, 1, -1);
if (rc < 0) { if (rc < 0) {
char buf[1024] ATTRIBUTE_UNUSED; char buf[1024] ATTRIBUTE_UNUSED;
VIR_DEBUG("Unable to create cgroup for LXC driver: %s", VIR_DEBUG("Unable to create cgroup for LXC driver: %s",

View File

@ -57,8 +57,6 @@ bool qemuCgroupControllerActive(virQEMUDriverPtr driver,
goto cleanup; goto cleanup;
if (!virCgroupMounted(driver->cgroup, controller)) if (!virCgroupMounted(driver->cgroup, controller))
goto cleanup; goto cleanup;
if (cfg->cgroupControllers & (1 << controller))
ret = true;
cleanup: cleanup:
virObjectUnref(cfg); virObjectUnref(cfg);
@ -668,7 +666,7 @@ int qemuSetupCgroupForEmulator(virQEMUDriverPtr driver,
virDomainDefPtr def = vm->def; virDomainDefPtr def = vm->def;
unsigned long long period = vm->def->cputune.emulator_period; unsigned long long period = vm->def->cputune.emulator_period;
long long quota = vm->def->cputune.emulator_quota; long long quota = vm->def->cputune.emulator_quota;
int rc, i; int rc;
if ((period || quota) && if ((period || quota) &&
(!driver->cgroup || (!driver->cgroup ||
@ -697,23 +695,14 @@ int qemuSetupCgroupForEmulator(virQEMUDriverPtr driver,
goto cleanup; goto cleanup;
} }
for (i = 0; i < VIR_CGROUP_CONTROLLER_LAST; i++) { rc = virCgroupMoveTask(cgroup, cgroup_emulator);
if (i != VIR_CGROUP_CONTROLLER_CPU &&
i != VIR_CGROUP_CONTROLLER_CPUACCT &&
i != VIR_CGROUP_CONTROLLER_CPUSET)
continue;
if (!qemuCgroupControllerActive(driver, i))
continue;
rc = virCgroupMoveTask(cgroup, cgroup_emulator, i);
if (rc < 0) { if (rc < 0) {
virReportSystemError(-rc, virReportSystemError(-rc,
_("Unable to move tasks from domain cgroup to " _("Unable to move tasks from domain cgroup to "
"emulator cgroup in controller %d for %s"), "emulator cgroup for %s"),
i, vm->def->name); vm->def->name);
goto cleanup; goto cleanup;
} }
}
if (def->placement_mode == VIR_DOMAIN_CPU_PLACEMENT_MODE_AUTO) { if (def->placement_mode == VIR_DOMAIN_CPU_PLACEMENT_MODE_AUTO) {
if (!(cpumap = qemuPrepareCpumap(driver, nodemask))) if (!(cpumap = qemuPrepareCpumap(driver, nodemask)))

View File

@ -134,14 +134,7 @@ virQEMUDriverConfigPtr virQEMUDriverConfigNew(bool privileged)
} }
cfg->dynamicOwnership = privileged; cfg->dynamicOwnership = privileged;
cfg->cgroupControllers = cfg->cgroupControllers = -1; /* -1 == auto-detect */
(1 << VIR_CGROUP_CONTROLLER_CPU) |
(1 << VIR_CGROUP_CONTROLLER_DEVICES) |
(1 << VIR_CGROUP_CONTROLLER_MEMORY) |
(1 << VIR_CGROUP_CONTROLLER_BLKIO) |
(1 << VIR_CGROUP_CONTROLLER_CPUSET) |
(1 << VIR_CGROUP_CONTROLLER_CPUACCT);
if (privileged) { if (privileged) {
if (virAsprintf(&cfg->logDir, if (virAsprintf(&cfg->logDir,
@ -454,6 +447,7 @@ int virQEMUDriverConfigLoadFile(virQEMUDriverConfigPtr cfg,
p = virConfGetValue(conf, "cgroup_controllers"); p = virConfGetValue(conf, "cgroup_controllers");
CHECK_TYPE("cgroup_controllers", VIR_CONF_LIST); CHECK_TYPE("cgroup_controllers", VIR_CONF_LIST);
if (p) { if (p) {
cfg->cgroupControllers = 0;
virConfValuePtr pp; virConfValuePtr pp;
for (i = 0, pp = p->list; pp; ++i, pp = pp->next) { for (i = 0, pp = p->list; pp; ++i, pp = pp->next) {
int ctl; int ctl;
@ -472,12 +466,6 @@ int virQEMUDriverConfigLoadFile(virQEMUDriverConfigPtr cfg,
cfg->cgroupControllers |= (1 << ctl); cfg->cgroupControllers |= (1 << ctl);
} }
} }
for (i = 0 ; i < VIR_CGROUP_CONTROLLER_LAST ; i++) {
if (cfg->cgroupControllers & (1 << i)) {
VIR_INFO("Configured cgroup controller '%s'",
virCgroupControllerTypeToString(i));
}
}
p = virConfGetValue(conf, "cgroup_device_acl"); p = virConfGetValue(conf, "cgroup_device_acl");
CHECK_TYPE("cgroup_device_acl", VIR_CONF_LIST); CHECK_TYPE("cgroup_device_acl", VIR_CONF_LIST);

View File

@ -628,7 +628,8 @@ qemuStartup(bool privileged,
goto error; goto error;
} }
rc = virCgroupForDriver("qemu", &qemu_driver->cgroup, privileged, 1); rc = virCgroupForDriver("qemu", &qemu_driver->cgroup, privileged, 1,
cfg->cgroupControllers);
if (rc < 0) { if (rc < 0) {
VIR_INFO("Unable to create cgroup for driver: %s", VIR_INFO("Unable to create cgroup for driver: %s",
virStrerror(-rc, ebuf, sizeof(ebuf))); virStrerror(-rc, ebuf, sizeof(ebuf)));

View File

@ -70,8 +70,6 @@ typedef enum {
* before creating subcgroups and * before creating subcgroups and
* attaching tasks * attaching tasks
*/ */
VIR_CGROUP_VCPU = 1 << 1, /* create subdir only under the cgroup cpu,
* cpuacct and cpuset if possible. */
} virCgroupFlags; } virCgroupFlags;
/** /**
@ -230,11 +228,12 @@ no_memory:
} }
static int virCgroupDetect(virCgroupPtr group) static int virCgroupDetect(virCgroupPtr group,
int controllers)
{ {
int any = 0;
int rc; int rc;
int i; int i;
int j;
rc = virCgroupDetectMounts(group); rc = virCgroupDetectMounts(group);
if (rc < 0) { if (rc < 0) {
@ -242,14 +241,55 @@ static int virCgroupDetect(virCgroupPtr group)
return rc; return rc;
} }
/* Check that at least 1 controller is available */ if (controllers >= 0) {
VIR_DEBUG("Validating controllers %d", controllers);
for (i = 0 ; i < VIR_CGROUP_CONTROLLER_LAST ; i++) { for (i = 0 ; i < VIR_CGROUP_CONTROLLER_LAST ; i++) {
if (group->controllers[i].mountPoint != NULL) VIR_DEBUG("Controller '%s' wanted=%s",
any = 1; virCgroupControllerTypeToString(i),
(1 << i) & controllers ? "yes" : "no");
if (((1 << i) & controllers)) {
/* Ensure requested controller is present */
if (!group->controllers[i].mountPoint) {
VIR_DEBUG("Requested controlled '%s' not mounted",
virCgroupControllerTypeToString(i));
return -ENOENT;
} }
if (!any) } else {
return -ENXIO; /* Check whether a request to disable a controller
* clashes with co-mounting of controllers */
for (j = 0 ; j < VIR_CGROUP_CONTROLLER_LAST ; j++) {
if (j == i)
continue;
if (!((1 << j) & controllers))
continue;
if (STREQ_NULLABLE(group->controllers[i].mountPoint,
group->controllers[j].mountPoint)) {
VIR_DEBUG("Controller '%s' is not wanted, but '%s' is co-mounted",
virCgroupControllerTypeToString(i),
virCgroupControllerTypeToString(j));
return -EINVAL;
}
}
VIR_FREE(group->controllers[i].mountPoint);
}
}
} else {
VIR_DEBUG("Auto-detecting controllers");
controllers = 0;
for (i = 0 ; i < VIR_CGROUP_CONTROLLER_LAST ; i++) {
VIR_DEBUG("Controller '%s' present=%s",
virCgroupControllerTypeToString(i),
group->controllers[i].mountPoint ? "yes" : "no");
if (group->controllers[i].mountPoint == NULL)
continue;
controllers |= (1 << i);
}
}
/* Check that at least 1 controller is available */
if (!controllers)
return -ENXIO;
rc = virCgroupDetectPlacement(group); rc = virCgroupDetectPlacement(group);
@ -542,16 +582,6 @@ static int virCgroupMakeGroup(virCgroupPtr parent,
if (!group->controllers[i].mountPoint) if (!group->controllers[i].mountPoint)
continue; continue;
/* We need to control cpu bandwidth for each vcpu now */
if ((flags & VIR_CGROUP_VCPU) &&
(i != VIR_CGROUP_CONTROLLER_CPU &&
i != VIR_CGROUP_CONTROLLER_CPUACCT &&
i != VIR_CGROUP_CONTROLLER_CPUSET)) {
/* treat it as unmounted and we can use virCgroupAddTask */
VIR_FREE(group->controllers[i].mountPoint);
continue;
}
rc = virCgroupPathOfController(group, i, "", &path); rc = virCgroupPathOfController(group, i, "", &path);
if (rc < 0) if (rc < 0)
return rc; return rc;
@ -611,12 +641,13 @@ static int virCgroupMakeGroup(virCgroupPtr parent,
static int virCgroupNew(const char *path, static int virCgroupNew(const char *path,
int controllers,
virCgroupPtr *group) virCgroupPtr *group)
{ {
int rc = 0; int rc = 0;
char *typpath = NULL; char *typpath = NULL;
VIR_DEBUG("New group %s", path); VIR_DEBUG("path=%s controllers=%d", path, controllers);
*group = NULL; *group = NULL;
if (VIR_ALLOC((*group)) != 0) { if (VIR_ALLOC((*group)) != 0) {
@ -629,7 +660,7 @@ static int virCgroupNew(const char *path,
goto err; goto err;
} }
rc = virCgroupDetect(*group); rc = virCgroupDetect(*group, controllers);
if (rc < 0) if (rc < 0)
goto err; goto err;
@ -645,17 +676,18 @@ err:
static int virCgroupAppRoot(bool privileged, static int virCgroupAppRoot(bool privileged,
virCgroupPtr *group, virCgroupPtr *group,
bool create) bool create,
int controllers)
{ {
virCgroupPtr rootgrp = NULL; virCgroupPtr rootgrp = NULL;
int rc; int rc;
rc = virCgroupNew("/", &rootgrp); rc = virCgroupNew("/", controllers, &rootgrp);
if (rc != 0) if (rc != 0)
return rc; return rc;
if (privileged) { if (privileged) {
rc = virCgroupNew("/libvirt", group); rc = virCgroupNew("/libvirt", controllers, group);
} else { } else {
char *rootname; char *rootname;
char *username; char *username;
@ -671,7 +703,7 @@ static int virCgroupAppRoot(bool privileged,
goto cleanup; goto cleanup;
} }
rc = virCgroupNew(rootname, group); rc = virCgroupNew(rootname, controllers, group);
VIR_FREE(rootname); VIR_FREE(rootname);
} }
if (rc != 0) if (rc != 0)
@ -779,6 +811,7 @@ int virCgroupRemove(virCgroupPtr group)
return rc; return rc;
} }
/** /**
* virCgroupAddTask: * virCgroupAddTask:
* *
@ -872,45 +905,30 @@ cleanup:
* *
* Returns: 0 on success or -errno on failure * Returns: 0 on success or -errno on failure
*/ */
int virCgroupMoveTask(virCgroupPtr src_group, virCgroupPtr dest_group, int virCgroupMoveTask(virCgroupPtr src_group, virCgroupPtr dest_group)
int controller)
{ {
int rc = 0, err = 0; int rc = 0;
char *content = NULL; char *content = NULL;
int i;
if (controller < VIR_CGROUP_CONTROLLER_CPU || for (i = 0 ; i < VIR_CGROUP_CONTROLLER_LAST ; i++) {
controller > VIR_CGROUP_CONTROLLER_BLKIO) if (!src_group->controllers[i].mountPoint ||
return -EINVAL; !dest_group->controllers[i].mountPoint)
continue;
if (!src_group->controllers[controller].mountPoint || rc = virCgroupGetValueStr(src_group, i, "tasks", &content);
!dest_group->controllers[controller].mountPoint) {
return -EINVAL;
}
rc = virCgroupGetValueStr(src_group, controller, "tasks", &content);
if (rc != 0) if (rc != 0)
return rc; return rc;
rc = virCgroupAddTaskStrController(dest_group, content, controller); rc = virCgroupAddTaskStrController(dest_group, content, i);
if (rc != 0) if (rc != 0)
goto cleanup; goto cleanup;
VIR_FREE(content); VIR_FREE(content);
}
return 0;
cleanup: cleanup:
/*
* We don't need to recover dest_cgroup because cgroup will make sure
* that one task only resides in one cgroup of the same controller.
*/
err = virCgroupAddTaskStrController(src_group, content, controller);
if (err != 0)
VIR_ERROR(_("Cannot recover cgroup %s from %s"),
src_group->controllers[controller].mountPoint,
dest_group->controllers[controller].mountPoint);
VIR_FREE(content); VIR_FREE(content);
return rc; return rc;
} }
@ -926,13 +944,15 @@ cleanup:
int virCgroupForDriver(const char *name, int virCgroupForDriver(const char *name,
virCgroupPtr *group, virCgroupPtr *group,
bool privileged, bool privileged,
bool create) bool create,
int controllers)
{ {
int rc; int rc;
char *path = NULL; char *path = NULL;
virCgroupPtr rootgrp = NULL; virCgroupPtr rootgrp = NULL;
rc = virCgroupAppRoot(privileged, &rootgrp, create); rc = virCgroupAppRoot(privileged, &rootgrp,
create, controllers);
if (rc != 0) if (rc != 0)
goto out; goto out;
@ -941,7 +961,7 @@ int virCgroupForDriver(const char *name,
goto out; goto out;
} }
rc = virCgroupNew(path, group); rc = virCgroupNew(path, controllers, group);
VIR_FREE(path); VIR_FREE(path);
if (rc == 0) { if (rc == 0) {
@ -979,7 +999,7 @@ int virCgroupForDriver(const char *name ATTRIBUTE_UNUSED,
#if defined HAVE_MNTENT_H && defined HAVE_GETMNTENT_R #if defined HAVE_MNTENT_H && defined HAVE_GETMNTENT_R
int virCgroupForSelf(virCgroupPtr *group) int virCgroupForSelf(virCgroupPtr *group)
{ {
return virCgroupNew("/", group); return virCgroupNew("/", -1, group);
} }
#else #else
int virCgroupForSelf(virCgroupPtr *group ATTRIBUTE_UNUSED) int virCgroupForSelf(virCgroupPtr *group ATTRIBUTE_UNUSED)
@ -1012,7 +1032,7 @@ int virCgroupForDomain(virCgroupPtr driver,
if (virAsprintf(&path, "%s/%s", driver->path, name) < 0) if (virAsprintf(&path, "%s/%s", driver->path, name) < 0)
return -ENOMEM; return -ENOMEM;
rc = virCgroupNew(path, group); rc = virCgroupNew(path, -1, group);
VIR_FREE(path); VIR_FREE(path);
if (rc == 0) { if (rc == 0) {
@ -1060,6 +1080,7 @@ int virCgroupForVcpu(virCgroupPtr driver,
{ {
int rc; int rc;
char *path; char *path;
int controllers;
if (driver == NULL) if (driver == NULL)
return -EINVAL; return -EINVAL;
@ -1067,11 +1088,15 @@ int virCgroupForVcpu(virCgroupPtr driver,
if (virAsprintf(&path, "%s/vcpu%d", driver->path, vcpuid) < 0) if (virAsprintf(&path, "%s/vcpu%d", driver->path, vcpuid) < 0)
return -ENOMEM; return -ENOMEM;
rc = virCgroupNew(path, group); controllers = ((1 << VIR_CGROUP_CONTROLLER_CPU) |
(1 << VIR_CGROUP_CONTROLLER_CPUACCT) |
(1 << VIR_CGROUP_CONTROLLER_CPUSET));
rc = virCgroupNew(path, controllers, group);
VIR_FREE(path); VIR_FREE(path);
if (rc == 0) { if (rc == 0) {
rc = virCgroupMakeGroup(driver, *group, create, VIR_CGROUP_VCPU); rc = virCgroupMakeGroup(driver, *group, create, VIR_CGROUP_NONE);
if (rc != 0) if (rc != 0)
virCgroupFree(group); virCgroupFree(group);
} }
@ -1103,6 +1128,7 @@ int virCgroupForEmulator(virCgroupPtr driver,
{ {
int rc; int rc;
char *path; char *path;
int controllers;
if (driver == NULL) if (driver == NULL)
return -EINVAL; return -EINVAL;
@ -1110,11 +1136,15 @@ int virCgroupForEmulator(virCgroupPtr driver,
if (virAsprintf(&path, "%s/emulator", driver->path) < 0) if (virAsprintf(&path, "%s/emulator", driver->path) < 0)
return -ENOMEM; return -ENOMEM;
rc = virCgroupNew(path, group); controllers = ((1 << VIR_CGROUP_CONTROLLER_CPU) |
(1 << VIR_CGROUP_CONTROLLER_CPUACCT) |
(1 << VIR_CGROUP_CONTROLLER_CPUSET));
rc = virCgroupNew(path, controllers, group);
VIR_FREE(path); VIR_FREE(path);
if (rc == 0) { if (rc == 0) {
rc = virCgroupMakeGroup(driver, *group, create, VIR_CGROUP_VCPU); rc = virCgroupMakeGroup(driver, *group, create, VIR_CGROUP_NONE);
if (rc != 0) if (rc != 0)
virCgroupFree(group); virCgroupFree(group);
} }
@ -2014,7 +2044,7 @@ static int virCgroupKillRecursiveInternal(virCgroupPtr group, int signum, virHas
goto cleanup; goto cleanup;
} }
if ((rc = virCgroupNew(subpath, &subgroup)) != 0) if ((rc = virCgroupNew(subpath, -1, &subgroup)) != 0)
goto cleanup; goto cleanup;
if ((rc = virCgroupKillRecursiveInternal(subgroup, signum, pids, true)) < 0) if ((rc = virCgroupKillRecursiveInternal(subgroup, signum, pids, true)) < 0)

View File

@ -47,7 +47,8 @@ VIR_ENUM_DECL(virCgroupController);
int virCgroupForDriver(const char *name, int virCgroupForDriver(const char *name,
virCgroupPtr *group, virCgroupPtr *group,
bool privileged, bool privileged,
bool create); bool create,
int controllers);
int virCgroupForSelf(virCgroupPtr *group); int virCgroupForSelf(virCgroupPtr *group);
@ -77,8 +78,7 @@ int virCgroupAddTaskController(virCgroupPtr group,
int controller); int controller);
int virCgroupMoveTask(virCgroupPtr src_group, int virCgroupMoveTask(virCgroupPtr src_group,
virCgroupPtr dest_group, virCgroupPtr dest_group);
int controller);
int virCgroupSetBlkioWeight(virCgroupPtr group, unsigned int weight); int virCgroupSetBlkioWeight(virCgroupPtr group, unsigned int weight);
int virCgroupGetBlkioWeight(virCgroupPtr group, unsigned int *weight); int virCgroupGetBlkioWeight(virCgroupPtr group, unsigned int *weight);