2007-07-25 23:16:30 +00:00
|
|
|
/*
|
|
|
|
* nodeinfo.c: Helper routines for OS specific node information
|
|
|
|
*
|
2015-07-06 21:03:51 +00:00
|
|
|
* Copyright (C) 2006-2008, 2010-2015 Red Hat, Inc.
|
2007-07-25 23:16:30 +00:00
|
|
|
* Copyright (C) 2006 Daniel P. Berrange
|
|
|
|
*
|
|
|
|
* This library is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This library is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Lesser General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Lesser General Public
|
2012-09-20 22:30:55 +00:00
|
|
|
* License along with this library. If not, see
|
2012-07-21 10:06:23 +00:00
|
|
|
* <http://www.gnu.org/licenses/>.
|
2007-07-25 23:16:30 +00:00
|
|
|
*
|
|
|
|
* Author: Daniel P. Berrange <berrange@redhat.com>
|
|
|
|
*/
|
|
|
|
|
2008-01-29 18:15:54 +00:00
|
|
|
#include <config.h>
|
2007-12-05 21:40:15 +00:00
|
|
|
|
2007-07-25 23:16:30 +00:00
|
|
|
#include <stdio.h>
|
|
|
|
#include <string.h>
|
|
|
|
#include <stdlib.h>
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
#include <stdint.h>
|
2007-07-25 23:16:30 +00:00
|
|
|
#include <errno.h>
|
2010-03-04 22:28:40 +00:00
|
|
|
#include <dirent.h>
|
2010-04-29 03:06:46 +00:00
|
|
|
#include <sys/utsname.h>
|
2012-03-02 02:54:22 +00:00
|
|
|
#include "conf/domain_conf.h"
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
#include <fcntl.h>
|
|
|
|
#include <sys/ioctl.h>
|
|
|
|
|
|
|
|
#if HAVE_LINUX_KVM_H
|
|
|
|
# include <linux/kvm.h>
|
|
|
|
#endif
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
|
2013-10-05 05:56:37 +00:00
|
|
|
#if defined(__FreeBSD__) || defined(__APPLE__)
|
2014-01-28 17:49:24 +00:00
|
|
|
# include <sys/time.h>
|
2012-12-17 18:12:44 +00:00
|
|
|
# include <sys/types.h>
|
|
|
|
# include <sys/sysctl.h>
|
2014-01-28 17:49:24 +00:00
|
|
|
# include <sys/resource.h>
|
2012-12-17 18:12:44 +00:00
|
|
|
#endif
|
|
|
|
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
#include "c-ctype.h"
|
2012-12-12 18:06:53 +00:00
|
|
|
#include "viralloc.h"
|
2014-01-22 11:56:06 +00:00
|
|
|
#include "nodeinfopriv.h"
|
2015-06-26 22:27:29 +00:00
|
|
|
#include "nodeinfo.h"
|
Use gnulib, starting with its physmem and getaddrinfo modules.
New files go into these directories:
gnulib/lib
gnulib/m4
gnulib/tests
* bootstrap: A wrapper around gnulib-tool.
* configure.in: Invoke gl_EARLY and gl_INIT, being careful to put gl_EARLY
before any macro that uses AC_COMPILE_IFELSE.
(AC_OUTPUT): Add lib/Makefile and gl-tests/Makefile. Remove m4/Makefile.
* Makefile.am (SUBDIRS): Add gnulib/lib and remove m4. Add gnulib/tests
early enough that those tests run before any libvirt unit tests.
* m4/Makefile.am: Remove file. Not needed.
* src/Makefile.am (INCLUDES): Add -I$(top_srcdir)/gnulib/lib -I../gnulib/lib.
(LDADDS, libvirt_la_LIBADD): Add ../gnulib/lib/libgnu.la.
* src/nodeinfo.c: Include "physmem.h".
* qemud/qemud.c, src/remote_internal.c: Include "getaddrinfo.h".
(MEMINFO_PATH, linuxNodeInfoMemPopulate): Remove definitions.
(virNodeInfoPopulate): Use physmem_total, not linuxNodeInfoMemPopulate.
* tests/Makefile.am (INCLUDES): Add -I$(top_srcdir)/gnulib/lib -I../gnulib/lib.
(LDADDS): Add ../gnulib/lib/libgnu.la.
* qemud/Makefile.am (libvirtd_LDADD): Add ../gnulib/lib/libgnu.la.
* tests/nodeinfotest.c (linuxTestCompareFiles): No longer read total
memory from a file.
Update expected output not to include "Memory: NNNN"
* tests/nodeinfodata/linux-nodeinfo-1.txt:
* tests/nodeinfodata/linux-nodeinfo-2.txt:
* tests/nodeinfodata/linux-nodeinfo-3.txt:
* tests/nodeinfodata/linux-nodeinfo-4.txt:
* tests/nodeinfodata/linux-nodeinfo-5.txt:
* tests/nodeinfodata/linux-nodeinfo-6.txt:
* src/test.c [WITH_TEST]: Remove definition of _GNU_SOURCE that
would conflict with the one now in "config.h".
* autogen.sh: Add -I gnulib/m4.
* src/conf.c, src/sexpr.c: Don't define _GNU_SOURCE.
Instead, include "config.h".
* qemud/qemud.c: Remove definition of _GNU_SOURCE.
* src/openvz_driver.c: Likewise.
* src/qemu_driver.c: Likewise.
* src/remote_internal.c: Likewise.
* configure.in: Use AC_CONFIG_AUX_DIR(build-aux), so that a bunch
of gettextize-generated files go into build-aux/, rather than in
the top-level directory.
* .cvsignore: Adjust.
* build-aux/.cvsignore: New file.
Author: Jim Meyering <meyering@redhat.com>
2007-12-05 21:31:07 +00:00
|
|
|
#include "physmem.h"
|
2012-12-13 18:21:53 +00:00
|
|
|
#include "virerror.h"
|
2010-03-04 22:28:40 +00:00
|
|
|
#include "count-one-bits.h"
|
2010-08-10 21:33:37 +00:00
|
|
|
#include "intprops.h"
|
2012-12-10 21:58:16 +00:00
|
|
|
#include "virarch.h"
|
2011-07-19 18:32:58 +00:00
|
|
|
#include "virfile.h"
|
2012-09-14 14:42:16 +00:00
|
|
|
#include "virtypedparam.h"
|
2013-04-03 10:36:23 +00:00
|
|
|
#include "virstring.h"
|
2013-10-17 14:57:29 +00:00
|
|
|
#include "virnuma.h"
|
2014-06-17 10:25:23 +00:00
|
|
|
#include "virlog.h"
|
2009-01-20 17:13:33 +00:00
|
|
|
|
|
|
|
#define VIR_FROM_THIS VIR_FROM_NONE
|
|
|
|
|
2014-06-17 10:25:23 +00:00
|
|
|
VIR_LOG_INIT("nodeinfo");
|
|
|
|
|
2015-07-17 17:07:45 +00:00
|
|
|
#define SYSFS_SYSTEM_PATH "/sys/devices/system"
|
|
|
|
|
2013-10-05 05:56:37 +00:00
|
|
|
#if defined(__FreeBSD__) || defined(__APPLE__)
|
2012-12-17 18:12:44 +00:00
|
|
|
static int
|
2013-10-05 05:56:37 +00:00
|
|
|
appleFreebsdNodeGetCPUCount(void)
|
2012-12-17 18:12:44 +00:00
|
|
|
{
|
|
|
|
int ncpu_mib[2] = { CTL_HW, HW_NCPU };
|
|
|
|
unsigned long ncpu;
|
|
|
|
size_t ncpu_len = sizeof(ncpu);
|
|
|
|
|
|
|
|
if (sysctl(ncpu_mib, 2, &ncpu, &ncpu_len, NULL, 0) == -1) {
|
|
|
|
virReportSystemError(errno, "%s", _("Cannot obtain CPU count"));
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return ncpu;
|
|
|
|
}
|
2013-10-20 15:14:52 +00:00
|
|
|
|
|
|
|
/* VIR_HW_PHYSMEM - the resulting value of HW_PHYSMEM of FreeBSD
|
|
|
|
* is 64 bits while that of Mac OS X is still 32 bits.
|
|
|
|
* Mac OS X provides HW_MEMSIZE for 64 bits version of HW_PHYSMEM
|
|
|
|
* since 10.6.8 (Snow Leopard) at least.
|
|
|
|
*/
|
|
|
|
# ifdef HW_MEMSIZE
|
|
|
|
# define VIR_HW_PHYSMEM HW_MEMSIZE
|
|
|
|
# else
|
|
|
|
# define VIR_HW_PHYSMEM HW_PHYSMEM
|
|
|
|
# endif
|
|
|
|
static int
|
|
|
|
appleFreebsdNodeGetMemorySize(unsigned long *memory)
|
|
|
|
{
|
|
|
|
int mib[2] = { CTL_HW, VIR_HW_PHYSMEM };
|
|
|
|
unsigned long physmem;
|
|
|
|
size_t len = sizeof(physmem);
|
|
|
|
|
|
|
|
if (sysctl(mib, 2, &physmem, &len, NULL, 0) == -1) {
|
|
|
|
virReportSystemError(errno, "%s", _("cannot obtain memory size"));
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
*memory = (unsigned long)(physmem / 1024);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
2014-01-03 18:35:50 +00:00
|
|
|
#endif /* defined(__FreeBSD__) || defined(__APPLE__) */
|
|
|
|
|
|
|
|
#ifdef __FreeBSD__
|
2014-01-28 17:49:24 +00:00
|
|
|
# define BSD_CPU_STATS_ALL 4
|
2014-01-03 18:35:50 +00:00
|
|
|
# define BSD_MEMORY_STATS_ALL 4
|
|
|
|
|
2014-01-28 17:49:24 +00:00
|
|
|
# define TICK_TO_NSEC (1000ull * 1000ull * 1000ull / (stathz ? stathz : hz))
|
|
|
|
|
|
|
|
static int
|
|
|
|
freebsdNodeGetCPUStats(int cpuNum,
|
|
|
|
virNodeCPUStatsPtr params,
|
|
|
|
int *nparams)
|
|
|
|
{
|
|
|
|
const char *sysctl_name;
|
|
|
|
long *cpu_times;
|
|
|
|
struct clockinfo clkinfo;
|
|
|
|
size_t i, j, cpu_times_size, clkinfo_size;
|
|
|
|
int cpu_times_num, offset, hz, stathz, ret = -1;
|
|
|
|
struct field_cpu_map {
|
|
|
|
const char *field;
|
|
|
|
int idx[CPUSTATES];
|
|
|
|
} cpu_map[] = {
|
|
|
|
{VIR_NODE_CPU_STATS_KERNEL, {CP_SYS}},
|
|
|
|
{VIR_NODE_CPU_STATS_USER, {CP_USER, CP_NICE}},
|
|
|
|
{VIR_NODE_CPU_STATS_IDLE, {CP_IDLE}},
|
|
|
|
{VIR_NODE_CPU_STATS_INTR, {CP_INTR}},
|
|
|
|
{NULL, {0}}
|
|
|
|
};
|
|
|
|
|
|
|
|
if ((*nparams) == 0) {
|
|
|
|
*nparams = BSD_CPU_STATS_ALL;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((*nparams) != BSD_CPU_STATS_ALL) {
|
|
|
|
virReportInvalidArg(*nparams,
|
|
|
|
_("nparams in %s must be equal to %d"),
|
|
|
|
__FUNCTION__, BSD_CPU_STATS_ALL);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
clkinfo_size = sizeof(clkinfo);
|
|
|
|
if (sysctlbyname("kern.clockrate", &clkinfo, &clkinfo_size, NULL, 0) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("sysctl failed for '%s'"),
|
|
|
|
"kern.clockrate");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
stathz = clkinfo.stathz;
|
|
|
|
hz = clkinfo.hz;
|
|
|
|
|
|
|
|
if (cpuNum == VIR_NODE_CPU_STATS_ALL_CPUS) {
|
|
|
|
sysctl_name = "kern.cp_time";
|
|
|
|
cpu_times_num = 1;
|
|
|
|
offset = 0;
|
|
|
|
} else {
|
|
|
|
sysctl_name = "kern.cp_times";
|
|
|
|
cpu_times_num = appleFreebsdNodeGetCPUCount();
|
|
|
|
|
|
|
|
if (cpuNum >= cpu_times_num) {
|
|
|
|
virReportInvalidArg(cpuNum,
|
|
|
|
_("Invalid cpuNum in %s"),
|
|
|
|
__FUNCTION__);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
offset = cpu_times_num * CPUSTATES;
|
|
|
|
}
|
|
|
|
|
|
|
|
cpu_times_size = sizeof(long) * cpu_times_num * CPUSTATES;
|
|
|
|
|
|
|
|
if (VIR_ALLOC_N(cpu_times, cpu_times_num * CPUSTATES) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (sysctlbyname(sysctl_name, cpu_times, &cpu_times_size, NULL, 0) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("sysctl failed for '%s'"),
|
|
|
|
sysctl_name);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; cpu_map[i].field != NULL; i++) {
|
|
|
|
virNodeCPUStatsPtr param = ¶ms[i];
|
|
|
|
|
|
|
|
if (virStrcpyStatic(param->field, cpu_map[i].field) == NULL) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("Field '%s' too long for destination"),
|
|
|
|
cpu_map[i].field);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
param->value = 0;
|
|
|
|
for (j = 0; j < ARRAY_CARDINALITY(cpu_map[i].idx); j++)
|
|
|
|
param->value += cpu_times[offset + cpu_map[i].idx[j]] * TICK_TO_NSEC;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = 0;
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2014-01-28 17:49:24 +00:00
|
|
|
VIR_FREE(cpu_times);
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2014-01-03 18:35:50 +00:00
|
|
|
static int
|
|
|
|
freebsdNodeGetMemoryStats(virNodeMemoryStatsPtr params,
|
2015-07-14 09:40:14 +00:00
|
|
|
int *nparams)
|
2014-01-03 18:35:50 +00:00
|
|
|
{
|
|
|
|
size_t i, j = 0;
|
|
|
|
unsigned long pagesize = getpagesize() >> 10;
|
|
|
|
long bufpages;
|
|
|
|
size_t bufpages_size = sizeof(bufpages);
|
|
|
|
struct field_sysctl_map {
|
|
|
|
const char *field;
|
|
|
|
const char *sysctl_name;
|
|
|
|
} sysctl_map[] = {
|
|
|
|
{VIR_NODE_MEMORY_STATS_TOTAL, "vm.stats.vm.v_page_count"},
|
|
|
|
{VIR_NODE_MEMORY_STATS_FREE, "vm.stats.vm.v_free_count"},
|
|
|
|
{VIR_NODE_MEMORY_STATS_CACHED, "vm.stats.vm.v_cache_count"},
|
|
|
|
{NULL, NULL}
|
|
|
|
};
|
|
|
|
|
|
|
|
if ((*nparams) == 0) {
|
|
|
|
*nparams = BSD_MEMORY_STATS_ALL;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((*nparams) != BSD_MEMORY_STATS_ALL) {
|
|
|
|
virReportInvalidArg(nparams,
|
|
|
|
_("nparams in %s must be %d"),
|
|
|
|
__FUNCTION__, BSD_MEMORY_STATS_ALL);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; sysctl_map[i].field != NULL; i++) {
|
|
|
|
u_int value;
|
|
|
|
size_t value_size = sizeof(value);
|
|
|
|
virNodeMemoryStatsPtr param;
|
|
|
|
|
|
|
|
if (sysctlbyname(sysctl_map[i].sysctl_name, &value,
|
|
|
|
&value_size, NULL, 0) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("sysctl failed for '%s'"),
|
|
|
|
sysctl_map[i].sysctl_name);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
param = ¶ms[j++];
|
|
|
|
if (virStrcpyStatic(param->field, sysctl_map[i].field) == NULL) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("Field '%s' too long for destination"),
|
|
|
|
sysctl_map[i].field);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
param->value = (unsigned long long)value * pagesize;
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
virNodeMemoryStatsPtr param = ¶ms[j++];
|
|
|
|
|
|
|
|
if (sysctlbyname("vfs.bufspace", &bufpages, &bufpages_size, NULL, 0) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("sysctl failed for '%s'"),
|
|
|
|
"vfs.bufspace");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
if (virStrcpyStatic(param->field, VIR_NODE_MEMORY_STATS_BUFFERS) == NULL) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("Field '%s' too long for destination"),
|
|
|
|
VIR_NODE_MEMORY_STATS_BUFFERS);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
param->value = (unsigned long long)bufpages >> 10;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
#endif /* __FreeBSD__ */
|
2012-12-17 18:12:44 +00:00
|
|
|
|
2007-07-25 23:16:30 +00:00
|
|
|
#ifdef __linux__
|
2010-03-09 18:22:22 +00:00
|
|
|
# define CPUINFO_PATH "/proc/cpuinfo"
|
2011-06-07 01:02:55 +00:00
|
|
|
# define PROCSTAT_PATH "/proc/stat"
|
2011-06-07 01:11:17 +00:00
|
|
|
# define MEMINFO_PATH "/proc/meminfo"
|
2012-09-14 14:42:16 +00:00
|
|
|
# define SYSFS_MEMORY_SHARED_PATH "/sys/kernel/mm/ksm"
|
2015-03-26 04:48:13 +00:00
|
|
|
# define SYSFS_THREAD_SIBLINGS_LIST_LENGTH_MAX 8192
|
2011-06-07 01:02:55 +00:00
|
|
|
|
|
|
|
# define LINUX_NB_CPU_STATS 4
|
2011-06-07 01:11:17 +00:00
|
|
|
# define LINUX_NB_MEMORY_STATS_ALL 4
|
|
|
|
# define LINUX_NB_MEMORY_STATS_CELL 2
|
2007-07-25 23:16:30 +00:00
|
|
|
|
2010-08-10 21:33:37 +00:00
|
|
|
/* Return the positive decimal contents of the given
|
2012-11-01 22:20:09 +00:00
|
|
|
* DIR/cpu%u/FILE, or -1 on error. If DEFAULT_VALUE is non-negative
|
|
|
|
* and the file could not be found, return that instead of an error;
|
|
|
|
* this is useful for machines that cannot hot-unplug cpu0, or where
|
|
|
|
* hot-unplugging is disabled, or where the kernel is too old
|
|
|
|
* to support NUMA cells, etc. */
|
2010-08-10 21:33:37 +00:00
|
|
|
static int
|
nodeinfo: drop static variable
We were wasting time to malloc a copy of a constant string, then
copy it into static storage, for every call to nodeGetInfo. At
least we were lucky that it was a constant source, and thus not
subject to even worse issues with one thread clobbering the static
storage while another was using it. This gets rid of the waste,
by passing the string through the stack instead, as well as renaming
internal functions to better match our conventions.
* src/nodeinfo.c (sysfs_path): Delete.
(get_cpu_value, count_thread_siblings, parse_socket): Add
parameter, and rename...
(virNodeGetCpuValue, virNodeCountThreadSiblings)
(virNodeParseSocket): ... into a common namespace.
(cpu_online, parse_core): Inline into callers.
(linuxNodeInfoCPUPopulate): Update caller.
(nodeGetInfo): Drop a useless malloc.
2012-05-11 18:50:08 +00:00
|
|
|
virNodeGetCpuValue(const char *dir, unsigned int cpu, const char *file,
|
2012-11-01 22:20:09 +00:00
|
|
|
int default_value)
|
2010-08-10 21:33:37 +00:00
|
|
|
{
|
|
|
|
char *path;
|
|
|
|
FILE *pathfp;
|
|
|
|
int value = -1;
|
|
|
|
char value_str[INT_BUFSIZE_BOUND(value)];
|
|
|
|
char *tmp;
|
|
|
|
|
2013-07-04 10:20:00 +00:00
|
|
|
if (virAsprintf(&path, "%s/cpu%u/%s", dir, cpu, file) < 0)
|
2010-08-10 21:33:37 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
pathfp = fopen(path, "r");
|
|
|
|
if (pathfp == NULL) {
|
2012-11-01 22:20:09 +00:00
|
|
|
if (default_value >= 0 && errno == ENOENT)
|
|
|
|
value = default_value;
|
2010-08-10 21:33:37 +00:00
|
|
|
else
|
|
|
|
virReportSystemError(errno, _("cannot open %s"), path);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (fgets(value_str, sizeof(value_str), pathfp) == NULL) {
|
|
|
|
virReportSystemError(errno, _("cannot read from %s"), path);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
if (virStrToLong_i(value_str, &tmp, 10, &value) < 0) {
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("could not convert '%s' to an integer"),
|
|
|
|
value_str);
|
2010-08-10 21:33:37 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2010-11-17 02:13:29 +00:00
|
|
|
VIR_FORCE_FCLOSE(pathfp);
|
2010-08-10 21:33:37 +00:00
|
|
|
VIR_FREE(path);
|
|
|
|
|
|
|
|
return value;
|
|
|
|
}
|
|
|
|
|
nodeinfo: drop static variable
We were wasting time to malloc a copy of a constant string, then
copy it into static storage, for every call to nodeGetInfo. At
least we were lucky that it was a constant source, and thus not
subject to even worse issues with one thread clobbering the static
storage while another was using it. This gets rid of the waste,
by passing the string through the stack instead, as well as renaming
internal functions to better match our conventions.
* src/nodeinfo.c (sysfs_path): Delete.
(get_cpu_value, count_thread_siblings, parse_socket): Add
parameter, and rename...
(virNodeGetCpuValue, virNodeCountThreadSiblings)
(virNodeParseSocket): ... into a common namespace.
(cpu_online, parse_core): Inline into callers.
(linuxNodeInfoCPUPopulate): Update caller.
(nodeGetInfo): Drop a useless malloc.
2012-05-11 18:50:08 +00:00
|
|
|
static unsigned long
|
|
|
|
virNodeCountThreadSiblings(const char *dir, unsigned int cpu)
|
2010-03-04 22:28:40 +00:00
|
|
|
{
|
|
|
|
unsigned long ret = 0;
|
2010-03-09 15:17:59 +00:00
|
|
|
char *path;
|
2015-03-26 04:48:13 +00:00
|
|
|
char *str = NULL;
|
Convert 'int i' to 'size_t i' in src/node_device/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 14:09:33 +00:00
|
|
|
size_t i;
|
2010-03-04 22:28:40 +00:00
|
|
|
|
2011-10-03 12:45:30 +00:00
|
|
|
if (virAsprintf(&path, "%s/cpu%u/topology/thread_siblings",
|
2013-07-04 10:20:00 +00:00
|
|
|
dir, cpu) < 0)
|
2010-03-04 22:28:40 +00:00
|
|
|
return 0;
|
|
|
|
|
2015-06-02 12:24:03 +00:00
|
|
|
if (!virFileExists(path)) {
|
2013-04-03 19:28:35 +00:00
|
|
|
/* If file doesn't exist, then pretend our only
|
|
|
|
* sibling is ourself */
|
2015-06-02 12:24:03 +00:00
|
|
|
ret = 1;
|
2015-03-26 04:48:13 +00:00
|
|
|
goto cleanup;
|
2015-06-02 12:24:03 +00:00
|
|
|
}
|
2015-03-26 04:48:13 +00:00
|
|
|
|
2015-06-02 12:24:03 +00:00
|
|
|
if (virFileReadAll(path, SYSFS_THREAD_SIBLINGS_LIST_LENGTH_MAX, &str) < 0)
|
2010-03-04 22:28:40 +00:00
|
|
|
goto cleanup;
|
|
|
|
|
2015-06-02 12:29:54 +00:00
|
|
|
for (i = 0; str[i] != '\0'; i++) {
|
|
|
|
if (c_isxdigit(str[i]))
|
|
|
|
ret += count_one_bits(virHexToBin(str[i]));
|
2010-03-04 22:28:40 +00:00
|
|
|
}
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2015-03-26 04:48:13 +00:00
|
|
|
VIR_FREE(str);
|
2010-03-04 22:28:40 +00:00
|
|
|
VIR_FREE(path);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
nodeinfo: drop static variable
We were wasting time to malloc a copy of a constant string, then
copy it into static storage, for every call to nodeGetInfo. At
least we were lucky that it was a constant source, and thus not
subject to even worse issues with one thread clobbering the static
storage while another was using it. This gets rid of the waste,
by passing the string through the stack instead, as well as renaming
internal functions to better match our conventions.
* src/nodeinfo.c (sysfs_path): Delete.
(get_cpu_value, count_thread_siblings, parse_socket): Add
parameter, and rename...
(virNodeGetCpuValue, virNodeCountThreadSiblings)
(virNodeParseSocket): ... into a common namespace.
(cpu_online, parse_core): Inline into callers.
(linuxNodeInfoCPUPopulate): Update caller.
(nodeGetInfo): Drop a useless malloc.
2012-05-11 18:50:08 +00:00
|
|
|
static int
|
2014-06-17 11:58:48 +00:00
|
|
|
virNodeParseSocket(const char *dir,
|
|
|
|
virArch arch,
|
|
|
|
unsigned int cpu)
|
2010-03-04 22:28:40 +00:00
|
|
|
{
|
2014-06-17 11:58:48 +00:00
|
|
|
int ret = virNodeGetCpuValue(dir, cpu, "topology/physical_package_id", 0);
|
|
|
|
|
2014-06-17 09:22:05 +00:00
|
|
|
if (ARCH_IS_ARM(arch) || ARCH_IS_PPC(arch) || ARCH_IS_S390(arch)) {
|
|
|
|
/* arm, ppc and s390(x) has -1 */
|
2014-06-17 11:58:48 +00:00
|
|
|
if (ret < 0)
|
|
|
|
ret = 0;
|
|
|
|
}
|
|
|
|
|
2011-04-14 18:50:22 +00:00
|
|
|
return ret;
|
2010-03-04 22:28:40 +00:00
|
|
|
}
|
|
|
|
|
2012-07-09 14:57:49 +00:00
|
|
|
/* parses a node entry, returning number of processors in the node and
|
|
|
|
* filling arguments */
|
2012-05-11 19:59:59 +00:00
|
|
|
static int
|
2015-07-20 16:37:30 +00:00
|
|
|
ATTRIBUTE_NONNULL(1) ATTRIBUTE_NONNULL(3)
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
ATTRIBUTE_NONNULL(4) ATTRIBUTE_NONNULL(6)
|
|
|
|
ATTRIBUTE_NONNULL(7) ATTRIBUTE_NONNULL(8)
|
|
|
|
ATTRIBUTE_NONNULL(9)
|
2015-07-20 16:37:30 +00:00
|
|
|
virNodeParseNode(const char *node,
|
2014-06-17 11:58:48 +00:00
|
|
|
virArch arch,
|
2015-07-20 16:37:30 +00:00
|
|
|
virBitmapPtr present_cpus_map,
|
|
|
|
virBitmapPtr online_cpus_map,
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
int threads_per_subcore,
|
2012-11-07 13:53:36 +00:00
|
|
|
int *sockets,
|
|
|
|
int *cores,
|
|
|
|
int *threads,
|
|
|
|
int *offline)
|
2012-05-11 19:59:59 +00:00
|
|
|
{
|
2015-07-20 16:37:27 +00:00
|
|
|
/* Biggest value we can expect to be used as either socket id
|
|
|
|
* or core id. Bitmaps will need to be sized accordingly */
|
|
|
|
const int ID_MAX = 4095;
|
2012-05-11 19:59:59 +00:00
|
|
|
int ret = -1;
|
2012-07-09 14:57:49 +00:00
|
|
|
int processors = 0;
|
|
|
|
DIR *cpudir = NULL;
|
|
|
|
struct dirent *cpudirent = NULL;
|
2015-07-20 16:37:29 +00:00
|
|
|
virBitmapPtr node_cpus_map = NULL;
|
2015-07-20 16:37:27 +00:00
|
|
|
virBitmapPtr sockets_map = NULL;
|
|
|
|
virBitmapPtr *cores_maps = NULL;
|
2015-07-20 16:37:30 +00:00
|
|
|
int npresent_cpus = virBitmapSize(present_cpus_map);
|
2012-07-09 14:57:49 +00:00
|
|
|
int sock_max = 0;
|
|
|
|
int sock;
|
|
|
|
int core;
|
Convert 'int i' to 'size_t i' in src/node_device/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 14:09:33 +00:00
|
|
|
size_t i;
|
2012-07-09 14:57:49 +00:00
|
|
|
int siblings;
|
|
|
|
unsigned int cpu;
|
2014-04-20 11:53:46 +00:00
|
|
|
int direrr;
|
2012-05-11 19:59:59 +00:00
|
|
|
|
2012-07-09 14:57:49 +00:00
|
|
|
*threads = 0;
|
|
|
|
*cores = 0;
|
|
|
|
*sockets = 0;
|
|
|
|
|
|
|
|
if (!(cpudir = opendir(node))) {
|
|
|
|
virReportSystemError(errno, _("cannot opendir %s"), node);
|
2012-05-11 19:59:59 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
2012-07-09 14:57:49 +00:00
|
|
|
|
2015-07-20 16:37:29 +00:00
|
|
|
/* Keep track of the CPUs that belong to the current node */
|
|
|
|
if (!(node_cpus_map = virBitmapNew(npresent_cpus)))
|
|
|
|
goto cleanup;
|
|
|
|
|
2012-07-09 14:57:49 +00:00
|
|
|
/* enumerate sockets in the node */
|
2015-07-20 16:37:27 +00:00
|
|
|
if (!(sockets_map = virBitmapNew(ID_MAX + 1)))
|
|
|
|
goto cleanup;
|
|
|
|
|
2014-04-20 11:53:46 +00:00
|
|
|
while ((direrr = virDirRead(cpudir, &cpudirent, node)) > 0) {
|
2012-07-09 14:57:49 +00:00
|
|
|
if (sscanf(cpudirent->d_name, "cpu%u", &cpu) != 1)
|
|
|
|
continue;
|
|
|
|
|
2015-07-20 16:37:30 +00:00
|
|
|
if (!virBitmapIsBitSet(present_cpus_map, cpu))
|
2015-06-26 22:27:29 +00:00
|
|
|
continue;
|
|
|
|
|
2015-07-20 16:37:29 +00:00
|
|
|
/* Mark this CPU as part of the current node */
|
|
|
|
if (virBitmapSetBit(node_cpus_map, cpu) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
2015-07-20 16:37:28 +00:00
|
|
|
if (!virBitmapIsBitSet(online_cpus_map, cpu))
|
2012-07-18 01:46:29 +00:00
|
|
|
continue;
|
|
|
|
|
2012-07-09 14:57:49 +00:00
|
|
|
/* Parse socket */
|
2014-06-17 11:58:48 +00:00
|
|
|
if ((sock = virNodeParseSocket(node, arch, cpu)) < 0)
|
2012-11-01 22:20:09 +00:00
|
|
|
goto cleanup;
|
2015-07-20 16:37:27 +00:00
|
|
|
if (sock > ID_MAX) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("Socket %d can't be handled (max socket is %d)"),
|
|
|
|
sock, ID_MAX);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (virBitmapSetBit(sockets_map, sock) < 0)
|
|
|
|
goto cleanup;
|
2012-07-09 14:57:49 +00:00
|
|
|
|
|
|
|
if (sock > sock_max)
|
|
|
|
sock_max = sock;
|
|
|
|
}
|
|
|
|
|
2014-04-20 11:53:46 +00:00
|
|
|
if (direrr < 0)
|
2012-05-11 19:59:59 +00:00
|
|
|
goto cleanup;
|
2012-07-09 14:57:49 +00:00
|
|
|
|
|
|
|
sock_max++;
|
|
|
|
|
2015-07-20 16:37:27 +00:00
|
|
|
/* allocate cores maps for each socket */
|
|
|
|
if (VIR_ALLOC_N(cores_maps, sock_max) < 0)
|
2012-05-11 19:59:59 +00:00
|
|
|
goto cleanup;
|
2012-07-09 14:57:49 +00:00
|
|
|
|
|
|
|
for (i = 0; i < sock_max; i++)
|
2015-07-20 16:37:27 +00:00
|
|
|
if (!(cores_maps[i] = virBitmapNew(ID_MAX + 1)))
|
|
|
|
goto cleanup;
|
2012-07-09 14:57:49 +00:00
|
|
|
|
2015-07-20 16:37:29 +00:00
|
|
|
/* Iterate over all CPUs in the node, in ascending order */
|
|
|
|
for (cpu = 0; cpu < npresent_cpus; cpu++) {
|
2012-07-09 14:57:49 +00:00
|
|
|
|
2015-07-20 16:37:29 +00:00
|
|
|
/* Skip CPUs that are not part of the current node */
|
|
|
|
if (!virBitmapIsBitSet(node_cpus_map, cpu))
|
2015-06-26 22:27:29 +00:00
|
|
|
continue;
|
|
|
|
|
2015-07-20 16:37:28 +00:00
|
|
|
if (!virBitmapIsBitSet(online_cpus_map, cpu)) {
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
if (threads_per_subcore > 0 &&
|
|
|
|
cpu % threads_per_subcore != 0 &&
|
|
|
|
virBitmapIsBitSet(online_cpus_map,
|
|
|
|
cpu - (cpu % threads_per_subcore))) {
|
|
|
|
/* Secondary offline threads are counted as online when
|
|
|
|
* subcores are in use and the corresponding primary
|
|
|
|
* thread is online */
|
|
|
|
processors++;
|
|
|
|
} else {
|
|
|
|
/* But they are counted as offline otherwise */
|
|
|
|
(*offline)++;
|
|
|
|
}
|
2012-07-09 14:57:49 +00:00
|
|
|
continue;
|
2012-11-07 13:53:36 +00:00
|
|
|
}
|
2012-07-09 14:57:49 +00:00
|
|
|
|
|
|
|
processors++;
|
|
|
|
|
|
|
|
/* Parse socket */
|
2014-06-17 11:58:48 +00:00
|
|
|
if ((sock = virNodeParseSocket(node, arch, cpu)) < 0)
|
2012-11-01 22:20:09 +00:00
|
|
|
goto cleanup;
|
2015-07-20 16:37:27 +00:00
|
|
|
if (!virBitmapIsBitSet(sockets_map, sock)) {
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
|
|
|
|
_("CPU socket topology has changed"));
|
2012-07-09 14:57:49 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Parse core */
|
2014-06-17 11:58:48 +00:00
|
|
|
if (ARCH_IS_S390(arch)) {
|
|
|
|
/* logical cpu is equivalent to a core on s390 */
|
|
|
|
core = cpu;
|
|
|
|
} else {
|
2015-07-23 09:47:05 +00:00
|
|
|
if ((core = virNodeGetCpuValue(node, cpu,
|
|
|
|
"topology/core_id", 0)) < 0)
|
|
|
|
goto cleanup;
|
2014-06-17 11:58:48 +00:00
|
|
|
}
|
2015-07-20 16:37:27 +00:00
|
|
|
if (core > ID_MAX) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("Core %d can't be handled (max core is %d)"),
|
|
|
|
core, ID_MAX);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
2012-07-09 14:57:49 +00:00
|
|
|
|
2015-07-20 16:37:27 +00:00
|
|
|
if (virBitmapSetBit(cores_maps[sock], core) < 0)
|
|
|
|
goto cleanup;
|
2012-07-09 14:57:49 +00:00
|
|
|
|
|
|
|
if (!(siblings = virNodeCountThreadSiblings(node, cpu)))
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (siblings > *threads)
|
|
|
|
*threads = siblings;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* finalize the returned data */
|
2015-07-20 16:37:27 +00:00
|
|
|
*sockets = virBitmapCountBits(sockets_map);
|
2012-07-09 14:57:49 +00:00
|
|
|
|
|
|
|
for (i = 0; i < sock_max; i++) {
|
2015-07-20 16:37:27 +00:00
|
|
|
if (!virBitmapIsBitSet(sockets_map, i))
|
2012-07-09 14:57:49 +00:00
|
|
|
continue;
|
|
|
|
|
2015-07-20 16:37:27 +00:00
|
|
|
core = virBitmapCountBits(cores_maps[i]);
|
2012-07-09 14:57:49 +00:00
|
|
|
if (core > *cores)
|
|
|
|
*cores = core;
|
|
|
|
}
|
|
|
|
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
if (threads_per_subcore > 0) {
|
|
|
|
/* The thread count ignores offline threads, which means that only
|
|
|
|
* only primary threads have been considered so far. If subcores
|
|
|
|
* are in use, we need to also account for secondary threads */
|
|
|
|
*threads *= threads_per_subcore;
|
|
|
|
}
|
2012-07-09 14:57:49 +00:00
|
|
|
ret = processors;
|
2012-05-11 19:59:59 +00:00
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2012-07-09 14:57:49 +00:00
|
|
|
/* don't shadow a more serious error */
|
|
|
|
if (cpudir && closedir(cpudir) < 0 && ret >= 0) {
|
|
|
|
virReportSystemError(errno, _("problem closing %s"), node);
|
|
|
|
ret = -1;
|
|
|
|
}
|
2015-07-20 16:37:27 +00:00
|
|
|
if (cores_maps)
|
|
|
|
for (i = 0; i < sock_max; i++)
|
|
|
|
virBitmapFree(cores_maps[i]);
|
|
|
|
VIR_FREE(cores_maps);
|
|
|
|
virBitmapFree(sockets_map);
|
2015-07-20 16:37:29 +00:00
|
|
|
virBitmapFree(node_cpus_map);
|
2012-07-09 14:57:49 +00:00
|
|
|
|
2012-05-11 19:59:59 +00:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
/* Check whether the host subcore configuration is valid.
|
|
|
|
*
|
|
|
|
* A valid configuration is one where no secondary thread is online;
|
|
|
|
* the primary thread in a subcore is always the first one */
|
|
|
|
static bool
|
|
|
|
nodeHasValidSubcoreConfiguration(const char *sysfs_prefix,
|
|
|
|
int threads_per_subcore)
|
|
|
|
{
|
|
|
|
virBitmapPtr online_cpus = NULL;
|
|
|
|
int cpu = -1;
|
|
|
|
bool ret = false;
|
|
|
|
|
|
|
|
/* No point in checking if subcores are not in use */
|
|
|
|
if (threads_per_subcore <= 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (!(online_cpus = nodeGetOnlineCPUBitmap(sysfs_prefix)))
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
while ((cpu = virBitmapNextSetBit(online_cpus, cpu)) >= 0) {
|
|
|
|
|
|
|
|
/* A single online secondary thread is enough to
|
|
|
|
* make the configuration invalid */
|
|
|
|
if (cpu % threads_per_subcore != 0)
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = true;
|
|
|
|
|
|
|
|
cleanup:
|
|
|
|
virBitmapFree(online_cpus);
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2015-07-14 09:40:14 +00:00
|
|
|
int
|
|
|
|
linuxNodeInfoCPUPopulate(const char *sysfs_prefix,
|
|
|
|
FILE *cpuinfo,
|
|
|
|
virArch arch,
|
|
|
|
virNodeInfoPtr nodeinfo)
|
2010-03-04 22:28:40 +00:00
|
|
|
{
|
2015-07-14 09:40:13 +00:00
|
|
|
const char *prefix = sysfs_prefix ? sysfs_prefix : SYSFS_SYSTEM_PATH;
|
2015-07-20 16:37:30 +00:00
|
|
|
virBitmapPtr present_cpus_map = NULL;
|
|
|
|
virBitmapPtr online_cpus_map = NULL;
|
2007-07-25 23:16:30 +00:00
|
|
|
char line[1024];
|
2012-07-09 14:57:49 +00:00
|
|
|
DIR *nodedir = NULL;
|
|
|
|
struct dirent *nodedirent = NULL;
|
2012-11-07 13:53:36 +00:00
|
|
|
int cpus, cores, socks, threads, offline = 0;
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
int threads_per_subcore = 0;
|
2012-07-09 14:57:49 +00:00
|
|
|
unsigned int node;
|
2012-05-11 19:59:59 +00:00
|
|
|
int ret = -1;
|
2012-07-09 14:57:49 +00:00
|
|
|
char *sysfs_nodedir = NULL;
|
2012-05-11 19:59:59 +00:00
|
|
|
char *sysfs_cpudir = NULL;
|
2014-04-20 11:53:46 +00:00
|
|
|
int direrr;
|
2007-07-25 23:16:30 +00:00
|
|
|
|
2012-07-09 14:57:49 +00:00
|
|
|
/* Start with parsing CPU clock speed from /proc/cpuinfo */
|
2007-07-25 23:16:30 +00:00
|
|
|
while (fgets(line, sizeof(line), cpuinfo) != NULL) {
|
2014-06-17 10:25:23 +00:00
|
|
|
if (ARCH_IS_X86(arch)) {
|
|
|
|
char *buf = line;
|
|
|
|
if (STRPREFIX(buf, "cpu MHz")) {
|
|
|
|
char *p;
|
|
|
|
unsigned int ui;
|
|
|
|
|
|
|
|
buf += 7;
|
|
|
|
while (*buf && c_isspace(*buf))
|
|
|
|
buf++;
|
|
|
|
|
|
|
|
if (*buf != ':' || !buf[1]) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
|
|
|
|
_("parsing cpu MHz from cpuinfo"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
2012-05-14 13:12:53 +00:00
|
|
|
|
2014-06-17 10:25:23 +00:00
|
|
|
if (virStrToLong_ui(buf+1, &p, 10, &ui) == 0 &&
|
|
|
|
/* Accept trailing fractional part. */
|
|
|
|
(*p == '\0' || *p == '.' || c_isspace(*p)))
|
|
|
|
nodeinfo->mhz = ui;
|
2007-07-25 23:16:30 +00:00
|
|
|
}
|
2012-05-14 13:12:53 +00:00
|
|
|
|
2014-06-17 10:25:23 +00:00
|
|
|
} else if (ARCH_IS_PPC(arch)) {
|
|
|
|
char *buf = line;
|
|
|
|
if (STRPREFIX(buf, "clock")) {
|
|
|
|
char *p;
|
|
|
|
unsigned int ui;
|
2012-05-14 13:12:53 +00:00
|
|
|
|
2014-06-17 10:25:23 +00:00
|
|
|
buf += 5;
|
|
|
|
while (*buf && c_isspace(*buf))
|
|
|
|
buf++;
|
2012-05-14 13:12:53 +00:00
|
|
|
|
2014-06-17 10:25:23 +00:00
|
|
|
if (*buf != ':' || !buf[1]) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
|
|
|
|
_("parsing cpu MHz from cpuinfo"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
2012-05-14 13:12:53 +00:00
|
|
|
|
2014-06-17 10:25:23 +00:00
|
|
|
if (virStrToLong_ui(buf+1, &p, 10, &ui) == 0 &&
|
|
|
|
/* Accept trailing fractional part. */
|
|
|
|
(*p == '\0' || *p == '.' || c_isspace(*p)))
|
|
|
|
nodeinfo->mhz = ui;
|
|
|
|
/* No other interesting infos are available in /proc/cpuinfo.
|
|
|
|
* However, there is a line identifying processor's version,
|
|
|
|
* identification and machine, but we don't want it to be caught
|
|
|
|
* and parsed in next iteration, because it is not in expected
|
|
|
|
* format and thus lead to error. */
|
2011-04-14 18:50:22 +00:00
|
|
|
}
|
2014-06-17 10:25:23 +00:00
|
|
|
} else if (ARCH_IS_ARM(arch)) {
|
|
|
|
char *buf = line;
|
|
|
|
if (STRPREFIX(buf, "BogoMIPS")) {
|
|
|
|
char *p;
|
|
|
|
unsigned int ui;
|
2012-05-14 13:12:53 +00:00
|
|
|
|
2014-06-17 10:25:23 +00:00
|
|
|
buf += 8;
|
|
|
|
while (*buf && c_isspace(*buf))
|
|
|
|
buf++;
|
2012-07-26 13:32:07 +00:00
|
|
|
|
2014-06-17 10:25:23 +00:00
|
|
|
if (*buf != ':' || !buf[1]) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("parsing cpu MHz from cpuinfo"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
2012-07-26 13:32:07 +00:00
|
|
|
|
2014-06-17 10:25:23 +00:00
|
|
|
if (virStrToLong_ui(buf+1, &p, 10, &ui) == 0
|
|
|
|
/* Accept trailing fractional part. */
|
|
|
|
&& (*p == '\0' || *p == '.' || c_isspace(*p)))
|
|
|
|
nodeinfo->mhz = ui;
|
2012-07-26 13:32:07 +00:00
|
|
|
}
|
2014-06-17 10:25:23 +00:00
|
|
|
} else if (ARCH_IS_S390(arch)) {
|
|
|
|
/* s390x has no realistic value for CPU speed,
|
|
|
|
* assign a value of zero to signify this */
|
|
|
|
nodeinfo->mhz = 0;
|
|
|
|
} else {
|
|
|
|
VIR_WARN("Parser for /proc/cpuinfo needs to be adapted for your architecture");
|
|
|
|
break;
|
2012-07-26 13:32:07 +00:00
|
|
|
}
|
2007-07-25 23:16:30 +00:00
|
|
|
}
|
|
|
|
|
2015-07-20 16:37:30 +00:00
|
|
|
/* Get information about what CPUs are present in the host and what
|
|
|
|
* CPUs are online, so that we don't have to so for each node */
|
|
|
|
present_cpus_map = nodeGetPresentCPUBitmap(sysfs_prefix);
|
|
|
|
if (!present_cpus_map)
|
|
|
|
goto cleanup;
|
|
|
|
online_cpus_map = nodeGetOnlineCPUBitmap(sysfs_prefix);
|
|
|
|
if (!online_cpus_map)
|
|
|
|
goto cleanup;
|
|
|
|
|
2012-05-11 19:59:59 +00:00
|
|
|
/* OK, we've parsed clock speed out of /proc/cpuinfo. Get the
|
|
|
|
* core, node, socket, thread and topology information from /sys
|
2007-07-25 23:16:30 +00:00
|
|
|
*/
|
2015-07-14 09:40:13 +00:00
|
|
|
if (virAsprintf(&sysfs_nodedir, "%s/node", prefix) < 0)
|
2012-05-11 19:59:59 +00:00
|
|
|
goto cleanup;
|
2011-10-03 12:45:30 +00:00
|
|
|
|
2012-07-09 14:57:49 +00:00
|
|
|
if (!(nodedir = opendir(sysfs_nodedir))) {
|
|
|
|
/* the host isn't probably running a NUMA architecture */
|
|
|
|
goto fallback;
|
|
|
|
}
|
2011-10-03 12:45:30 +00:00
|
|
|
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
/* PPC-KVM needs the secondary threads of a core to be offline on the
|
|
|
|
* host. The kvm scheduler brings the secondary threads online in the
|
|
|
|
* guest context. Moreover, P8 processor has split-core capability
|
|
|
|
* where, there can be 1,2 or 4 subcores per core. The primaries of the
|
|
|
|
* subcores alone will be online on the host for a subcore in the
|
|
|
|
* host. Even though the actual threads per core for P8 processor is 8,
|
|
|
|
* depending on the subcores_per_core = 1, 2 or 4, the threads per
|
|
|
|
* subcore will vary accordingly to 8, 4 and 2 repectively.
|
|
|
|
* So, On host threads_per_core what is arrived at from sysfs in the
|
|
|
|
* current logic is actually the subcores_per_core. Threads per subcore
|
|
|
|
* can only be obtained from the kvm device. For example, on P8 wih 1
|
|
|
|
* core having 8 threads, sub_cores_percore=4, the threads 0,2,4 & 6
|
|
|
|
* will be online. The sysfs reflects this and in the current logic
|
|
|
|
* variable 'threads' will be 4 which is nothing but subcores_per_core.
|
|
|
|
* If the user tampers the cpu online/offline states using chcpu or other
|
|
|
|
* means, then it is an unsupported configuration for kvm.
|
|
|
|
* The code below tries to keep in mind
|
|
|
|
* - when the libvirtd is run inside a KVM guest or Phyp based guest.
|
|
|
|
* - Or on the kvm host where user manually tampers the cpu states to
|
|
|
|
* offline/online randomly.
|
|
|
|
* On hosts other than POWER this will be 0, in which case a simpler
|
|
|
|
* thread-counting logic will be used */
|
|
|
|
if ((threads_per_subcore = nodeGetThreadsPerSubcore(arch)) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
/* If the subcore configuration is not valid, just pretend subcores
|
|
|
|
* are not in use and count threads one by one */
|
|
|
|
if (!nodeHasValidSubcoreConfiguration(sysfs_prefix, threads_per_subcore))
|
|
|
|
threads_per_subcore = 0;
|
|
|
|
|
2014-04-20 11:53:46 +00:00
|
|
|
while ((direrr = virDirRead(nodedir, &nodedirent, sysfs_nodedir)) > 0) {
|
2012-07-09 14:57:49 +00:00
|
|
|
if (sscanf(nodedirent->d_name, "node%u", &node) != 1)
|
2010-03-04 22:28:40 +00:00
|
|
|
continue;
|
|
|
|
|
2012-07-09 14:57:49 +00:00
|
|
|
nodeinfo->nodes++;
|
|
|
|
|
|
|
|
if (virAsprintf(&sysfs_cpudir, "%s/node/%s",
|
2015-07-14 09:40:13 +00:00
|
|
|
prefix, nodedirent->d_name) < 0)
|
2012-05-11 19:59:59 +00:00
|
|
|
goto cleanup;
|
2010-08-10 21:33:37 +00:00
|
|
|
|
2015-07-20 16:37:30 +00:00
|
|
|
if ((cpus = virNodeParseNode(sysfs_cpudir, arch,
|
|
|
|
present_cpus_map,
|
|
|
|
online_cpus_map,
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
threads_per_subcore,
|
2014-06-17 11:58:48 +00:00
|
|
|
&socks, &cores,
|
2012-11-07 13:53:36 +00:00
|
|
|
&threads, &offline)) < 0)
|
2012-07-09 14:57:49 +00:00
|
|
|
goto cleanup;
|
2011-10-03 12:45:30 +00:00
|
|
|
|
2012-07-09 14:57:49 +00:00
|
|
|
VIR_FREE(sysfs_cpudir);
|
2010-03-04 22:28:40 +00:00
|
|
|
|
2012-07-09 14:57:49 +00:00
|
|
|
nodeinfo->cpus += cpus;
|
|
|
|
|
|
|
|
if (socks > nodeinfo->sockets)
|
|
|
|
nodeinfo->sockets = socks;
|
|
|
|
|
|
|
|
if (cores > nodeinfo->cores)
|
|
|
|
nodeinfo->cores = cores;
|
|
|
|
|
|
|
|
if (threads > nodeinfo->threads)
|
|
|
|
nodeinfo->threads = threads;
|
2010-03-04 22:28:40 +00:00
|
|
|
}
|
2012-07-09 14:57:49 +00:00
|
|
|
|
2014-04-20 11:53:46 +00:00
|
|
|
if (direrr < 0)
|
2012-05-11 19:59:59 +00:00
|
|
|
goto cleanup;
|
2012-07-09 14:57:49 +00:00
|
|
|
|
|
|
|
if (nodeinfo->cpus && nodeinfo->nodes)
|
|
|
|
goto done;
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
fallback:
|
2012-07-09 14:57:49 +00:00
|
|
|
VIR_FREE(sysfs_cpudir);
|
|
|
|
|
2015-07-14 09:40:13 +00:00
|
|
|
if (virAsprintf(&sysfs_cpudir, "%s/cpu", prefix) < 0)
|
2012-05-11 19:59:59 +00:00
|
|
|
goto cleanup;
|
2010-03-04 22:28:40 +00:00
|
|
|
|
2015-07-20 16:37:30 +00:00
|
|
|
if ((cpus = virNodeParseNode(sysfs_cpudir, arch,
|
|
|
|
present_cpus_map,
|
|
|
|
online_cpus_map,
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
threads_per_subcore,
|
2014-06-17 11:58:48 +00:00
|
|
|
&socks, &cores,
|
2012-11-07 13:53:36 +00:00
|
|
|
&threads, &offline)) < 0)
|
2012-05-11 19:59:59 +00:00
|
|
|
goto cleanup;
|
2007-07-25 23:16:30 +00:00
|
|
|
|
2012-07-09 14:57:49 +00:00
|
|
|
nodeinfo->nodes = 1;
|
|
|
|
nodeinfo->cpus = cpus;
|
|
|
|
nodeinfo->sockets = socks;
|
|
|
|
nodeinfo->cores = cores;
|
|
|
|
nodeinfo->threads = threads;
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
done:
|
2012-05-11 19:59:59 +00:00
|
|
|
/* There should always be at least one cpu, socket, node, and thread. */
|
2011-10-03 12:45:30 +00:00
|
|
|
if (nodeinfo->cpus == 0) {
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s", _("no CPUs found"));
|
2012-05-11 19:59:59 +00:00
|
|
|
goto cleanup;
|
2011-10-03 12:45:30 +00:00
|
|
|
}
|
2012-07-09 14:57:49 +00:00
|
|
|
|
2010-03-09 15:17:59 +00:00
|
|
|
if (nodeinfo->sockets == 0) {
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s", _("no sockets found"));
|
2012-05-11 19:59:59 +00:00
|
|
|
goto cleanup;
|
2010-03-09 15:17:59 +00:00
|
|
|
}
|
2012-07-09 14:57:49 +00:00
|
|
|
|
2010-03-09 15:17:59 +00:00
|
|
|
if (nodeinfo->threads == 0) {
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s", _("no threads found"));
|
2012-05-11 19:59:59 +00:00
|
|
|
goto cleanup;
|
2010-03-09 15:17:59 +00:00
|
|
|
}
|
|
|
|
|
2012-11-07 13:53:36 +00:00
|
|
|
/* Now check if the topology makes sense. There are machines that don't
|
|
|
|
* expose their real number of nodes or for example the AMD Bulldozer
|
|
|
|
* architecture that exposes their Clustered integer core modules as both
|
|
|
|
* threads and cores. This approach throws off our detection. Unfortunately
|
|
|
|
* the nodeinfo structure isn't designed to carry the full topology so
|
|
|
|
* we're going to lie about the detected topology to notify the user
|
|
|
|
* to check the host capabilities for the actual topology. */
|
|
|
|
if ((nodeinfo->nodes *
|
|
|
|
nodeinfo->sockets *
|
|
|
|
nodeinfo->cores *
|
|
|
|
nodeinfo->threads) != (nodeinfo->cpus + offline)) {
|
|
|
|
nodeinfo->nodes = 1;
|
|
|
|
nodeinfo->sockets = 1;
|
|
|
|
nodeinfo->cores = nodeinfo->cpus + offline;
|
|
|
|
nodeinfo->threads = 1;
|
|
|
|
}
|
|
|
|
|
2012-05-11 19:59:59 +00:00
|
|
|
ret = 0;
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2012-07-09 14:57:49 +00:00
|
|
|
/* don't shadow a more serious error */
|
|
|
|
if (nodedir && closedir(nodedir) < 0 && ret >= 0) {
|
|
|
|
virReportSystemError(errno, _("problem closing %s"), sysfs_nodedir);
|
|
|
|
ret = -1;
|
|
|
|
}
|
|
|
|
|
2015-07-20 16:37:30 +00:00
|
|
|
virBitmapFree(present_cpus_map);
|
|
|
|
virBitmapFree(online_cpus_map);
|
2012-07-09 14:57:49 +00:00
|
|
|
VIR_FREE(sysfs_nodedir);
|
2012-05-11 19:59:59 +00:00
|
|
|
VIR_FREE(sysfs_cpudir);
|
|
|
|
return ret;
|
2007-07-25 23:16:30 +00:00
|
|
|
}
|
|
|
|
|
2014-01-21 12:57:30 +00:00
|
|
|
static int
|
|
|
|
virNodeCPUStatsAssign(virNodeCPUStatsPtr param,
|
|
|
|
const char *name,
|
|
|
|
unsigned long long value)
|
|
|
|
{
|
|
|
|
if (virStrcpyStatic(param->field, name) == NULL) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
2014-01-22 12:58:26 +00:00
|
|
|
"%s", _("kernel cpu time field is too long"
|
|
|
|
" for the destination"));
|
2014-01-21 12:57:30 +00:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
param->value = value;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2011-06-07 01:02:55 +00:00
|
|
|
# define TICK_TO_NSEC (1000ull * 1000ull * 1000ull / sysconf(_SC_CLK_TCK))
|
|
|
|
|
2014-01-16 11:37:27 +00:00
|
|
|
int
|
2013-10-15 13:44:48 +00:00
|
|
|
linuxNodeGetCPUStats(FILE *procstat,
|
|
|
|
int cpuNum,
|
|
|
|
virNodeCPUStatsPtr params,
|
|
|
|
int *nparams)
|
2011-06-07 01:02:55 +00:00
|
|
|
{
|
|
|
|
int ret = -1;
|
|
|
|
char line[1024];
|
|
|
|
unsigned long long usr, ni, sys, idle, iowait;
|
|
|
|
unsigned long long irq, softirq, steal, guest, guest_nice;
|
2014-01-21 05:21:49 +00:00
|
|
|
char cpu_header[4 + INT_BUFSIZE_BOUND(cpuNum)];
|
2011-06-07 01:02:55 +00:00
|
|
|
|
|
|
|
if ((*nparams) == 0) {
|
|
|
|
/* Current number of cpu stats supported by linux */
|
|
|
|
*nparams = LINUX_NB_CPU_STATS;
|
|
|
|
ret = 0;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((*nparams) != LINUX_NB_CPU_STATS) {
|
Santize the reporting of VIR_ERR_INVALID_ERROR
To ensure consistent error reporting of invalid arguments,
provide a number of predefined helper methods & macros.
- An arg which must not be NULL:
virCheckNonNullArgReturn(argname, retvalue)
virCheckNonNullArgGoto(argname, label)
- An arg which must be NULL
virCheckNullArgGoto(argname, label)
- An arg which must be positive (ie 1 or greater)
virCheckPositiveArgGoto(argname, label)
- An arg which must not be 0
virCheckNonZeroArgGoto(argname, label)
- An arg which must be zero
virCheckZeroArgGoto(argname, label)
- An arg which must not be negative (ie 0 or greater)
virCheckNonNegativeArgGoto(argname, label)
* src/libvirt.c, src/libvirt-qemu.c,
src/nodeinfo.c, src/datatypes.c: Update to use
virCheckXXXX macros
* po/POTFILES.in: Add libvirt-qemu.c and virterror_internal.h
* src/internal.h: Define macros for checking invalid args
* src/util/virterror_internal.h: Define macros for reporting
invalid args
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2012-05-25 17:41:07 +00:00
|
|
|
virReportInvalidArg(*nparams,
|
|
|
|
_("nparams in %s must be equal to %d"),
|
|
|
|
__FUNCTION__, LINUX_NB_CPU_STATS);
|
2011-06-07 01:02:55 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
2011-06-15 10:39:57 +00:00
|
|
|
if (cpuNum == VIR_NODE_CPU_STATS_ALL_CPUS) {
|
2014-01-16 08:18:09 +00:00
|
|
|
strcpy(cpu_header, "cpu ");
|
2011-06-07 01:02:55 +00:00
|
|
|
} else {
|
2014-01-16 08:18:09 +00:00
|
|
|
snprintf(cpu_header, sizeof(cpu_header), "cpu%d ", cpuNum);
|
2011-06-07 01:02:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
while (fgets(line, sizeof(line), procstat) != NULL) {
|
|
|
|
char *buf = line;
|
|
|
|
|
|
|
|
if (STRPREFIX(buf, cpu_header)) { /* aka logical CPU time */
|
|
|
|
if (sscanf(buf,
|
|
|
|
"%*s %llu %llu %llu %llu %llu" // user ~ iowait
|
|
|
|
"%llu %llu %llu %llu %llu", // irq ~ guest_nice
|
|
|
|
&usr, &ni, &sys, &idle, &iowait,
|
|
|
|
&irq, &softirq, &steal, &guest, &guest_nice) < 4) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2014-01-21 12:57:30 +00:00
|
|
|
if (virNodeCPUStatsAssign(¶ms[0], VIR_NODE_CPU_STATS_KERNEL,
|
|
|
|
(sys + irq + softirq) * TICK_TO_NSEC) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (virNodeCPUStatsAssign(¶ms[1], VIR_NODE_CPU_STATS_USER,
|
|
|
|
(usr + ni) * TICK_TO_NSEC) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (virNodeCPUStatsAssign(¶ms[2], VIR_NODE_CPU_STATS_IDLE,
|
|
|
|
idle * TICK_TO_NSEC) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (virNodeCPUStatsAssign(¶ms[3], VIR_NODE_CPU_STATS_IOWAIT,
|
|
|
|
iowait * TICK_TO_NSEC) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
2011-06-07 01:02:55 +00:00
|
|
|
ret = 0;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
Santize the reporting of VIR_ERR_INVALID_ERROR
To ensure consistent error reporting of invalid arguments,
provide a number of predefined helper methods & macros.
- An arg which must not be NULL:
virCheckNonNullArgReturn(argname, retvalue)
virCheckNonNullArgGoto(argname, label)
- An arg which must be NULL
virCheckNullArgGoto(argname, label)
- An arg which must be positive (ie 1 or greater)
virCheckPositiveArgGoto(argname, label)
- An arg which must not be 0
virCheckNonZeroArgGoto(argname, label)
- An arg which must be zero
virCheckZeroArgGoto(argname, label)
- An arg which must not be negative (ie 0 or greater)
virCheckNonNegativeArgGoto(argname, label)
* src/libvirt.c, src/libvirt-qemu.c,
src/nodeinfo.c, src/datatypes.c: Update to use
virCheckXXXX macros
* po/POTFILES.in: Add libvirt-qemu.c and virterror_internal.h
* src/internal.h: Define macros for checking invalid args
* src/util/virterror_internal.h: Define macros for reporting
invalid args
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2012-05-25 17:41:07 +00:00
|
|
|
virReportInvalidArg(cpuNum,
|
|
|
|
_("Invalid cpuNum in %s"),
|
|
|
|
__FUNCTION__);
|
2011-06-07 01:02:55 +00:00
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2011-06-07 01:11:17 +00:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2013-10-15 13:44:48 +00:00
|
|
|
static int
|
|
|
|
linuxNodeGetMemoryStats(FILE *meminfo,
|
|
|
|
int cellNum,
|
|
|
|
virNodeMemoryStatsPtr params,
|
|
|
|
int *nparams)
|
2011-06-07 01:11:17 +00:00
|
|
|
{
|
|
|
|
int ret = -1;
|
Convert 'int i' to 'size_t i' in src/node_device/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 14:09:33 +00:00
|
|
|
size_t i = 0, j = 0, k = 0;
|
2011-06-07 01:11:17 +00:00
|
|
|
int found = 0;
|
|
|
|
int nr_param;
|
|
|
|
char line[1024];
|
2011-06-15 10:39:57 +00:00
|
|
|
char meminfo_hdr[VIR_NODE_MEMORY_STATS_FIELD_LENGTH];
|
2011-06-07 01:11:17 +00:00
|
|
|
unsigned long val;
|
|
|
|
struct field_conv {
|
|
|
|
const char *meminfo_hdr; // meminfo header
|
|
|
|
const char *field; // MemoryStats field name
|
|
|
|
} field_conv[] = {
|
2011-06-15 10:39:57 +00:00
|
|
|
{"MemTotal:", VIR_NODE_MEMORY_STATS_TOTAL},
|
|
|
|
{"MemFree:", VIR_NODE_MEMORY_STATS_FREE},
|
|
|
|
{"Buffers:", VIR_NODE_MEMORY_STATS_BUFFERS},
|
|
|
|
{"Cached:", VIR_NODE_MEMORY_STATS_CACHED},
|
2011-06-07 01:11:17 +00:00
|
|
|
{NULL, NULL}
|
|
|
|
};
|
|
|
|
|
2011-06-15 10:39:57 +00:00
|
|
|
if (cellNum == VIR_NODE_MEMORY_STATS_ALL_CELLS) {
|
2011-06-07 01:11:17 +00:00
|
|
|
nr_param = LINUX_NB_MEMORY_STATS_ALL;
|
|
|
|
} else {
|
|
|
|
nr_param = LINUX_NB_MEMORY_STATS_CELL;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((*nparams) == 0) {
|
|
|
|
/* Current number of memory stats supported by linux */
|
|
|
|
*nparams = nr_param;
|
|
|
|
ret = 0;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((*nparams) != nr_param) {
|
Santize the reporting of VIR_ERR_INVALID_ERROR
To ensure consistent error reporting of invalid arguments,
provide a number of predefined helper methods & macros.
- An arg which must not be NULL:
virCheckNonNullArgReturn(argname, retvalue)
virCheckNonNullArgGoto(argname, label)
- An arg which must be NULL
virCheckNullArgGoto(argname, label)
- An arg which must be positive (ie 1 or greater)
virCheckPositiveArgGoto(argname, label)
- An arg which must not be 0
virCheckNonZeroArgGoto(argname, label)
- An arg which must be zero
virCheckZeroArgGoto(argname, label)
- An arg which must not be negative (ie 0 or greater)
virCheckNonNegativeArgGoto(argname, label)
* src/libvirt.c, src/libvirt-qemu.c,
src/nodeinfo.c, src/datatypes.c: Update to use
virCheckXXXX macros
* po/POTFILES.in: Add libvirt-qemu.c and virterror_internal.h
* src/internal.h: Define macros for checking invalid args
* src/util/virterror_internal.h: Define macros for reporting
invalid args
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2012-05-25 17:41:07 +00:00
|
|
|
virReportInvalidArg(nparams,
|
|
|
|
_("nparams in %s must be %d"),
|
|
|
|
__FUNCTION__, nr_param);
|
2011-06-07 01:11:17 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
while (fgets(line, sizeof(line), meminfo) != NULL) {
|
|
|
|
char *buf = line;
|
|
|
|
|
|
|
|
if (STRPREFIX(buf, "Node ")) {
|
|
|
|
/*
|
|
|
|
* /sys/devices/system/node/nodeX/meminfo format is below.
|
|
|
|
* So, skip prefix "Node XX ".
|
|
|
|
*
|
|
|
|
* Node 0 MemTotal: 8386980 kB
|
|
|
|
* Node 0 MemFree: 5300920 kB
|
|
|
|
* :
|
|
|
|
*/
|
|
|
|
char *p;
|
|
|
|
|
|
|
|
p = buf;
|
|
|
|
for (i = 0; i < 2; i++) {
|
|
|
|
p = strchr(p, ' ');
|
|
|
|
if (p == NULL) {
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("no prefix found"));
|
2011-06-07 01:11:17 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
p++;
|
|
|
|
}
|
|
|
|
buf = p;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (sscanf(buf, "%s %lu kB", meminfo_hdr, &val) < 2)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
for (j = 0; field_conv[j].meminfo_hdr != NULL; j++) {
|
|
|
|
struct field_conv *convp = &field_conv[j];
|
|
|
|
|
|
|
|
if (STREQ(meminfo_hdr, convp->meminfo_hdr)) {
|
2011-06-15 10:39:57 +00:00
|
|
|
virNodeMemoryStatsPtr param = ¶ms[k++];
|
2011-06-07 01:11:17 +00:00
|
|
|
|
|
|
|
if (virStrcpyStatic(param->field, convp->field) == NULL) {
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("Field kernel memory too long for destination"));
|
2011-06-07 01:11:17 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
param->value = val;
|
|
|
|
found++;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (found >= nr_param)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (found == 0) {
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("no available memory line found"));
|
2011-06-07 01:11:17 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = 0;
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2011-06-07 01:02:55 +00:00
|
|
|
return ret;
|
|
|
|
}
|
2012-03-02 02:54:22 +00:00
|
|
|
|
2015-07-06 21:03:51 +00:00
|
|
|
static char *
|
2015-07-20 16:37:21 +00:00
|
|
|
linuxGetCPUGlobalPath(const char *sysfs_prefix,
|
|
|
|
const char *file)
|
2015-07-06 21:03:51 +00:00
|
|
|
{
|
|
|
|
const char *prefix = sysfs_prefix ? sysfs_prefix : SYSFS_SYSTEM_PATH;
|
|
|
|
char *path = NULL;
|
|
|
|
|
2015-07-20 16:37:21 +00:00
|
|
|
if (virAsprintf(&path, "%s/cpu/%s", prefix, file) < 0)
|
2015-07-06 21:03:51 +00:00
|
|
|
return NULL;
|
2015-07-20 16:37:21 +00:00
|
|
|
|
2015-07-06 21:03:51 +00:00
|
|
|
return path;
|
|
|
|
}
|
2012-10-24 22:43:26 +00:00
|
|
|
|
2015-07-20 16:37:21 +00:00
|
|
|
static char *
|
|
|
|
linuxGetCPUPresentPath(const char *sysfs_prefix)
|
|
|
|
{
|
|
|
|
return linuxGetCPUGlobalPath(sysfs_prefix, "present");
|
|
|
|
}
|
|
|
|
|
2015-07-20 16:37:22 +00:00
|
|
|
static char *
|
|
|
|
linuxGetCPUOnlinePath(const char *sysfs_prefix)
|
|
|
|
{
|
|
|
|
return linuxGetCPUGlobalPath(sysfs_prefix, "online");
|
|
|
|
}
|
|
|
|
|
2015-07-20 16:37:23 +00:00
|
|
|
/* Determine the number of CPUs (maximum CPU id + 1) from a file containing
|
|
|
|
* a list of CPU ids, like the Linux sysfs cpu/present file */
|
2012-10-24 22:43:26 +00:00
|
|
|
static int
|
2015-07-20 16:37:23 +00:00
|
|
|
linuxParseCPUCount(const char *path)
|
2012-10-24 22:43:26 +00:00
|
|
|
{
|
|
|
|
char *str = NULL;
|
|
|
|
char *tmp;
|
|
|
|
int ret = -1;
|
|
|
|
|
2012-11-15 14:04:33 +00:00
|
|
|
if (virFileReadAll(path, 5 * VIR_DOMAIN_CPUMASK_LEN, &str) < 0)
|
2012-10-24 22:43:26 +00:00
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
tmp = str;
|
|
|
|
do {
|
|
|
|
if (virStrToLong_i(tmp, &tmp, 10, &ret) < 0 ||
|
|
|
|
!strchr(",-\n", *tmp)) {
|
|
|
|
virReportError(VIR_ERR_NO_SUPPORT,
|
|
|
|
_("failed to parse %s"), path);
|
|
|
|
ret = -1;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
} while (*tmp++ != '\n');
|
|
|
|
ret++;
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2012-10-24 22:43:26 +00:00
|
|
|
VIR_FREE(str);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2012-03-02 02:54:22 +00:00
|
|
|
/*
|
2012-10-24 22:43:26 +00:00
|
|
|
* Linux maintains cpu bit map under cpu/online. For example, if
|
|
|
|
* cpuid=5's flag is not set and max cpu is 7, the map file shows
|
|
|
|
* 0-4,6-7. This function parses it and returns cpumap.
|
2012-03-02 02:54:22 +00:00
|
|
|
*/
|
2012-09-14 07:47:03 +00:00
|
|
|
static virBitmapPtr
|
2012-10-24 22:43:26 +00:00
|
|
|
linuxParseCPUmap(int max_cpuid, const char *path)
|
2012-03-02 02:54:22 +00:00
|
|
|
{
|
2012-09-14 07:47:03 +00:00
|
|
|
virBitmapPtr map = NULL;
|
2012-03-02 02:54:22 +00:00
|
|
|
char *str = NULL;
|
|
|
|
|
2013-07-04 10:20:00 +00:00
|
|
|
if (virFileReadAll(path, 5 * VIR_DOMAIN_CPUMASK_LEN, &str) < 0)
|
2012-03-02 02:54:22 +00:00
|
|
|
goto error;
|
|
|
|
|
2012-10-24 22:43:26 +00:00
|
|
|
if (virBitmapParse(str, 0, &map, max_cpuid) < 0)
|
2012-03-02 02:54:22 +00:00
|
|
|
goto error;
|
|
|
|
|
2012-04-24 08:55:06 +00:00
|
|
|
VIR_FREE(str);
|
2012-03-02 02:54:22 +00:00
|
|
|
return map;
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
error:
|
2012-03-02 02:54:22 +00:00
|
|
|
VIR_FREE(str);
|
2012-09-14 07:47:03 +00:00
|
|
|
virBitmapFree(map);
|
2012-03-02 02:54:22 +00:00
|
|
|
return NULL;
|
|
|
|
}
|
2013-11-07 00:09:26 +00:00
|
|
|
|
|
|
|
|
|
|
|
static virBitmapPtr
|
|
|
|
virNodeGetSiblingsList(const char *dir, int cpu_id)
|
|
|
|
{
|
|
|
|
char *path = NULL;
|
|
|
|
char *buf = NULL;
|
|
|
|
virBitmapPtr ret = NULL;
|
|
|
|
|
|
|
|
if (virAsprintf(&path, "%s/cpu%u/topology/thread_siblings_list",
|
|
|
|
dir, cpu_id) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (virFileReadAll(path, SYSFS_THREAD_SIBLINGS_LIST_LENGTH_MAX, &buf) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (virBitmapParse(buf, 0, &ret, virNumaGetMaxCPUs()) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2013-11-07 00:09:26 +00:00
|
|
|
VIR_FREE(buf);
|
|
|
|
VIR_FREE(path);
|
|
|
|
return ret;
|
|
|
|
}
|
2007-07-25 23:16:30 +00:00
|
|
|
#endif
|
|
|
|
|
2015-07-14 09:40:14 +00:00
|
|
|
int
|
|
|
|
nodeGetInfo(const char *sysfs_prefix ATTRIBUTE_UNUSED,
|
|
|
|
virNodeInfoPtr nodeinfo)
|
2012-12-10 21:58:16 +00:00
|
|
|
{
|
|
|
|
virArch hostarch = virArchFromHost();
|
2009-01-20 17:13:33 +00:00
|
|
|
|
2013-01-23 15:43:21 +00:00
|
|
|
memset(nodeinfo, 0, sizeof(*nodeinfo));
|
|
|
|
|
2012-12-10 21:58:16 +00:00
|
|
|
if (virStrcpyStatic(nodeinfo->model, virArchToString(hostarch)) == NULL)
|
2009-08-03 12:37:44 +00:00
|
|
|
return -1;
|
2007-12-07 14:45:39 +00:00
|
|
|
|
2007-07-25 23:16:30 +00:00
|
|
|
#ifdef __linux__
|
Use gnulib, starting with its physmem and getaddrinfo modules.
New files go into these directories:
gnulib/lib
gnulib/m4
gnulib/tests
* bootstrap: A wrapper around gnulib-tool.
* configure.in: Invoke gl_EARLY and gl_INIT, being careful to put gl_EARLY
before any macro that uses AC_COMPILE_IFELSE.
(AC_OUTPUT): Add lib/Makefile and gl-tests/Makefile. Remove m4/Makefile.
* Makefile.am (SUBDIRS): Add gnulib/lib and remove m4. Add gnulib/tests
early enough that those tests run before any libvirt unit tests.
* m4/Makefile.am: Remove file. Not needed.
* src/Makefile.am (INCLUDES): Add -I$(top_srcdir)/gnulib/lib -I../gnulib/lib.
(LDADDS, libvirt_la_LIBADD): Add ../gnulib/lib/libgnu.la.
* src/nodeinfo.c: Include "physmem.h".
* qemud/qemud.c, src/remote_internal.c: Include "getaddrinfo.h".
(MEMINFO_PATH, linuxNodeInfoMemPopulate): Remove definitions.
(virNodeInfoPopulate): Use physmem_total, not linuxNodeInfoMemPopulate.
* tests/Makefile.am (INCLUDES): Add -I$(top_srcdir)/gnulib/lib -I../gnulib/lib.
(LDADDS): Add ../gnulib/lib/libgnu.la.
* qemud/Makefile.am (libvirtd_LDADD): Add ../gnulib/lib/libgnu.la.
* tests/nodeinfotest.c (linuxTestCompareFiles): No longer read total
memory from a file.
Update expected output not to include "Memory: NNNN"
* tests/nodeinfodata/linux-nodeinfo-1.txt:
* tests/nodeinfodata/linux-nodeinfo-2.txt:
* tests/nodeinfodata/linux-nodeinfo-3.txt:
* tests/nodeinfodata/linux-nodeinfo-4.txt:
* tests/nodeinfodata/linux-nodeinfo-5.txt:
* tests/nodeinfodata/linux-nodeinfo-6.txt:
* src/test.c [WITH_TEST]: Remove definition of _GNU_SOURCE that
would conflict with the one now in "config.h".
* autogen.sh: Add -I gnulib/m4.
* src/conf.c, src/sexpr.c: Don't define _GNU_SOURCE.
Instead, include "config.h".
* qemud/qemud.c: Remove definition of _GNU_SOURCE.
* src/openvz_driver.c: Likewise.
* src/qemu_driver.c: Likewise.
* src/remote_internal.c: Likewise.
* configure.in: Use AC_CONFIG_AUX_DIR(build-aux), so that a bunch
of gettextize-generated files go into build-aux/, rather than in
the top-level directory.
* .cvsignore: Adjust.
* build-aux/.cvsignore: New file.
Author: Jim Meyering <meyering@redhat.com>
2007-12-05 21:31:07 +00:00
|
|
|
{
|
2012-05-02 15:18:03 +00:00
|
|
|
int ret = -1;
|
Use gnulib, starting with its physmem and getaddrinfo modules.
New files go into these directories:
gnulib/lib
gnulib/m4
gnulib/tests
* bootstrap: A wrapper around gnulib-tool.
* configure.in: Invoke gl_EARLY and gl_INIT, being careful to put gl_EARLY
before any macro that uses AC_COMPILE_IFELSE.
(AC_OUTPUT): Add lib/Makefile and gl-tests/Makefile. Remove m4/Makefile.
* Makefile.am (SUBDIRS): Add gnulib/lib and remove m4. Add gnulib/tests
early enough that those tests run before any libvirt unit tests.
* m4/Makefile.am: Remove file. Not needed.
* src/Makefile.am (INCLUDES): Add -I$(top_srcdir)/gnulib/lib -I../gnulib/lib.
(LDADDS, libvirt_la_LIBADD): Add ../gnulib/lib/libgnu.la.
* src/nodeinfo.c: Include "physmem.h".
* qemud/qemud.c, src/remote_internal.c: Include "getaddrinfo.h".
(MEMINFO_PATH, linuxNodeInfoMemPopulate): Remove definitions.
(virNodeInfoPopulate): Use physmem_total, not linuxNodeInfoMemPopulate.
* tests/Makefile.am (INCLUDES): Add -I$(top_srcdir)/gnulib/lib -I../gnulib/lib.
(LDADDS): Add ../gnulib/lib/libgnu.la.
* qemud/Makefile.am (libvirtd_LDADD): Add ../gnulib/lib/libgnu.la.
* tests/nodeinfotest.c (linuxTestCompareFiles): No longer read total
memory from a file.
Update expected output not to include "Memory: NNNN"
* tests/nodeinfodata/linux-nodeinfo-1.txt:
* tests/nodeinfodata/linux-nodeinfo-2.txt:
* tests/nodeinfodata/linux-nodeinfo-3.txt:
* tests/nodeinfodata/linux-nodeinfo-4.txt:
* tests/nodeinfodata/linux-nodeinfo-5.txt:
* tests/nodeinfodata/linux-nodeinfo-6.txt:
* src/test.c [WITH_TEST]: Remove definition of _GNU_SOURCE that
would conflict with the one now in "config.h".
* autogen.sh: Add -I gnulib/m4.
* src/conf.c, src/sexpr.c: Don't define _GNU_SOURCE.
Instead, include "config.h".
* qemud/qemud.c: Remove definition of _GNU_SOURCE.
* src/openvz_driver.c: Likewise.
* src/qemu_driver.c: Likewise.
* src/remote_internal.c: Likewise.
* configure.in: Use AC_CONFIG_AUX_DIR(build-aux), so that a bunch
of gettextize-generated files go into build-aux/, rather than in
the top-level directory.
* .cvsignore: Adjust.
* build-aux/.cvsignore: New file.
Author: Jim Meyering <meyering@redhat.com>
2007-12-05 21:31:07 +00:00
|
|
|
FILE *cpuinfo = fopen(CPUINFO_PATH, "r");
|
2015-07-07 11:27:53 +00:00
|
|
|
|
2007-07-25 23:16:30 +00:00
|
|
|
if (!cpuinfo) {
|
2010-02-04 20:02:58 +00:00
|
|
|
virReportSystemError(errno,
|
2009-01-20 17:13:33 +00:00
|
|
|
_("cannot open %s"), CPUINFO_PATH);
|
2007-07-25 23:16:30 +00:00
|
|
|
return -1;
|
|
|
|
}
|
2011-10-03 12:45:30 +00:00
|
|
|
|
2015-07-14 09:40:13 +00:00
|
|
|
ret = linuxNodeInfoCPUPopulate(sysfs_prefix, cpuinfo,
|
2014-06-17 10:25:23 +00:00
|
|
|
hostarch, nodeinfo);
|
2012-05-02 15:18:03 +00:00
|
|
|
if (ret < 0)
|
|
|
|
goto cleanup;
|
2007-07-25 23:16:30 +00:00
|
|
|
|
Use gnulib, starting with its physmem and getaddrinfo modules.
New files go into these directories:
gnulib/lib
gnulib/m4
gnulib/tests
* bootstrap: A wrapper around gnulib-tool.
* configure.in: Invoke gl_EARLY and gl_INIT, being careful to put gl_EARLY
before any macro that uses AC_COMPILE_IFELSE.
(AC_OUTPUT): Add lib/Makefile and gl-tests/Makefile. Remove m4/Makefile.
* Makefile.am (SUBDIRS): Add gnulib/lib and remove m4. Add gnulib/tests
early enough that those tests run before any libvirt unit tests.
* m4/Makefile.am: Remove file. Not needed.
* src/Makefile.am (INCLUDES): Add -I$(top_srcdir)/gnulib/lib -I../gnulib/lib.
(LDADDS, libvirt_la_LIBADD): Add ../gnulib/lib/libgnu.la.
* src/nodeinfo.c: Include "physmem.h".
* qemud/qemud.c, src/remote_internal.c: Include "getaddrinfo.h".
(MEMINFO_PATH, linuxNodeInfoMemPopulate): Remove definitions.
(virNodeInfoPopulate): Use physmem_total, not linuxNodeInfoMemPopulate.
* tests/Makefile.am (INCLUDES): Add -I$(top_srcdir)/gnulib/lib -I../gnulib/lib.
(LDADDS): Add ../gnulib/lib/libgnu.la.
* qemud/Makefile.am (libvirtd_LDADD): Add ../gnulib/lib/libgnu.la.
* tests/nodeinfotest.c (linuxTestCompareFiles): No longer read total
memory from a file.
Update expected output not to include "Memory: NNNN"
* tests/nodeinfodata/linux-nodeinfo-1.txt:
* tests/nodeinfodata/linux-nodeinfo-2.txt:
* tests/nodeinfodata/linux-nodeinfo-3.txt:
* tests/nodeinfodata/linux-nodeinfo-4.txt:
* tests/nodeinfodata/linux-nodeinfo-5.txt:
* tests/nodeinfodata/linux-nodeinfo-6.txt:
* src/test.c [WITH_TEST]: Remove definition of _GNU_SOURCE that
would conflict with the one now in "config.h".
* autogen.sh: Add -I gnulib/m4.
* src/conf.c, src/sexpr.c: Don't define _GNU_SOURCE.
Instead, include "config.h".
* qemud/qemud.c: Remove definition of _GNU_SOURCE.
* src/openvz_driver.c: Likewise.
* src/qemu_driver.c: Likewise.
* src/remote_internal.c: Likewise.
* configure.in: Use AC_CONFIG_AUX_DIR(build-aux), so that a bunch
of gettextize-generated files go into build-aux/, rather than in
the top-level directory.
* .cvsignore: Adjust.
* build-aux/.cvsignore: New file.
Author: Jim Meyering <meyering@redhat.com>
2007-12-05 21:31:07 +00:00
|
|
|
/* Convert to KB. */
|
2012-10-17 09:23:12 +00:00
|
|
|
nodeinfo->memory = physmem_total() / 1024;
|
2007-07-25 23:16:30 +00:00
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2012-05-02 15:18:03 +00:00
|
|
|
VIR_FORCE_FCLOSE(cpuinfo);
|
2007-07-25 23:16:30 +00:00
|
|
|
return ret;
|
Use gnulib, starting with its physmem and getaddrinfo modules.
New files go into these directories:
gnulib/lib
gnulib/m4
gnulib/tests
* bootstrap: A wrapper around gnulib-tool.
* configure.in: Invoke gl_EARLY and gl_INIT, being careful to put gl_EARLY
before any macro that uses AC_COMPILE_IFELSE.
(AC_OUTPUT): Add lib/Makefile and gl-tests/Makefile. Remove m4/Makefile.
* Makefile.am (SUBDIRS): Add gnulib/lib and remove m4. Add gnulib/tests
early enough that those tests run before any libvirt unit tests.
* m4/Makefile.am: Remove file. Not needed.
* src/Makefile.am (INCLUDES): Add -I$(top_srcdir)/gnulib/lib -I../gnulib/lib.
(LDADDS, libvirt_la_LIBADD): Add ../gnulib/lib/libgnu.la.
* src/nodeinfo.c: Include "physmem.h".
* qemud/qemud.c, src/remote_internal.c: Include "getaddrinfo.h".
(MEMINFO_PATH, linuxNodeInfoMemPopulate): Remove definitions.
(virNodeInfoPopulate): Use physmem_total, not linuxNodeInfoMemPopulate.
* tests/Makefile.am (INCLUDES): Add -I$(top_srcdir)/gnulib/lib -I../gnulib/lib.
(LDADDS): Add ../gnulib/lib/libgnu.la.
* qemud/Makefile.am (libvirtd_LDADD): Add ../gnulib/lib/libgnu.la.
* tests/nodeinfotest.c (linuxTestCompareFiles): No longer read total
memory from a file.
Update expected output not to include "Memory: NNNN"
* tests/nodeinfodata/linux-nodeinfo-1.txt:
* tests/nodeinfodata/linux-nodeinfo-2.txt:
* tests/nodeinfodata/linux-nodeinfo-3.txt:
* tests/nodeinfodata/linux-nodeinfo-4.txt:
* tests/nodeinfodata/linux-nodeinfo-5.txt:
* tests/nodeinfodata/linux-nodeinfo-6.txt:
* src/test.c [WITH_TEST]: Remove definition of _GNU_SOURCE that
would conflict with the one now in "config.h".
* autogen.sh: Add -I gnulib/m4.
* src/conf.c, src/sexpr.c: Don't define _GNU_SOURCE.
Instead, include "config.h".
* qemud/qemud.c: Remove definition of _GNU_SOURCE.
* src/openvz_driver.c: Likewise.
* src/qemu_driver.c: Likewise.
* src/remote_internal.c: Likewise.
* configure.in: Use AC_CONFIG_AUX_DIR(build-aux), so that a bunch
of gettextize-generated files go into build-aux/, rather than in
the top-level directory.
* .cvsignore: Adjust.
* build-aux/.cvsignore: New file.
Author: Jim Meyering <meyering@redhat.com>
2007-12-05 21:31:07 +00:00
|
|
|
}
|
2013-10-05 05:56:37 +00:00
|
|
|
#elif defined(__FreeBSD__) || defined(__APPLE__)
|
2012-12-17 18:12:44 +00:00
|
|
|
{
|
|
|
|
nodeinfo->nodes = 1;
|
|
|
|
nodeinfo->sockets = 1;
|
|
|
|
nodeinfo->threads = 1;
|
|
|
|
|
2013-10-05 05:56:37 +00:00
|
|
|
nodeinfo->cpus = appleFreebsdNodeGetCPUCount();
|
2012-12-17 18:12:44 +00:00
|
|
|
if (nodeinfo->cpus == -1)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
nodeinfo->cores = nodeinfo->cpus;
|
|
|
|
|
|
|
|
unsigned long cpu_freq;
|
|
|
|
size_t cpu_freq_len = sizeof(cpu_freq);
|
|
|
|
|
2013-10-05 05:56:37 +00:00
|
|
|
# ifdef __FreeBSD__
|
2012-12-17 18:12:44 +00:00
|
|
|
if (sysctlbyname("dev.cpu.0.freq", &cpu_freq, &cpu_freq_len, NULL, 0) < 0) {
|
|
|
|
virReportSystemError(errno, "%s", _("cannot obtain CPU freq"));
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
nodeinfo->mhz = cpu_freq;
|
2013-10-05 05:56:37 +00:00
|
|
|
# else
|
|
|
|
if (sysctlbyname("hw.cpufrequency", &cpu_freq, &cpu_freq_len, NULL, 0) < 0) {
|
|
|
|
virReportSystemError(errno, "%s", _("cannot obtain CPU freq"));
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
nodeinfo->mhz = cpu_freq / 1000000;
|
|
|
|
# endif
|
2012-12-17 18:12:44 +00:00
|
|
|
|
2013-10-20 15:14:52 +00:00
|
|
|
if (appleFreebsdNodeGetMemorySize(&nodeinfo->memory) < 0)
|
2012-12-17 18:12:44 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
2007-07-25 23:16:30 +00:00
|
|
|
#else
|
|
|
|
/* XXX Solaris will need an impl later if they port QEMU driver */
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_NO_SUPPORT, "%s",
|
|
|
|
_("node info not implemented on this platform"));
|
2007-07-25 23:16:30 +00:00
|
|
|
return -1;
|
|
|
|
#endif
|
|
|
|
}
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
|
2015-07-14 09:40:14 +00:00
|
|
|
int
|
|
|
|
nodeGetCPUStats(int cpuNum ATTRIBUTE_UNUSED,
|
|
|
|
virNodeCPUStatsPtr params ATTRIBUTE_UNUSED,
|
|
|
|
int *nparams ATTRIBUTE_UNUSED,
|
|
|
|
unsigned int flags)
|
2011-06-07 01:02:55 +00:00
|
|
|
{
|
|
|
|
virCheckFlags(0, -1);
|
|
|
|
|
|
|
|
#ifdef __linux__
|
|
|
|
{
|
|
|
|
int ret;
|
|
|
|
FILE *procstat = fopen(PROCSTAT_PATH, "r");
|
|
|
|
if (!procstat) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("cannot open %s"), PROCSTAT_PATH);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
ret = linuxNodeGetCPUStats(procstat, cpuNum, params, nparams);
|
|
|
|
VIR_FORCE_FCLOSE(procstat);
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
2014-01-28 17:49:24 +00:00
|
|
|
#elif defined(__FreeBSD__)
|
|
|
|
return freebsdNodeGetCPUStats(cpuNum, params, nparams);
|
2011-06-07 01:02:55 +00:00
|
|
|
#else
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_NO_SUPPORT, "%s",
|
|
|
|
_("node CPU stats not implemented on this platform"));
|
2011-06-07 01:02:55 +00:00
|
|
|
return -1;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2015-07-14 09:40:14 +00:00
|
|
|
int
|
|
|
|
nodeGetMemoryStats(const char *sysfs_prefix ATTRIBUTE_UNUSED,
|
|
|
|
int cellNum ATTRIBUTE_UNUSED,
|
|
|
|
virNodeMemoryStatsPtr params ATTRIBUTE_UNUSED,
|
|
|
|
int *nparams ATTRIBUTE_UNUSED,
|
|
|
|
unsigned int flags)
|
2011-06-07 01:11:17 +00:00
|
|
|
{
|
|
|
|
virCheckFlags(0, -1);
|
|
|
|
|
|
|
|
#ifdef __linux__
|
|
|
|
{
|
|
|
|
int ret;
|
2015-07-07 21:37:36 +00:00
|
|
|
const char *prefix = sysfs_prefix ? sysfs_prefix : SYSFS_SYSTEM_PATH;
|
2011-06-07 01:11:17 +00:00
|
|
|
char *meminfo_path = NULL;
|
|
|
|
FILE *meminfo;
|
2013-10-17 15:42:22 +00:00
|
|
|
int max_node;
|
2011-06-07 01:11:17 +00:00
|
|
|
|
2011-06-15 10:39:57 +00:00
|
|
|
if (cellNum == VIR_NODE_MEMORY_STATS_ALL_CELLS) {
|
2013-05-03 12:52:48 +00:00
|
|
|
if (VIR_STRDUP(meminfo_path, MEMINFO_PATH) < 0)
|
2011-06-07 01:11:17 +00:00
|
|
|
return -1;
|
|
|
|
} else {
|
2013-10-17 15:42:22 +00:00
|
|
|
if ((max_node = virNumaGetMaxNode()) < 0)
|
2011-06-07 01:11:17 +00:00
|
|
|
return -1;
|
|
|
|
|
2013-10-17 15:42:22 +00:00
|
|
|
if (cellNum > max_node) {
|
Santize the reporting of VIR_ERR_INVALID_ERROR
To ensure consistent error reporting of invalid arguments,
provide a number of predefined helper methods & macros.
- An arg which must not be NULL:
virCheckNonNullArgReturn(argname, retvalue)
virCheckNonNullArgGoto(argname, label)
- An arg which must be NULL
virCheckNullArgGoto(argname, label)
- An arg which must be positive (ie 1 or greater)
virCheckPositiveArgGoto(argname, label)
- An arg which must not be 0
virCheckNonZeroArgGoto(argname, label)
- An arg which must be zero
virCheckZeroArgGoto(argname, label)
- An arg which must not be negative (ie 0 or greater)
virCheckNonNegativeArgGoto(argname, label)
* src/libvirt.c, src/libvirt-qemu.c,
src/nodeinfo.c, src/datatypes.c: Update to use
virCheckXXXX macros
* po/POTFILES.in: Add libvirt-qemu.c and virterror_internal.h
* src/internal.h: Define macros for checking invalid args
* src/util/virterror_internal.h: Define macros for reporting
invalid args
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2012-05-25 17:41:07 +00:00
|
|
|
virReportInvalidArg(cellNum,
|
|
|
|
_("cellNum in %s must be less than or equal to %d"),
|
2013-10-17 15:42:22 +00:00
|
|
|
__FUNCTION__, max_node);
|
2011-06-07 01:11:17 +00:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
2012-05-11 19:59:59 +00:00
|
|
|
if (virAsprintf(&meminfo_path, "%s/node/node%d/meminfo",
|
2015-07-07 21:37:36 +00:00
|
|
|
prefix, cellNum) < 0)
|
2011-06-07 01:11:17 +00:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
meminfo = fopen(meminfo_path, "r");
|
|
|
|
|
|
|
|
if (!meminfo) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("cannot open %s"), meminfo_path);
|
|
|
|
VIR_FREE(meminfo_path);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
ret = linuxNodeGetMemoryStats(meminfo, cellNum, params, nparams);
|
|
|
|
VIR_FORCE_FCLOSE(meminfo);
|
|
|
|
VIR_FREE(meminfo_path);
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
2014-01-03 18:35:50 +00:00
|
|
|
#elif defined(__FreeBSD__)
|
|
|
|
return freebsdNodeGetMemoryStats(params, nparams);
|
2011-06-07 01:11:17 +00:00
|
|
|
#else
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_NO_SUPPORT, "%s",
|
|
|
|
_("node memory stats not implemented on this platform"));
|
2011-06-07 01:11:17 +00:00
|
|
|
return -1;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2012-10-25 20:44:32 +00:00
|
|
|
int
|
2015-07-07 23:49:10 +00:00
|
|
|
nodeGetCPUCount(const char *sysfs_prefix ATTRIBUTE_UNUSED)
|
2012-10-25 20:44:32 +00:00
|
|
|
{
|
2012-12-17 18:12:44 +00:00
|
|
|
#if defined(__linux__)
|
2012-11-13 12:54:36 +00:00
|
|
|
/* To support older kernels that lack cpu/present, such as 2.6.18
|
|
|
|
* in RHEL5, we fall back to count cpu/cpuNN entries; this assumes
|
|
|
|
* that such kernels also lack hotplug, and therefore cpu/cpuNN
|
|
|
|
* will be consecutive.
|
|
|
|
*/
|
2015-07-06 21:03:51 +00:00
|
|
|
char *present_path = NULL;
|
2015-07-07 23:49:10 +00:00
|
|
|
const char *prefix = sysfs_prefix ? sysfs_prefix : SYSFS_SYSTEM_PATH;
|
2012-11-13 12:54:36 +00:00
|
|
|
char *cpupath = NULL;
|
2015-07-06 21:03:51 +00:00
|
|
|
int ncpu = -1;
|
|
|
|
|
2015-07-14 09:40:13 +00:00
|
|
|
if (!(present_path = linuxGetCPUPresentPath(sysfs_prefix)))
|
2015-07-06 21:03:51 +00:00
|
|
|
return -1;
|
2012-11-13 12:54:36 +00:00
|
|
|
|
2015-07-06 21:03:51 +00:00
|
|
|
if (virFileExists(present_path)) {
|
2015-07-20 16:37:23 +00:00
|
|
|
ncpu = linuxParseCPUCount(present_path);
|
2015-07-07 23:49:10 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (virAsprintf(&cpupath, "%s/cpu/cpu0", prefix) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
if (virFileExists(cpupath)) {
|
Convert 'int i' to 'size_t i' in src/node_device/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 14:09:33 +00:00
|
|
|
ncpu = 0;
|
2012-11-13 12:54:36 +00:00
|
|
|
do {
|
Convert 'int i' to 'size_t i' in src/node_device/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 14:09:33 +00:00
|
|
|
ncpu++;
|
2012-11-13 12:54:36 +00:00
|
|
|
VIR_FREE(cpupath);
|
|
|
|
if (virAsprintf(&cpupath, "%s/cpu/cpu%d",
|
2015-07-07 23:49:10 +00:00
|
|
|
prefix, ncpu) < 0) {
|
2015-07-06 21:03:51 +00:00
|
|
|
ncpu = -1;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
2012-11-13 12:54:36 +00:00
|
|
|
} while (virFileExists(cpupath));
|
|
|
|
} else {
|
|
|
|
/* no cpu/cpu0: we give up */
|
|
|
|
virReportError(VIR_ERR_NO_SUPPORT, "%s",
|
|
|
|
_("host cpu counting not supported on this node"));
|
|
|
|
}
|
|
|
|
|
2015-07-06 21:03:51 +00:00
|
|
|
cleanup:
|
|
|
|
VIR_FREE(present_path);
|
2012-11-13 12:54:36 +00:00
|
|
|
VIR_FREE(cpupath);
|
Convert 'int i' to 'size_t i' in src/node_device/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 14:09:33 +00:00
|
|
|
return ncpu;
|
2013-10-08 16:21:04 +00:00
|
|
|
#elif defined(__FreeBSD__) || defined(__APPLE__)
|
|
|
|
return appleFreebsdNodeGetCPUCount();
|
2012-10-25 20:44:32 +00:00
|
|
|
#else
|
|
|
|
virReportError(VIR_ERR_NO_SUPPORT, "%s",
|
|
|
|
_("host cpu counting not implemented on this platform"));
|
|
|
|
return -1;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2015-01-22 10:54:50 +00:00
|
|
|
virBitmapPtr
|
2015-07-20 16:37:24 +00:00
|
|
|
nodeGetPresentCPUBitmap(const char *sysfs_prefix ATTRIBUTE_UNUSED)
|
2015-01-22 10:54:50 +00:00
|
|
|
{
|
2015-07-06 21:03:51 +00:00
|
|
|
#ifdef __linux__
|
2015-07-20 16:37:24 +00:00
|
|
|
virBitmapPtr present_cpus = NULL;
|
2015-07-06 21:03:51 +00:00
|
|
|
char *present_path = NULL;
|
2015-07-20 16:37:24 +00:00
|
|
|
int npresent_cpus;
|
2015-01-22 10:54:50 +00:00
|
|
|
|
2015-07-20 16:37:24 +00:00
|
|
|
if ((npresent_cpus = nodeGetCPUCount(sysfs_prefix)) < 0)
|
|
|
|
goto cleanup;
|
2015-01-22 10:54:50 +00:00
|
|
|
|
2015-07-14 09:40:13 +00:00
|
|
|
if (!(present_path = linuxGetCPUPresentPath(sysfs_prefix)))
|
2015-07-20 16:37:24 +00:00
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
/* If the cpu/present file is available, parse it and exit */
|
|
|
|
if (virFileExists(present_path)) {
|
|
|
|
present_cpus = linuxParseCPUmap(npresent_cpus, present_path);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* If the file is not available, we can assume that the kernel is
|
|
|
|
* too old to support non-consecutive CPU ids and just mark all
|
|
|
|
* possible CPUs as present */
|
|
|
|
if (!(present_cpus = virBitmapNew(npresent_cpus)))
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
virBitmapSetAll(present_cpus);
|
|
|
|
|
|
|
|
cleanup:
|
2015-07-06 21:03:51 +00:00
|
|
|
VIR_FREE(present_path);
|
2015-07-20 16:37:24 +00:00
|
|
|
|
|
|
|
return present_cpus;
|
2015-01-22 10:54:50 +00:00
|
|
|
#endif
|
|
|
|
virReportError(VIR_ERR_NO_SUPPORT, "%s",
|
2015-07-20 16:37:24 +00:00
|
|
|
_("node present CPU map not implemented on this platform"));
|
2015-01-22 10:54:50 +00:00
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2012-09-14 07:47:03 +00:00
|
|
|
virBitmapPtr
|
2015-07-20 16:37:26 +00:00
|
|
|
nodeGetOnlineCPUBitmap(const char *sysfs_prefix ATTRIBUTE_UNUSED)
|
2012-03-02 02:54:22 +00:00
|
|
|
{
|
|
|
|
#ifdef __linux__
|
2015-07-07 23:26:52 +00:00
|
|
|
const char *prefix = sysfs_prefix ? sysfs_prefix : SYSFS_SYSTEM_PATH;
|
|
|
|
char *online_path = NULL;
|
2015-07-17 16:12:50 +00:00
|
|
|
char *cpudir = NULL;
|
2012-09-14 07:47:03 +00:00
|
|
|
virBitmapPtr cpumap;
|
2012-10-24 22:43:26 +00:00
|
|
|
int present;
|
|
|
|
|
2015-07-14 09:40:13 +00:00
|
|
|
present = nodeGetCPUCount(sysfs_prefix);
|
2012-10-24 22:43:26 +00:00
|
|
|
if (present < 0)
|
2012-03-02 02:54:22 +00:00
|
|
|
return NULL;
|
2012-11-15 14:04:33 +00:00
|
|
|
|
2015-07-20 16:37:22 +00:00
|
|
|
if (!(online_path = linuxGetCPUOnlinePath(sysfs_prefix)))
|
2015-07-07 23:26:52 +00:00
|
|
|
return NULL;
|
|
|
|
if (virFileExists(online_path)) {
|
|
|
|
cpumap = linuxParseCPUmap(present, online_path);
|
2012-11-15 14:04:33 +00:00
|
|
|
} else {
|
Convert 'int i' to 'size_t i' in src/node_device/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 14:09:33 +00:00
|
|
|
size_t i;
|
2012-11-15 14:04:33 +00:00
|
|
|
|
|
|
|
cpumap = virBitmapNew(present);
|
2013-07-04 10:20:00 +00:00
|
|
|
if (!cpumap)
|
2015-07-07 23:26:52 +00:00
|
|
|
goto cleanup;
|
2015-07-17 16:12:50 +00:00
|
|
|
|
|
|
|
if (virAsprintf(&cpudir, "%s/cpu", prefix) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
2012-11-15 14:04:33 +00:00
|
|
|
for (i = 0; i < present; i++) {
|
2015-07-17 16:12:50 +00:00
|
|
|
int online = virNodeGetCpuValue(cpudir, i, "online", 1);
|
2012-11-15 14:04:33 +00:00
|
|
|
if (online < 0) {
|
|
|
|
virBitmapFree(cpumap);
|
2015-07-07 23:26:52 +00:00
|
|
|
cpumap = NULL;
|
|
|
|
goto cleanup;
|
2012-11-15 14:04:33 +00:00
|
|
|
}
|
|
|
|
if (online)
|
|
|
|
ignore_value(virBitmapSetBit(cpumap, i));
|
|
|
|
}
|
|
|
|
}
|
2015-07-20 16:37:25 +00:00
|
|
|
|
2015-07-07 23:26:52 +00:00
|
|
|
cleanup:
|
|
|
|
VIR_FREE(online_path);
|
2015-07-17 16:12:50 +00:00
|
|
|
VIR_FREE(cpudir);
|
2012-03-02 02:54:22 +00:00
|
|
|
return cpumap;
|
|
|
|
#else
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_NO_SUPPORT, "%s",
|
2015-07-20 16:37:26 +00:00
|
|
|
_("node online CPU map not implemented on this platform"));
|
2012-03-02 02:54:22 +00:00
|
|
|
return NULL;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2012-09-18 23:04:50 +00:00
|
|
|
#ifdef __linux__
|
2012-09-14 14:42:16 +00:00
|
|
|
static int
|
2012-11-28 14:11:06 +00:00
|
|
|
nodeSetMemoryParameterValue(virTypedParameterPtr param)
|
2012-09-14 14:42:16 +00:00
|
|
|
{
|
|
|
|
char *path = NULL;
|
|
|
|
char *strval = NULL;
|
|
|
|
int ret = -1;
|
|
|
|
int rc = -1;
|
|
|
|
|
2012-11-28 14:11:06 +00:00
|
|
|
char *field = strchr(param->field, '_');
|
2013-01-22 22:09:23 +00:00
|
|
|
sa_assert(field);
|
2012-11-28 14:11:06 +00:00
|
|
|
field++;
|
2012-09-14 14:42:16 +00:00
|
|
|
if (virAsprintf(&path, "%s/%s",
|
|
|
|
SYSFS_MEMORY_SHARED_PATH, field) < 0) {
|
|
|
|
ret = -2;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (virAsprintf(&strval, "%u", param->value.ui) == -1) {
|
|
|
|
ret = -2;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((rc = virFileWriteStr(path, strval, 0)) < 0) {
|
2012-11-28 14:11:06 +00:00
|
|
|
virReportSystemError(-rc, _("failed to set %s"), param->field);
|
2012-09-14 14:42:16 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = 0;
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2012-09-14 14:42:16 +00:00
|
|
|
VIR_FREE(path);
|
|
|
|
VIR_FREE(strval);
|
|
|
|
return ret;
|
|
|
|
}
|
2012-11-28 14:11:06 +00:00
|
|
|
|
|
|
|
static bool
|
|
|
|
nodeMemoryParametersIsAllSupported(virTypedParameterPtr params,
|
|
|
|
int nparams)
|
|
|
|
{
|
|
|
|
char *path = NULL;
|
Convert 'int i' to 'size_t i' in src/node_device/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 14:09:33 +00:00
|
|
|
size_t i;
|
2012-11-28 14:11:06 +00:00
|
|
|
|
|
|
|
for (i = 0; i < nparams; i++) {
|
|
|
|
virTypedParameterPtr param = ¶ms[i];
|
|
|
|
|
|
|
|
char *field = strchr(param->field, '_');
|
2013-01-22 22:09:23 +00:00
|
|
|
sa_assert(field);
|
2012-11-28 14:11:06 +00:00
|
|
|
field++;
|
|
|
|
if (virAsprintf(&path, "%s/%s",
|
2013-07-04 10:20:00 +00:00
|
|
|
SYSFS_MEMORY_SHARED_PATH, field) < 0)
|
2012-11-28 14:11:06 +00:00
|
|
|
return false;
|
|
|
|
|
|
|
|
if (!virFileExists(path)) {
|
|
|
|
virReportError(VIR_ERR_OPERATION_INVALID,
|
|
|
|
_("Parameter '%s' is not supported by "
|
|
|
|
"this kernel"), param->field);
|
|
|
|
VIR_FREE(path);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
VIR_FREE(path);
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
2012-09-18 23:04:50 +00:00
|
|
|
#endif
|
2012-09-14 14:42:16 +00:00
|
|
|
|
|
|
|
int
|
2013-04-26 17:21:58 +00:00
|
|
|
nodeSetMemoryParameters(virTypedParameterPtr params ATTRIBUTE_UNUSED,
|
2012-09-17 14:05:48 +00:00
|
|
|
int nparams ATTRIBUTE_UNUSED,
|
2012-09-14 14:42:16 +00:00
|
|
|
unsigned int flags)
|
|
|
|
{
|
|
|
|
virCheckFlags(0, -1);
|
|
|
|
|
|
|
|
#ifdef __linux__
|
Convert 'int i' to 'size_t i' in src/node_device/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 14:09:33 +00:00
|
|
|
size_t i;
|
2012-11-28 14:11:06 +00:00
|
|
|
int rc;
|
2012-09-14 14:42:16 +00:00
|
|
|
|
2013-05-03 13:34:10 +00:00
|
|
|
if (virTypedParamsValidate(params, nparams,
|
|
|
|
VIR_NODE_MEMORY_SHARED_PAGES_TO_SCAN,
|
|
|
|
VIR_TYPED_PARAM_UINT,
|
|
|
|
VIR_NODE_MEMORY_SHARED_SLEEP_MILLISECS,
|
|
|
|
VIR_TYPED_PARAM_UINT,
|
|
|
|
VIR_NODE_MEMORY_SHARED_MERGE_ACROSS_NODES,
|
|
|
|
VIR_TYPED_PARAM_UINT,
|
|
|
|
NULL) < 0)
|
2012-09-14 14:42:16 +00:00
|
|
|
return -1;
|
|
|
|
|
2012-11-28 14:11:06 +00:00
|
|
|
if (!nodeMemoryParametersIsAllSupported(params, nparams))
|
|
|
|
return -1;
|
2012-09-14 14:42:16 +00:00
|
|
|
|
2012-11-28 14:11:06 +00:00
|
|
|
for (i = 0; i < nparams; i++) {
|
|
|
|
rc = nodeSetMemoryParameterValue(¶ms[i]);
|
2012-10-12 08:25:42 +00:00
|
|
|
|
2014-11-07 10:27:00 +00:00
|
|
|
if (rc < 0)
|
2012-11-28 14:11:06 +00:00
|
|
|
return -1;
|
2012-09-14 14:42:16 +00:00
|
|
|
}
|
|
|
|
|
2012-11-28 14:11:06 +00:00
|
|
|
return 0;
|
2012-09-14 14:42:16 +00:00
|
|
|
#else
|
|
|
|
virReportError(VIR_ERR_NO_SUPPORT, "%s",
|
|
|
|
_("node set memory parameters not implemented"
|
|
|
|
" on this platform"));
|
|
|
|
return -1;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2012-09-18 23:04:50 +00:00
|
|
|
#ifdef __linux__
|
2012-09-14 14:42:16 +00:00
|
|
|
static int
|
|
|
|
nodeGetMemoryParameterValue(const char *field,
|
|
|
|
void *value)
|
|
|
|
{
|
|
|
|
char *path = NULL;
|
|
|
|
char *buf = NULL;
|
|
|
|
char *tmp = NULL;
|
|
|
|
int ret = -1;
|
|
|
|
int rc = -1;
|
|
|
|
|
|
|
|
if (virAsprintf(&path, "%s/%s",
|
2013-07-04 10:20:00 +00:00
|
|
|
SYSFS_MEMORY_SHARED_PATH, field) < 0)
|
2012-09-14 14:42:16 +00:00
|
|
|
goto cleanup;
|
|
|
|
|
2012-11-28 14:11:06 +00:00
|
|
|
if (!virFileExists(path)) {
|
|
|
|
ret = -2;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
2012-09-14 14:42:16 +00:00
|
|
|
if (virFileReadAll(path, 1024, &buf) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if ((tmp = strchr(buf, '\n')))
|
|
|
|
*tmp = '\0';
|
|
|
|
|
2012-10-12 08:25:42 +00:00
|
|
|
if (STREQ(field, "pages_to_scan") ||
|
|
|
|
STREQ(field, "sleep_millisecs") ||
|
|
|
|
STREQ(field, "merge_across_nodes"))
|
2012-09-14 14:42:16 +00:00
|
|
|
rc = virStrToLong_ui(buf, NULL, 10, (unsigned int *)value);
|
|
|
|
else if (STREQ(field, "pages_shared") ||
|
|
|
|
STREQ(field, "pages_sharing") ||
|
|
|
|
STREQ(field, "pages_unshared") ||
|
|
|
|
STREQ(field, "pages_volatile") ||
|
|
|
|
STREQ(field, "full_scans"))
|
|
|
|
rc = virStrToLong_ull(buf, NULL, 10, (unsigned long long *)value);
|
|
|
|
|
|
|
|
if (rc < 0) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("failed to parse %s"), field);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = 0;
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2012-09-14 14:42:16 +00:00
|
|
|
VIR_FREE(path);
|
|
|
|
VIR_FREE(buf);
|
|
|
|
return ret;
|
|
|
|
}
|
2012-09-18 23:04:50 +00:00
|
|
|
#endif
|
2012-09-14 14:42:16 +00:00
|
|
|
|
2012-10-12 08:25:42 +00:00
|
|
|
#define NODE_MEMORY_PARAMETERS_NUM 8
|
2012-09-14 14:42:16 +00:00
|
|
|
int
|
2013-04-26 17:21:58 +00:00
|
|
|
nodeGetMemoryParameters(virTypedParameterPtr params ATTRIBUTE_UNUSED,
|
2012-09-17 14:05:48 +00:00
|
|
|
int *nparams ATTRIBUTE_UNUSED,
|
2012-09-14 14:42:16 +00:00
|
|
|
unsigned int flags)
|
|
|
|
{
|
|
|
|
virCheckFlags(VIR_TYPED_PARAM_STRING_OKAY, -1);
|
|
|
|
|
|
|
|
#ifdef __linux__
|
|
|
|
unsigned int pages_to_scan;
|
|
|
|
unsigned int sleep_millisecs;
|
2012-10-12 08:25:42 +00:00
|
|
|
unsigned int merge_across_nodes;
|
2012-09-14 14:42:16 +00:00
|
|
|
unsigned long long pages_shared;
|
|
|
|
unsigned long long pages_sharing;
|
|
|
|
unsigned long long pages_unshared;
|
|
|
|
unsigned long long pages_volatile;
|
|
|
|
unsigned long long full_scans = 0;
|
Convert 'int i' to 'size_t i' in src/node_device/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 14:09:33 +00:00
|
|
|
size_t i;
|
2012-11-28 14:11:06 +00:00
|
|
|
int ret;
|
2012-09-14 14:42:16 +00:00
|
|
|
|
|
|
|
if ((*nparams) == 0) {
|
|
|
|
*nparams = NODE_MEMORY_PARAMETERS_NUM;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; i < *nparams && i < NODE_MEMORY_PARAMETERS_NUM; i++) {
|
|
|
|
virTypedParameterPtr param = ¶ms[i];
|
|
|
|
|
2012-10-17 09:23:12 +00:00
|
|
|
switch (i) {
|
2012-09-14 14:42:16 +00:00
|
|
|
case 0:
|
2012-11-28 14:11:06 +00:00
|
|
|
ret = nodeGetMemoryParameterValue("pages_to_scan", &pages_to_scan);
|
|
|
|
if (ret == -2)
|
|
|
|
continue;
|
|
|
|
else if (ret == -1)
|
2012-09-14 14:42:16 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (virTypedParameterAssign(param, VIR_NODE_MEMORY_SHARED_PAGES_TO_SCAN,
|
|
|
|
VIR_TYPED_PARAM_UINT, pages_to_scan) < 0)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 1:
|
2012-11-28 14:11:06 +00:00
|
|
|
ret = nodeGetMemoryParameterValue("sleep_millisecs", &sleep_millisecs);
|
|
|
|
if (ret == -2)
|
|
|
|
continue;
|
|
|
|
else if (ret == -1)
|
2012-09-14 14:42:16 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (virTypedParameterAssign(param, VIR_NODE_MEMORY_SHARED_SLEEP_MILLISECS,
|
|
|
|
VIR_TYPED_PARAM_UINT, sleep_millisecs) < 0)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 2:
|
2012-11-28 14:11:06 +00:00
|
|
|
ret = nodeGetMemoryParameterValue("pages_shared", &pages_shared);
|
|
|
|
if (ret == -2)
|
|
|
|
continue;
|
|
|
|
else if (ret == -1)
|
2012-09-14 14:42:16 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (virTypedParameterAssign(param, VIR_NODE_MEMORY_SHARED_PAGES_SHARED,
|
|
|
|
VIR_TYPED_PARAM_ULLONG, pages_shared) < 0)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 3:
|
2012-11-28 14:11:06 +00:00
|
|
|
ret = nodeGetMemoryParameterValue("pages_sharing", &pages_sharing);
|
|
|
|
if (ret == -2)
|
|
|
|
continue;
|
|
|
|
else if (ret == -1)
|
2012-09-14 14:42:16 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (virTypedParameterAssign(param, VIR_NODE_MEMORY_SHARED_PAGES_SHARING,
|
|
|
|
VIR_TYPED_PARAM_ULLONG, pages_sharing) < 0)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 4:
|
2012-11-28 14:11:06 +00:00
|
|
|
ret = nodeGetMemoryParameterValue("pages_unshared", &pages_unshared);
|
|
|
|
if (ret == -2)
|
|
|
|
continue;
|
|
|
|
else if (ret == -1)
|
2012-09-14 14:42:16 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (virTypedParameterAssign(param, VIR_NODE_MEMORY_SHARED_PAGES_UNSHARED,
|
|
|
|
VIR_TYPED_PARAM_ULLONG, pages_unshared) < 0)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 5:
|
2012-11-28 14:11:06 +00:00
|
|
|
ret = nodeGetMemoryParameterValue("pages_volatile", &pages_volatile);
|
|
|
|
if (ret == -2)
|
|
|
|
continue;
|
|
|
|
else if (ret == -1)
|
2012-09-14 14:42:16 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (virTypedParameterAssign(param, VIR_NODE_MEMORY_SHARED_PAGES_VOLATILE,
|
|
|
|
VIR_TYPED_PARAM_ULLONG, pages_volatile) < 0)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 6:
|
2012-11-28 14:11:06 +00:00
|
|
|
ret = nodeGetMemoryParameterValue("full_scans", &full_scans);
|
|
|
|
if (ret == -2)
|
|
|
|
continue;
|
|
|
|
else if (ret == -1)
|
2012-09-14 14:42:16 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (virTypedParameterAssign(param, VIR_NODE_MEMORY_SHARED_FULL_SCANS,
|
|
|
|
VIR_TYPED_PARAM_ULLONG, full_scans) < 0)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
break;
|
|
|
|
|
2012-10-12 08:25:42 +00:00
|
|
|
case 7:
|
2012-11-28 14:11:06 +00:00
|
|
|
ret = nodeGetMemoryParameterValue("merge_across_nodes", &merge_across_nodes);
|
|
|
|
if (ret == -2)
|
|
|
|
continue;
|
|
|
|
else if (ret == -1)
|
2012-10-12 08:25:42 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (virTypedParameterAssign(param, VIR_NODE_MEMORY_SHARED_MERGE_ACROSS_NODES,
|
|
|
|
VIR_TYPED_PARAM_UINT, merge_across_nodes) < 0)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
break;
|
2012-09-14 14:42:16 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
#else
|
|
|
|
virReportError(VIR_ERR_NO_SUPPORT, "%s",
|
|
|
|
_("node get memory parameters not implemented"
|
|
|
|
" on this platform"));
|
|
|
|
return -1;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2012-10-25 20:44:32 +00:00
|
|
|
int
|
2015-07-06 21:49:04 +00:00
|
|
|
nodeGetCPUMap(const char *sysfs_prefix,
|
|
|
|
unsigned char **cpumap,
|
2012-10-25 20:44:32 +00:00
|
|
|
unsigned int *online,
|
|
|
|
unsigned int flags)
|
2012-10-16 14:05:14 +00:00
|
|
|
{
|
|
|
|
virBitmapPtr cpus = NULL;
|
|
|
|
int ret = -1;
|
|
|
|
int dummy;
|
|
|
|
|
|
|
|
virCheckFlags(0, -1);
|
|
|
|
|
2012-11-01 23:55:43 +00:00
|
|
|
if (!cpumap && !online)
|
2015-07-14 09:40:13 +00:00
|
|
|
return nodeGetCPUCount(sysfs_prefix);
|
2012-11-01 23:55:43 +00:00
|
|
|
|
2015-07-20 16:37:26 +00:00
|
|
|
if (!(cpus = nodeGetOnlineCPUBitmap(sysfs_prefix)))
|
2012-10-16 14:05:14 +00:00
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (cpumap && virBitmapToData(cpus, cpumap, &dummy) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
if (online)
|
|
|
|
*online = virBitmapCountBits(cpus);
|
|
|
|
|
2015-07-20 16:37:25 +00:00
|
|
|
ret = virBitmapSize(cpus);
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2012-10-16 14:05:14 +00:00
|
|
|
if (ret < 0 && cpumap)
|
|
|
|
VIR_FREE(*cpumap);
|
|
|
|
virBitmapFree(cpus);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2013-04-03 20:11:15 +00:00
|
|
|
static int
|
2015-07-14 09:40:13 +00:00
|
|
|
nodeCapsInitNUMAFake(const char *sysfs_prefix,
|
2015-07-07 21:22:28 +00:00
|
|
|
const char *cpupath ATTRIBUTE_UNUSED,
|
|
|
|
virCapsPtr caps ATTRIBUTE_UNUSED)
|
2013-04-03 20:11:15 +00:00
|
|
|
{
|
|
|
|
virNodeInfo nodeinfo;
|
|
|
|
virCapsHostNUMACellCPUPtr cpus;
|
|
|
|
int ncpus;
|
|
|
|
int s, c, t;
|
2015-05-26 16:40:34 +00:00
|
|
|
int id, cid;
|
|
|
|
int onlinecpus ATTRIBUTE_UNUSED;
|
2013-04-03 20:11:15 +00:00
|
|
|
|
2015-07-14 09:40:13 +00:00
|
|
|
if (nodeGetInfo(sysfs_prefix, &nodeinfo) < 0)
|
2013-04-03 20:11:15 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
ncpus = VIR_NODEINFO_MAXCPUS(nodeinfo);
|
2015-05-26 16:40:34 +00:00
|
|
|
onlinecpus = nodeinfo.cpus;
|
2013-04-03 20:11:15 +00:00
|
|
|
|
2013-07-04 10:20:00 +00:00
|
|
|
if (VIR_ALLOC_N(cpus, ncpus) < 0)
|
2013-04-03 20:11:15 +00:00
|
|
|
return -1;
|
|
|
|
|
2015-05-26 16:40:34 +00:00
|
|
|
id = cid = 0;
|
2013-05-21 08:08:42 +00:00
|
|
|
for (s = 0; s < nodeinfo.sockets; s++) {
|
|
|
|
for (c = 0; c < nodeinfo.cores; c++) {
|
|
|
|
for (t = 0; t < nodeinfo.threads; t++) {
|
2015-05-26 16:40:34 +00:00
|
|
|
#ifdef __linux__
|
2015-07-07 21:22:28 +00:00
|
|
|
if (virNodeGetCpuValue(cpupath, id, "online", 1)) {
|
2015-05-26 16:40:34 +00:00
|
|
|
#endif
|
|
|
|
cpus[cid].id = id;
|
|
|
|
cpus[cid].socket_id = s;
|
|
|
|
cpus[cid].core_id = c;
|
|
|
|
if (!(cpus[cid].siblings = virBitmapNew(ncpus)))
|
|
|
|
goto error;
|
|
|
|
ignore_value(virBitmapSetBit(cpus[cid].siblings, id));
|
|
|
|
cid++;
|
|
|
|
#ifdef __linux__
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2013-04-03 20:11:15 +00:00
|
|
|
id++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (virCapabilitiesAddHostNUMACell(caps, 0,
|
|
|
|
nodeinfo.memory,
|
2015-05-26 16:40:34 +00:00
|
|
|
#ifdef __linux__
|
|
|
|
onlinecpus, cpus,
|
|
|
|
#else
|
2014-06-03 13:18:27 +00:00
|
|
|
ncpus, cpus,
|
2015-05-26 16:40:34 +00:00
|
|
|
#endif
|
2014-06-06 16:12:51 +00:00
|
|
|
0, NULL,
|
2014-06-03 13:18:27 +00:00
|
|
|
0, NULL) < 0)
|
2013-04-03 20:11:15 +00:00
|
|
|
goto error;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
error:
|
2013-05-21 08:08:42 +00:00
|
|
|
for (; id >= 0; id--)
|
2013-04-03 20:11:15 +00:00
|
|
|
virBitmapFree(cpus[id].siblings);
|
|
|
|
VIR_FREE(cpus);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
2013-04-26 17:21:58 +00:00
|
|
|
nodeGetCellsFreeMemoryFake(unsigned long long *freeMems,
|
2013-04-03 20:11:15 +00:00
|
|
|
int startCell,
|
|
|
|
int maxCells ATTRIBUTE_UNUSED)
|
|
|
|
{
|
|
|
|
double avail = physmem_available();
|
|
|
|
|
|
|
|
if (startCell != 0) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("start cell %d out of range (0-%d)"),
|
|
|
|
startCell, 0);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
freeMems[0] = (unsigned long long)avail;
|
|
|
|
|
|
|
|
if (!freeMems[0]) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
|
|
|
|
_("Cannot determine free memory"));
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2014-06-16 12:02:34 +00:00
|
|
|
static int
|
|
|
|
nodeGetMemoryFake(unsigned long long *mem,
|
|
|
|
unsigned long long *freeMem)
|
2013-04-03 20:11:15 +00:00
|
|
|
{
|
2014-06-16 12:02:34 +00:00
|
|
|
int ret = -1;
|
|
|
|
|
2014-03-20 08:39:23 +00:00
|
|
|
#if defined(__FreeBSD__)
|
|
|
|
unsigned long pagesize = getpagesize();
|
|
|
|
u_int value;
|
|
|
|
size_t value_size = sizeof(value);
|
|
|
|
|
2014-06-16 12:02:34 +00:00
|
|
|
if (mem) {
|
|
|
|
if (sysctlbyname("vm.stats.vm.v_page_count", &value,
|
|
|
|
&value_size, NULL, 0) < 0) {
|
|
|
|
virReportSystemError(errno, "%s",
|
|
|
|
_("sysctl failed for vm.stats.vm.v_page_count"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
*mem = value * (unsigned long long)pagesize;
|
2014-03-20 08:39:23 +00:00
|
|
|
}
|
|
|
|
|
2014-06-16 12:02:34 +00:00
|
|
|
if (freeMem) {
|
|
|
|
if (sysctlbyname("vm.stats.vm.v_free_count", &value,
|
|
|
|
&value_size, NULL, 0) < 0) {
|
|
|
|
virReportSystemError(errno, "%s",
|
|
|
|
_("sysctl failed for vm.stats.vm.v_free_count"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
*freeMem = value * (unsigned long long)pagesize;
|
|
|
|
}
|
2014-03-20 08:39:23 +00:00
|
|
|
|
|
|
|
#else
|
2014-06-16 12:02:34 +00:00
|
|
|
if (mem) {
|
|
|
|
double total = physmem_total();
|
|
|
|
if (!total) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
|
|
|
|
_("Cannot determine free memory"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
2013-04-03 20:11:15 +00:00
|
|
|
|
2014-06-16 12:02:34 +00:00
|
|
|
*mem = (unsigned long long) total;
|
2013-04-03 20:11:15 +00:00
|
|
|
}
|
|
|
|
|
2014-06-16 12:02:34 +00:00
|
|
|
if (freeMem) {
|
|
|
|
double avail = physmem_available();
|
|
|
|
|
|
|
|
if (!avail) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
|
|
|
|
_("Cannot determine free memory"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
*freeMem = (unsigned long long) avail;
|
|
|
|
}
|
2014-03-20 08:39:23 +00:00
|
|
|
#endif
|
2014-06-16 12:02:34 +00:00
|
|
|
|
|
|
|
ret = 0;
|
|
|
|
cleanup:
|
|
|
|
return ret;
|
2013-04-03 20:11:15 +00:00
|
|
|
}
|
|
|
|
|
2013-01-18 22:06:55 +00:00
|
|
|
/* returns 1 on success, 0 if the detection failed and -1 on hard error */
|
|
|
|
static int
|
2015-07-07 21:22:28 +00:00
|
|
|
virNodeCapsFillCPUInfo(const char *cpupath ATTRIBUTE_UNUSED,
|
|
|
|
int cpu_id ATTRIBUTE_UNUSED,
|
2013-11-07 00:09:26 +00:00
|
|
|
virCapsHostNUMACellCPUPtr cpu ATTRIBUTE_UNUSED)
|
2013-01-18 22:06:55 +00:00
|
|
|
{
|
2013-11-07 00:09:26 +00:00
|
|
|
#ifdef __linux__
|
2013-01-18 22:06:55 +00:00
|
|
|
int tmp;
|
|
|
|
cpu->id = cpu_id;
|
|
|
|
|
2015-07-07 21:22:28 +00:00
|
|
|
if ((tmp = virNodeGetCpuValue(cpupath, cpu_id,
|
2013-01-18 22:06:55 +00:00
|
|
|
"topology/physical_package_id", -1)) < 0)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
cpu->socket_id = tmp;
|
|
|
|
|
2015-07-07 21:22:28 +00:00
|
|
|
if ((tmp = virNodeGetCpuValue(cpupath, cpu_id,
|
2013-01-18 22:06:55 +00:00
|
|
|
"topology/core_id", -1)) < 0)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
cpu->core_id = tmp;
|
|
|
|
|
2015-07-07 21:22:28 +00:00
|
|
|
if (!(cpu->siblings = virNodeGetSiblingsList(cpupath, cpu_id)))
|
2013-01-18 22:06:55 +00:00
|
|
|
return -1;
|
|
|
|
|
|
|
|
return 0;
|
2013-11-07 00:09:26 +00:00
|
|
|
#else
|
|
|
|
virReportError(VIR_ERR_NO_SUPPORT, "%s",
|
|
|
|
_("node cpu info not implemented on this platform"));
|
|
|
|
return -1;
|
|
|
|
#endif
|
2013-01-18 22:06:55 +00:00
|
|
|
}
|
|
|
|
|
2014-06-03 13:18:27 +00:00
|
|
|
static int
|
|
|
|
virNodeCapsGetSiblingInfo(int node,
|
|
|
|
virCapsHostNUMACellSiblingInfoPtr *siblings,
|
|
|
|
int *nsiblings)
|
|
|
|
{
|
|
|
|
virCapsHostNUMACellSiblingInfoPtr tmp = NULL;
|
|
|
|
int tmp_size = 0;
|
|
|
|
int ret = -1;
|
|
|
|
int *distances = NULL;
|
|
|
|
int ndistances = 0;
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
if (virNumaGetDistances(node, &distances, &ndistances) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (!distances) {
|
|
|
|
*siblings = NULL;
|
|
|
|
*nsiblings = 0;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (VIR_ALLOC_N(tmp, ndistances) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
for (i = 0; i < ndistances; i++) {
|
|
|
|
if (!distances[i])
|
|
|
|
continue;
|
|
|
|
|
|
|
|
tmp[tmp_size].node = i;
|
|
|
|
tmp[tmp_size].distance = distances[i];
|
|
|
|
tmp_size++;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (VIR_REALLOC_N(tmp, tmp_size) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
*siblings = tmp;
|
|
|
|
*nsiblings = tmp_size;
|
|
|
|
tmp = NULL;
|
|
|
|
tmp_size = 0;
|
|
|
|
ret = 0;
|
|
|
|
cleanup:
|
|
|
|
VIR_FREE(distances);
|
|
|
|
VIR_FREE(tmp);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2014-06-06 16:12:51 +00:00
|
|
|
static int
|
|
|
|
virNodeCapsGetPagesInfo(int node,
|
|
|
|
virCapsHostNUMACellPageInfoPtr *pageinfo,
|
|
|
|
int *npageinfo)
|
|
|
|
{
|
|
|
|
int ret = -1;
|
|
|
|
unsigned int *pages_size = NULL, *pages_avail = NULL;
|
|
|
|
size_t npages, i;
|
|
|
|
|
|
|
|
if (virNumaGetPages(node, &pages_size, &pages_avail, NULL, &npages) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (VIR_ALLOC_N(*pageinfo, npages) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
*npageinfo = npages;
|
|
|
|
|
|
|
|
for (i = 0; i < npages; i++) {
|
|
|
|
(*pageinfo)[i].size = pages_size[i];
|
|
|
|
(*pageinfo)[i].avail = pages_avail[i];
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = 0;
|
|
|
|
|
|
|
|
cleanup:
|
|
|
|
VIR_FREE(pages_avail);
|
|
|
|
VIR_FREE(pages_size);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
int
|
2015-07-07 21:22:28 +00:00
|
|
|
nodeCapsInitNUMA(const char *sysfs_prefix,
|
|
|
|
virCapsPtr caps)
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
{
|
2015-07-07 21:22:28 +00:00
|
|
|
const char *prefix = sysfs_prefix ? sysfs_prefix : SYSFS_SYSTEM_PATH;
|
|
|
|
char *cpupath;
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
int n;
|
2013-03-07 16:03:36 +00:00
|
|
|
unsigned long long memory;
|
2013-01-22 17:42:08 +00:00
|
|
|
virCapsHostNUMACellCPUPtr cpus = NULL;
|
2013-10-18 14:21:24 +00:00
|
|
|
virBitmapPtr cpumap = NULL;
|
2014-06-03 13:18:27 +00:00
|
|
|
virCapsHostNUMACellSiblingInfoPtr siblings = NULL;
|
2014-06-10 22:23:09 +00:00
|
|
|
int nsiblings = 0;
|
2014-06-06 16:12:51 +00:00
|
|
|
virCapsHostNUMACellPageInfoPtr pageinfo = NULL;
|
|
|
|
int npageinfo;
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
int ret = -1;
|
2013-01-22 17:42:08 +00:00
|
|
|
int ncpus = 0;
|
2013-10-18 14:21:24 +00:00
|
|
|
int cpu;
|
2013-01-18 22:06:55 +00:00
|
|
|
bool topology_failed = false;
|
2013-10-17 15:42:22 +00:00
|
|
|
int max_node;
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
|
2015-07-07 21:22:28 +00:00
|
|
|
if (virAsprintf(&cpupath, "%s/cpu", prefix) < 0)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (!virNumaIsAvailable()) {
|
2015-07-14 09:40:13 +00:00
|
|
|
ret = nodeCapsInitNUMAFake(sysfs_prefix, cpupath, caps);
|
2015-07-07 21:22:28 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
|
2013-10-17 15:42:22 +00:00
|
|
|
if ((max_node = virNumaGetMaxNode()) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
for (n = 0; n <= max_node; n++) {
|
Convert 'int i' to 'size_t i' in src/node_device/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 14:09:33 +00:00
|
|
|
size_t i;
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
|
2013-10-18 14:21:24 +00:00
|
|
|
if ((ncpus = virNumaGetNodeCPUs(n, &cpumap)) < 0) {
|
|
|
|
if (ncpus == -2)
|
|
|
|
continue;
|
2013-03-07 16:03:36 +00:00
|
|
|
|
2013-10-18 14:21:24 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
|
|
|
|
if (VIR_ALLOC_N(cpus, ncpus) < 0)
|
|
|
|
goto cleanup;
|
2013-10-18 14:21:24 +00:00
|
|
|
cpu = 0;
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
|
2013-10-18 14:21:24 +00:00
|
|
|
for (i = 0; i < virBitmapSize(cpumap); i++) {
|
2015-03-11 15:41:57 +00:00
|
|
|
if (virBitmapIsBitSet(cpumap, i)) {
|
2015-07-07 21:22:28 +00:00
|
|
|
if (virNodeCapsFillCPUInfo(cpupath, i, cpus + cpu++) < 0) {
|
2013-01-18 22:06:55 +00:00
|
|
|
topology_failed = true;
|
|
|
|
virResetLastError();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
|
2014-06-03 13:18:27 +00:00
|
|
|
if (virNodeCapsGetSiblingInfo(n, &siblings, &nsiblings) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
2014-06-06 16:12:51 +00:00
|
|
|
if (virNodeCapsGetPagesInfo(n, &pageinfo, &npageinfo) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
2013-10-18 14:21:24 +00:00
|
|
|
/* Detect the amount of memory in the numa cell in KiB */
|
|
|
|
virNumaGetNodeMemory(n, &memory, NULL);
|
|
|
|
memory >>= 10;
|
|
|
|
|
2014-06-03 13:18:27 +00:00
|
|
|
if (virCapabilitiesAddHostNUMACell(caps, n, memory,
|
|
|
|
ncpus, cpus,
|
2014-06-06 16:12:51 +00:00
|
|
|
nsiblings, siblings,
|
|
|
|
npageinfo, pageinfo) < 0)
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
goto cleanup;
|
2013-10-18 14:21:24 +00:00
|
|
|
|
|
|
|
cpus = NULL;
|
2014-06-03 13:18:27 +00:00
|
|
|
siblings = NULL;
|
2014-06-06 16:12:51 +00:00
|
|
|
pageinfo = NULL;
|
2014-08-20 13:59:25 +00:00
|
|
|
virBitmapFree(cpumap);
|
|
|
|
cpumap = NULL;
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
ret = 0;
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2014-09-04 21:00:30 +00:00
|
|
|
if ((topology_failed || ret < 0) && cpus)
|
2013-01-18 22:06:55 +00:00
|
|
|
virCapabilitiesClearHostNUMACellCPUTopology(cpus, ncpus);
|
|
|
|
|
2013-10-18 14:21:24 +00:00
|
|
|
virBitmapFree(cpumap);
|
|
|
|
VIR_FREE(cpus);
|
2014-06-03 13:18:27 +00:00
|
|
|
VIR_FREE(siblings);
|
2014-06-06 16:12:51 +00:00
|
|
|
VIR_FREE(pageinfo);
|
2015-07-07 21:22:28 +00:00
|
|
|
VIR_FREE(cpupath);
|
make NUMA-initialization code more portable and more robust
qemudCapsInitNUMA and umlCapsInitNUMA were identical, so this change
factors them into a new function, virCapsInitNUMA, and puts it in
nodeinfo.c.
In addition to factoring out the duplicates, this change also
adjusts that function definition (along with its macros) so
that it works with Fedora 9's numactl version 1, and makes it
so the code will work even if someone builds the kernel with
CONFIG_NR_CPUS > 4096.
Finally, also perform this NUMA initialization for the lxc
and openvz drivers.
* src/nodeinfo.c: Include <stdint.h>, <numa.h> and "memory.h".
(virCapsInitNUMA): Rename from qemudCapsInitNUMA and umlCapsInitNUMA.
(NUMA_MAX_N_CPUS): Define depending on NUMA API version.
(n_bits, MASK_CPU_ISSET): Define, adjust, use uint64 rather than long.
* src/nodeinfo.h: Include "capabilities.h".
(virCapsInitNUMA): Declare it.
* examples/domain-events/events-c/Makefile.am:
* src/Makefile.am: Add $(NUMACTL_CFLAGS) and $(NUMACTL_LIBS) to various
compile/link-related variables.
* src/qemu_conf.c: Include "nodeinfo.h".
(qemudCapsInitNUMA): Remove duplicate code. Adjust caller.
* src/uml_conf.c (umlCapsInitNUMA): Likewise.
Include "nodeinfo.h".
* src/lxc_conf.c: Include "nodeinfo.h".
(lxcCapsInit): Perform NUMA initialization here, too.
* src/openvz_conf.c (openvzCapsInit): And here.
Include "nodeinfo.h".
* src/libvirt_sym.version.in: Add virCapsInitNUMA so that libvirtd
can link to this function.
2008-12-21 18:55:09 +00:00
|
|
|
return ret;
|
|
|
|
}
|
2009-06-03 13:28:02 +00:00
|
|
|
|
|
|
|
|
|
|
|
int
|
2013-04-26 17:21:58 +00:00
|
|
|
nodeGetCellsFreeMemory(unsigned long long *freeMems,
|
2009-06-03 13:28:02 +00:00
|
|
|
int startCell,
|
|
|
|
int maxCells)
|
|
|
|
{
|
2013-10-17 16:30:09 +00:00
|
|
|
unsigned long long mem;
|
2009-06-03 13:28:02 +00:00
|
|
|
int n, lastCell, numCells;
|
|
|
|
int ret = -1;
|
|
|
|
int maxCell;
|
|
|
|
|
2013-10-17 14:57:29 +00:00
|
|
|
if (!virNumaIsAvailable())
|
2013-04-26 17:21:58 +00:00
|
|
|
return nodeGetCellsFreeMemoryFake(freeMems,
|
2013-04-03 20:11:15 +00:00
|
|
|
startCell, maxCells);
|
|
|
|
|
2013-10-17 15:42:22 +00:00
|
|
|
if ((maxCell = virNumaGetMaxNode()) < 0)
|
|
|
|
return 0;
|
|
|
|
|
2009-06-03 13:28:02 +00:00
|
|
|
if (startCell > maxCell) {
|
2012-07-18 18:19:23 +00:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("start cell %d out of range (0-%d)"),
|
|
|
|
startCell, maxCell);
|
2009-06-03 13:28:02 +00:00
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
lastCell = startCell + maxCells - 1;
|
|
|
|
if (lastCell > maxCell)
|
|
|
|
lastCell = maxCell;
|
|
|
|
|
2013-05-21 08:08:42 +00:00
|
|
|
for (numCells = 0, n = startCell; n <= lastCell; n++) {
|
2013-10-17 16:30:09 +00:00
|
|
|
virNumaGetNodeMemory(n, NULL, &mem);
|
2013-07-08 14:03:05 +00:00
|
|
|
|
2009-06-03 13:28:02 +00:00
|
|
|
freeMems[numCells++] = mem;
|
|
|
|
}
|
|
|
|
ret = numCells;
|
|
|
|
|
2014-03-25 06:57:22 +00:00
|
|
|
cleanup:
|
2009-06-03 13:28:02 +00:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2014-06-16 12:02:34 +00:00
|
|
|
int
|
|
|
|
nodeGetMemory(unsigned long long *mem,
|
|
|
|
unsigned long long *freeMem)
|
2009-06-03 13:28:02 +00:00
|
|
|
{
|
2013-10-17 15:42:22 +00:00
|
|
|
int max_node;
|
2009-06-03 13:28:02 +00:00
|
|
|
int n;
|
|
|
|
|
2014-06-16 12:02:34 +00:00
|
|
|
if (mem)
|
|
|
|
*mem = 0;
|
|
|
|
|
|
|
|
if (freeMem)
|
|
|
|
*freeMem = 0;
|
|
|
|
|
2013-10-17 14:57:29 +00:00
|
|
|
if (!virNumaIsAvailable())
|
2014-06-16 12:02:34 +00:00
|
|
|
return nodeGetMemoryFake(mem, freeMem);
|
2013-04-03 20:11:15 +00:00
|
|
|
|
2013-10-17 15:42:22 +00:00
|
|
|
if ((max_node = virNumaGetMaxNode()) < 0)
|
2014-06-16 12:02:34 +00:00
|
|
|
return -1;
|
2009-06-03 13:28:02 +00:00
|
|
|
|
2013-10-17 15:42:22 +00:00
|
|
|
for (n = 0; n <= max_node; n++) {
|
2014-06-16 12:02:34 +00:00
|
|
|
unsigned long long tmp_mem = 0, tmp_freeMem = 0;
|
|
|
|
|
|
|
|
if (!virNumaNodeIsAvailable(n))
|
|
|
|
continue;
|
|
|
|
|
|
|
|
if (virNumaGetNodeMemory(n, &tmp_mem, &tmp_freeMem) < 0)
|
|
|
|
return -1;
|
2013-07-08 14:03:05 +00:00
|
|
|
|
2014-06-16 12:02:34 +00:00
|
|
|
if (mem)
|
|
|
|
*mem += tmp_mem;
|
|
|
|
|
|
|
|
if (freeMem)
|
|
|
|
*freeMem += tmp_freeMem;
|
2009-06-03 13:28:02 +00:00
|
|
|
}
|
|
|
|
|
2014-06-16 12:02:34 +00:00
|
|
|
return 0;
|
2009-06-03 13:28:02 +00:00
|
|
|
}
|
2014-06-10 14:16:44 +00:00
|
|
|
|
|
|
|
int
|
|
|
|
nodeGetFreePages(unsigned int npages,
|
|
|
|
unsigned int *pages,
|
|
|
|
int startCell,
|
|
|
|
unsigned int cellCount,
|
|
|
|
unsigned long long *counts)
|
|
|
|
{
|
|
|
|
int ret = -1;
|
2014-09-22 10:14:27 +00:00
|
|
|
int cell, lastCell;
|
2014-06-10 14:16:44 +00:00
|
|
|
size_t i, ncounts = 0;
|
|
|
|
|
2014-09-22 10:14:27 +00:00
|
|
|
if ((lastCell = virNumaGetMaxNode()) < 0)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
if (startCell > lastCell) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("start cell %d out of range (0-%d)"),
|
|
|
|
startCell, lastCell);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
2014-09-24 13:10:18 +00:00
|
|
|
lastCell = MIN(lastCell, startCell + (int) cellCount - 1);
|
2014-09-22 10:14:27 +00:00
|
|
|
|
2014-09-24 05:45:30 +00:00
|
|
|
for (cell = startCell; cell <= lastCell; cell++) {
|
2014-06-10 14:16:44 +00:00
|
|
|
for (i = 0; i < npages; i++) {
|
|
|
|
unsigned int page_size = pages[i];
|
|
|
|
unsigned int page_free;
|
|
|
|
|
2014-06-23 13:04:11 +00:00
|
|
|
if (virNumaGetPageInfo(cell, page_size, 0, NULL, &page_free) < 0)
|
2014-06-10 14:16:44 +00:00
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
counts[ncounts++] = page_free;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!ncounts) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
|
|
|
|
_("no suitable info found"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = ncounts;
|
|
|
|
cleanup:
|
|
|
|
return ret;
|
|
|
|
}
|
2014-09-18 07:47:07 +00:00
|
|
|
|
|
|
|
int
|
|
|
|
nodeAllocPages(unsigned int npages,
|
|
|
|
unsigned int *pageSizes,
|
|
|
|
unsigned long long *pageCounts,
|
|
|
|
int startCell,
|
|
|
|
unsigned int cellCount,
|
|
|
|
bool add)
|
|
|
|
{
|
|
|
|
int ret = -1;
|
|
|
|
int cell, lastCell;
|
|
|
|
size_t i, ncounts = 0;
|
|
|
|
|
|
|
|
if ((lastCell = virNumaGetMaxNode()) < 0)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
if (startCell > lastCell) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("start cell %d out of range (0-%d)"),
|
|
|
|
startCell, lastCell);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
lastCell = MIN(lastCell, startCell + (int) cellCount - 1);
|
|
|
|
|
|
|
|
for (cell = startCell; cell <= lastCell; cell++) {
|
|
|
|
for (i = 0; i < npages; i++) {
|
|
|
|
unsigned int page_size = pageSizes[i];
|
|
|
|
unsigned long long page_count = pageCounts[i];
|
|
|
|
|
|
|
|
if (virNumaSetPagePoolSize(cell, page_size, page_count, add) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
ncounts++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = ncounts;
|
|
|
|
cleanup:
|
|
|
|
return ret;
|
|
|
|
}
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
|
2015-08-03 15:02:39 +00:00
|
|
|
#if HAVE_LINUX_KVM_H && defined(KVM_CAP_PPC_SMT)
|
|
|
|
|
nodeinfo: Fix output on PPC64 KVM hosts
The nodeinfo is reporting incorrect number of cpus and incorrect host
topology on PPC64 KVM hosts. The KVM hypervisor on PPC64 needs only
the primary thread in a core to be online, and the secondaries offlined.
While scheduling a guest in, the kvm scheduler wakes up the secondaries to
run in guest context.
The host scheduling of the guests happen at the core level(as only primary
thread is online). The kvm scheduler exploits as many threads of the core
as needed by guest. Further, starting POWER8, the processor allows splitting
a physical core into multiple subcores with 2 or 4 threads each. Again, only
the primary thread in a subcore is online in the host. The KVM-PPC
scheduler allows guests to exploit all the offline threads in the subcore,
by bringing them online when needed.
(Kernel patches on split-core http://www.spinics.net/lists/kvm-ppc/msg09121.html)
Recently with dynamic micro-threading changes in ppc-kvm, makes sure
to utilize all the offline cpus across guests, and across guests with
different cpu topologies.
(https://www.mail-archive.com/kvm@vger.kernel.org/msg115978.html)
Since the offline cpus are brought online in the guest context, it is safe
to count them as online. Nodeinfo today discounts these offline cpus from
cpu count/topology calclulation, and the nodeinfo output is not of any help
and the host appears overcommited when it is actually not.
The patch carefully counts those offline threads whose primary threads are
online. The host topology displayed by the nodeinfo is also fixed when the
host is in valid kvm state.
Signed-off-by: Shivaprasad G Bhat <sbhat@linux.vnet.ibm.com>
Signed-off-by: Andrea Bolognani <abologna@redhat.com>
2015-07-30 09:37:04 +00:00
|
|
|
/* Get the number of threads per subcore.
|
|
|
|
*
|
|
|
|
* This will be 2, 4 or 8 on POWER hosts, depending on the current
|
|
|
|
* micro-threading configuration, and 0 everywhere else.
|
|
|
|
*
|
|
|
|
* Returns the number of threads per subcore if subcores are in use, zero
|
|
|
|
* if subcores are not in use, and a negative value on error */
|
|
|
|
int
|
|
|
|
nodeGetThreadsPerSubcore(virArch arch)
|
|
|
|
{
|
|
|
|
int threads_per_subcore = 0;
|
|
|
|
const char *kvmpath = "/dev/kvm";
|
|
|
|
int kvmfd;
|
|
|
|
|
|
|
|
if (ARCH_IS_PPC64(arch)) {
|
|
|
|
|
|
|
|
/* It's okay if /dev/kvm doesn't exist, because
|
|
|
|
* a. we might be running in a guest
|
|
|
|
* b. the kvm module might not be installed or enabled
|
|
|
|
* In either case, falling back to the subcore-unaware thread
|
|
|
|
* counting logic is the right thing to do */
|
|
|
|
if (!virFileExists(kvmpath))
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
if ((kvmfd = open(kvmpath, O_RDONLY)) < 0) {
|
|
|
|
/* This can happen when running as a regular user if
|
|
|
|
* permissions are tight enough, in which case erroring out
|
|
|
|
* is better than silently falling back and reporting
|
|
|
|
* different nodeinfo depending on the user */
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("Failed to open '%s'"),
|
|
|
|
kvmpath);
|
|
|
|
threads_per_subcore = -1;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* For Phyp and KVM based guests the ioctl for KVM_CAP_PPC_SMT
|
|
|
|
* returns zero and both primary and secondary threads will be
|
|
|
|
* online */
|
|
|
|
threads_per_subcore = ioctl(kvmfd,
|
|
|
|
KVM_CHECK_EXTENSION,
|
|
|
|
KVM_CAP_PPC_SMT);
|
|
|
|
|
|
|
|
VIR_FORCE_CLOSE(kvmfd);
|
|
|
|
}
|
|
|
|
|
|
|
|
out:
|
|
|
|
return threads_per_subcore;
|
|
|
|
}
|
2015-08-03 15:02:39 +00:00
|
|
|
|
|
|
|
#else
|
|
|
|
|
|
|
|
/* Fallback for nodeGetThreadsPerSubcore() used when KVM headers
|
|
|
|
* are not available on the system */
|
|
|
|
int
|
|
|
|
nodeGetThreadsPerSubcore(virArch arch ATTRIBUTE_UNUSED)
|
|
|
|
{
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
#endif /* HAVE_LINUX_KVM_H && defined(KVM_CAP_PPC_SMT) */
|