2007-07-19 16:22:40 +00:00
|
|
|
/*
|
2012-12-13 17:44:57 +00:00
|
|
|
* virutil.c: common, generic utility functions
|
2007-07-19 16:22:40 +00:00
|
|
|
*
|
2014-03-18 09:14:35 +01:00
|
|
|
* Copyright (C) 2006-2014 Red Hat, Inc.
|
2007-07-19 16:22:40 +00:00
|
|
|
* Copyright (C) 2006 Daniel P. Berrange
|
|
|
|
* Copyright (C) 2006, 2007 Binary Karma
|
|
|
|
* Copyright (C) 2006 Shuveb Hussain
|
|
|
|
*
|
|
|
|
* This library is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This library is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Lesser General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Lesser General Public
|
2012-09-20 16:30:55 -06:00
|
|
|
* License along with this library. If not, see
|
2012-07-21 18:06:23 +08:00
|
|
|
* <http://www.gnu.org/licenses/>.
|
2007-07-19 16:22:40 +00:00
|
|
|
*/
|
|
|
|
|
2008-01-29 18:15:54 +00:00
|
|
|
#include <config.h>
|
2007-12-03 16:19:41 +00:00
|
|
|
|
2007-07-19 16:22:40 +00:00
|
|
|
#include <unistd.h>
|
|
|
|
#include <fcntl.h>
|
2008-11-05 18:57:42 +00:00
|
|
|
#include <poll.h>
|
2007-12-03 14:30:46 +00:00
|
|
|
#include <sys/stat.h>
|
2016-04-14 15:11:45 +02:00
|
|
|
|
|
|
|
#ifdef MAJOR_IN_MKDEV
|
|
|
|
# include <sys/mkdev.h>
|
|
|
|
#elif MAJOR_IN_SYSMACROS
|
|
|
|
# include <sys/sysmacros.h>
|
|
|
|
#endif
|
|
|
|
|
Make sure sys/types.h is included after sys/sysmacros.h
In the latest glibc, major() and minor() functions are marked as
deprecated (glibc commit dbab6577):
CC util/libvirt_util_la-vircgroup.lo
util/vircgroup.c: In function 'virCgroupGetBlockDevString':
util/vircgroup.c:768:5: error: '__major_from_sys_types' is deprecated:
In the GNU C Library, `major' is defined by <sys/sysmacros.h>.
For historical compatibility, it is currently defined by
<sys/types.h> as well, but we plan to remove this soon.
To use `major', include <sys/sysmacros.h> directly.
If you did not intend to use a system-defined macro `major',
you should #undef it after including <sys/types.h>.
[-Werror=deprecated-declarations]
if (virAsprintf(&ret, "%d:%d ", major(sb.st_rdev), minor(sb.st_rdev)) < 0)
^~
In file included from /usr/include/features.h:397:0,
from /usr/include/bits/libc-header-start.h:33,
from /usr/include/stdio.h:28,
from ../gnulib/lib/stdio.h:43,
from util/vircgroup.c:26:
/usr/include/sys/sysmacros.h:87:1: note: declared here
__SYSMACROS_DEFINE_MAJOR (__SYSMACROS_FST_IMPL_TEMPL)
^
Moreover, in the glibc commit, there's suggestion to keep
ordering of including of header files as implemented here.
Signed-off-by: Michal Privoznik <mprivozn@redhat.com>
2016-09-06 14:20:04 +02:00
|
|
|
#include <sys/types.h>
|
2010-09-22 12:08:58 -06:00
|
|
|
#include <termios.h>
|
2011-11-03 14:56:13 -06:00
|
|
|
|
2016-12-12 13:33:42 +01:00
|
|
|
#if WITH_DEVMAPPER
|
2011-02-18 12:00:47 -07:00
|
|
|
# include <libdevmapper.h>
|
|
|
|
#endif
|
2007-12-03 16:19:41 +00:00
|
|
|
|
2009-01-07 10:43:16 +00:00
|
|
|
#include <netdb.h>
|
2009-01-22 19:41:48 +00:00
|
|
|
#ifdef HAVE_GETPWUID_R
|
2010-03-09 19:22:22 +01:00
|
|
|
# include <pwd.h>
|
|
|
|
# include <grp.h>
|
2009-01-22 19:41:48 +00:00
|
|
|
#endif
|
2012-09-20 15:17:56 +01:00
|
|
|
#if WITH_CAPNG
|
2010-03-09 19:22:22 +01:00
|
|
|
# include <cap-ng.h>
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
# include <sys/prctl.h>
|
2009-06-29 17:00:52 +00:00
|
|
|
#endif
|
2007-12-07 14:45:39 +00:00
|
|
|
|
2012-05-24 14:37:54 +01:00
|
|
|
#ifdef WIN32
|
2012-06-21 14:37:34 +01:00
|
|
|
# ifdef HAVE_WINSOCK2_H
|
|
|
|
# include <winsock2.h>
|
|
|
|
# endif
|
2012-05-24 14:37:54 +01:00
|
|
|
# include <windows.h>
|
|
|
|
# include <shlobj.h>
|
|
|
|
#endif
|
|
|
|
|
2018-01-19 13:48:10 +00:00
|
|
|
#ifdef HAVE_SYS_UN_H
|
|
|
|
# include <sys/un.h>
|
|
|
|
#endif
|
|
|
|
|
2013-05-21 17:47:48 -06:00
|
|
|
#include "mgetgroups.h"
|
2012-12-13 18:21:53 +00:00
|
|
|
#include "virerror.h"
|
2012-12-12 17:59:27 +00:00
|
|
|
#include "virlog.h"
|
2012-12-04 12:04:07 +00:00
|
|
|
#include "virbuffer.h"
|
2012-12-12 18:06:53 +00:00
|
|
|
#include "viralloc.h"
|
2010-04-28 21:36:03 -06:00
|
|
|
#include "verify.h"
|
2013-05-09 14:59:04 -04:00
|
|
|
#include "virfile.h"
|
|
|
|
#include "vircommand.h"
|
|
|
|
#include "nonblocking.h"
|
|
|
|
#include "virprocess.h"
|
|
|
|
#include "virstring.h"
|
|
|
|
#include "virutil.h"
|
2007-12-03 14:30:46 +00:00
|
|
|
|
2013-05-09 14:59:04 -04:00
|
|
|
verify(sizeof(gid_t) <= sizeof(unsigned int) &&
|
|
|
|
sizeof(uid_t) <= sizeof(unsigned int));
|
2011-07-06 15:39:21 +02:00
|
|
|
|
2013-05-09 14:59:04 -04:00
|
|
|
#define VIR_FROM_THIS VIR_FROM_NONE
|
2011-07-06 15:39:21 +02:00
|
|
|
|
2014-02-28 12:16:17 +00:00
|
|
|
VIR_LOG_INIT("util.util");
|
|
|
|
|
2013-05-09 14:59:04 -04:00
|
|
|
#ifndef WIN32
|
2007-12-03 14:30:46 +00:00
|
|
|
|
2014-03-18 09:14:35 +01:00
|
|
|
int virSetInherit(int fd, bool inherit)
|
|
|
|
{
|
2013-05-09 14:59:04 -04:00
|
|
|
int fflags;
|
|
|
|
if ((fflags = fcntl(fd, F_GETFD)) < 0)
|
2011-07-05 23:02:53 +02:00
|
|
|
return -1;
|
2013-05-09 14:59:04 -04:00
|
|
|
if (inherit)
|
|
|
|
fflags &= ~FD_CLOEXEC;
|
|
|
|
else
|
|
|
|
fflags |= FD_CLOEXEC;
|
|
|
|
if ((fcntl(fd, F_SETFD, fflags)) < 0)
|
2011-07-05 23:02:53 +02:00
|
|
|
return -1;
|
2007-12-03 14:30:46 +00:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2013-05-09 14:59:04 -04:00
|
|
|
#else /* WIN32 */
|
2012-07-10 19:24:04 +08:00
|
|
|
|
2019-10-14 14:45:33 +02:00
|
|
|
int virSetInherit(int fd G_GNUC_UNUSED, bool inherit G_GNUC_UNUSED)
|
2010-01-26 14:47:02 +01:00
|
|
|
{
|
2013-05-09 14:59:04 -04:00
|
|
|
/* FIXME: Currently creating child processes is not supported on
|
|
|
|
* Win32, so there is no point in failing calls that are only relevant
|
|
|
|
* when creating child processes. So just pretend that we changed the
|
|
|
|
* inheritance property of the given fd as requested. */
|
|
|
|
return 0;
|
2010-01-26 14:47:02 +01:00
|
|
|
}
|
|
|
|
|
2013-05-09 14:59:04 -04:00
|
|
|
#endif /* WIN32 */
|
2011-04-03 11:21:14 +02:00
|
|
|
|
2014-03-18 09:14:35 +01:00
|
|
|
int virSetBlocking(int fd, bool blocking)
|
|
|
|
{
|
2013-05-09 14:59:04 -04:00
|
|
|
return set_nonblocking_flag(fd, !blocking);
|
2007-12-03 14:30:46 +00:00
|
|
|
}
|
|
|
|
|
2014-03-18 09:14:35 +01:00
|
|
|
int virSetNonBlock(int fd)
|
|
|
|
{
|
2013-05-09 14:59:04 -04:00
|
|
|
return virSetBlocking(fd, false);
|
2011-10-20 10:02:27 +01:00
|
|
|
}
|
2008-08-13 10:52:15 +00:00
|
|
|
|
2013-05-09 14:59:04 -04:00
|
|
|
int virSetCloseExec(int fd)
|
2012-05-24 14:37:54 +01:00
|
|
|
{
|
2013-05-09 14:59:04 -04:00
|
|
|
return virSetInherit(fd, false);
|
2012-05-24 14:37:54 +01:00
|
|
|
}
|
|
|
|
|
2014-04-25 17:47:08 +01:00
|
|
|
#ifdef WIN32
|
2019-10-14 14:45:33 +02:00
|
|
|
int virSetSockReuseAddr(int fd G_GNUC_UNUSED, bool fatal G_GNUC_UNUSED)
|
2014-04-25 17:47:08 +01:00
|
|
|
{
|
|
|
|
/*
|
|
|
|
* SO_REUSEADDR on Windows is actually akin to SO_REUSEPORT
|
|
|
|
* on Linux/BSD. ie it allows 2 apps to listen to the same
|
|
|
|
* port at once which is certainly not what we want here.
|
|
|
|
*
|
|
|
|
* Win32 sockets have Linux/BSD-like SO_REUSEADDR behaviour
|
|
|
|
* by default, so we can be a no-op.
|
|
|
|
*
|
|
|
|
* http://msdn.microsoft.com/en-us/library/windows/desktop/ms740621.aspx
|
|
|
|
*/
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
#else
|
2014-09-07 17:05:03 +02:00
|
|
|
int virSetSockReuseAddr(int fd, bool fatal)
|
2014-04-25 17:47:08 +01:00
|
|
|
{
|
|
|
|
int opt = 1;
|
2014-09-07 17:05:03 +02:00
|
|
|
int ret = setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, &opt, sizeof(opt));
|
|
|
|
|
|
|
|
if (ret < 0 && fatal) {
|
|
|
|
virReportSystemError(errno, "%s",
|
|
|
|
_("Unable to set socket reuse addr flag"));
|
|
|
|
}
|
|
|
|
|
|
|
|
return ret;
|
2014-04-25 17:47:08 +01:00
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2010-05-20 11:41:31 -04:00
|
|
|
|
2010-08-27 23:13:45 +02:00
|
|
|
/* Convert C from hexadecimal character to integer. */
|
|
|
|
int
|
|
|
|
virHexToBin(unsigned char c)
|
|
|
|
{
|
|
|
|
switch (c) {
|
|
|
|
default: return c - '0';
|
|
|
|
case 'a': case 'A': return 10;
|
|
|
|
case 'b': case 'B': return 11;
|
|
|
|
case 'c': case 'C': return 12;
|
|
|
|
case 'd': case 'D': return 13;
|
|
|
|
case 'e': case 'E': return 14;
|
|
|
|
case 'f': case 'F': return 15;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2012-03-05 09:28:59 -07:00
|
|
|
/* Scale an integer VALUE in-place by an optional case-insensitive
|
|
|
|
* SUFFIX, defaulting to SCALE if suffix is NULL or empty (scale is
|
|
|
|
* typically 1 or 1024). Recognized suffixes include 'b' or 'bytes',
|
|
|
|
* as well as power-of-two scaling via binary abbreviations ('KiB',
|
|
|
|
* 'MiB', ...) or their one-letter counterpart ('k', 'M', ...), and
|
|
|
|
* power-of-ten scaling via SI abbreviations ('KB', 'MB', ...).
|
|
|
|
* Ensure that the result does not exceed LIMIT. Return 0 on success,
|
|
|
|
* -1 with error message raised on failure. */
|
|
|
|
int
|
|
|
|
virScaleInteger(unsigned long long *value, const char *suffix,
|
|
|
|
unsigned long long scale, unsigned long long limit)
|
|
|
|
{
|
|
|
|
if (!suffix || !*suffix) {
|
|
|
|
if (!scale) {
|
2012-07-18 11:26:24 +01:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("invalid scale %llu"), scale);
|
2012-03-05 09:28:59 -07:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
suffix = "";
|
|
|
|
} else if (STRCASEEQ(suffix, "b") || STRCASEEQ(suffix, "byte") ||
|
|
|
|
STRCASEEQ(suffix, "bytes")) {
|
|
|
|
scale = 1;
|
|
|
|
} else {
|
|
|
|
int base;
|
|
|
|
|
|
|
|
if (!suffix[1] || STRCASEEQ(suffix + 1, "iB")) {
|
|
|
|
base = 1024;
|
2019-11-18 15:15:31 +01:00
|
|
|
} else if (g_ascii_tolower(suffix[1]) == 'b' && !suffix[2]) {
|
2012-03-05 09:28:59 -07:00
|
|
|
base = 1000;
|
|
|
|
} else {
|
2012-07-18 11:26:24 +01:00
|
|
|
virReportError(VIR_ERR_INVALID_ARG,
|
2018-09-19 16:38:14 +08:00
|
|
|
_("unknown suffix '%s'"), suffix);
|
2012-03-05 09:28:59 -07:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
scale = 1;
|
2019-11-18 15:15:31 +01:00
|
|
|
switch (g_ascii_tolower(*suffix)) {
|
2012-03-05 09:28:59 -07:00
|
|
|
case 'e':
|
|
|
|
scale *= base;
|
2019-10-15 13:38:21 +02:00
|
|
|
G_GNUC_FALLTHROUGH;
|
2012-03-05 09:28:59 -07:00
|
|
|
case 'p':
|
|
|
|
scale *= base;
|
2019-10-15 13:38:21 +02:00
|
|
|
G_GNUC_FALLTHROUGH;
|
2012-03-05 09:28:59 -07:00
|
|
|
case 't':
|
|
|
|
scale *= base;
|
2019-10-15 13:38:21 +02:00
|
|
|
G_GNUC_FALLTHROUGH;
|
2012-03-05 09:28:59 -07:00
|
|
|
case 'g':
|
|
|
|
scale *= base;
|
2019-10-15 13:38:21 +02:00
|
|
|
G_GNUC_FALLTHROUGH;
|
2012-03-05 09:28:59 -07:00
|
|
|
case 'm':
|
|
|
|
scale *= base;
|
2019-10-15 13:38:21 +02:00
|
|
|
G_GNUC_FALLTHROUGH;
|
2012-03-05 09:28:59 -07:00
|
|
|
case 'k':
|
|
|
|
scale *= base;
|
|
|
|
break;
|
|
|
|
default:
|
2012-07-18 11:26:24 +01:00
|
|
|
virReportError(VIR_ERR_INVALID_ARG,
|
|
|
|
_("unknown suffix '%s'"), suffix);
|
2012-03-05 09:28:59 -07:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-03-05 23:13:21 +08:00
|
|
|
if (*value && *value > (limit / scale)) {
|
2012-07-18 11:26:24 +01:00
|
|
|
virReportError(VIR_ERR_OVERFLOW, _("value too large: %llu%s"),
|
|
|
|
*value, suffix);
|
2012-03-05 09:28:59 -07:00
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
*value *= scale;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2011-06-29 11:47:08 -06:00
|
|
|
|
2010-03-30 16:15:13 +02:00
|
|
|
/**
|
|
|
|
* virParseVersionString:
|
|
|
|
* @str: const char pointer to the version string
|
|
|
|
* @version: unsigned long pointer to output the version number
|
2011-07-01 07:23:02 -06:00
|
|
|
* @allowMissing: true to treat 3 like 3.0.0, false to error out on
|
|
|
|
* missing minor or micro
|
2010-03-30 16:15:13 +02:00
|
|
|
*
|
|
|
|
* Parse an unsigned version number from a version string. Expecting
|
|
|
|
* 'major.minor.micro' format, ignoring an optional suffix.
|
|
|
|
*
|
|
|
|
* The major, minor and micro numbers are encoded into a single version number:
|
|
|
|
*
|
|
|
|
* 1000000 * major + 1000 * minor + micro
|
|
|
|
*
|
|
|
|
* Returns the 0 for success, -1 for error.
|
|
|
|
*/
|
|
|
|
int
|
2011-07-01 07:23:02 -06:00
|
|
|
virParseVersionString(const char *str, unsigned long *version,
|
|
|
|
bool allowMissing)
|
2010-03-30 16:15:13 +02:00
|
|
|
{
|
2011-07-01 06:40:21 -04:00
|
|
|
unsigned int major, minor = 0, micro = 0;
|
2010-03-30 16:15:13 +02:00
|
|
|
char *tmp;
|
|
|
|
|
2011-07-01 06:40:21 -04:00
|
|
|
if (virStrToLong_ui(str, &tmp, 10, &major) < 0)
|
2010-03-30 16:15:13 +02:00
|
|
|
return -1;
|
|
|
|
|
2011-07-01 07:23:02 -06:00
|
|
|
if (!allowMissing && *tmp != '.')
|
|
|
|
return -1;
|
|
|
|
|
2011-07-01 06:40:21 -04:00
|
|
|
if ((*tmp == '.') && virStrToLong_ui(tmp + 1, &tmp, 10, &minor) < 0)
|
2010-03-30 16:15:13 +02:00
|
|
|
return -1;
|
|
|
|
|
2011-07-01 07:23:02 -06:00
|
|
|
if (!allowMissing && *tmp != '.')
|
|
|
|
return -1;
|
|
|
|
|
2011-07-01 06:40:21 -04:00
|
|
|
if ((*tmp == '.') && virStrToLong_ui(tmp + 1, &tmp, 10, µ) < 0)
|
2010-03-30 16:15:13 +02:00
|
|
|
return -1;
|
|
|
|
|
2011-07-01 07:23:02 -06:00
|
|
|
if (major > UINT_MAX / 1000000 || minor > 999 || micro > 999)
|
|
|
|
return -1;
|
|
|
|
|
2010-03-30 16:15:13 +02:00
|
|
|
*version = 1000000 * major + 1000 * minor + micro;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2012-09-25 18:31:01 +01:00
|
|
|
/**
|
|
|
|
* Format @val as a base-10 decimal number, in the
|
|
|
|
* buffer @buf of size @buflen. To allocate a suitable
|
|
|
|
* sized buffer, the INT_BUFLEN(int) macro should be
|
|
|
|
* used
|
|
|
|
*
|
|
|
|
* Returns pointer to start of the number in @buf
|
|
|
|
*/
|
|
|
|
char *
|
|
|
|
virFormatIntDecimal(char *buf, size_t buflen, int val)
|
|
|
|
{
|
|
|
|
char *p = buf + buflen - 1;
|
|
|
|
*p = '\0';
|
|
|
|
if (val >= 0) {
|
|
|
|
do {
|
|
|
|
*--p = '0' + (val % 10);
|
|
|
|
val /= 10;
|
|
|
|
} while (val != 0);
|
|
|
|
} else {
|
|
|
|
do {
|
|
|
|
*--p = '0' - (val % 10);
|
|
|
|
val /= 10;
|
|
|
|
} while (val != 0);
|
|
|
|
*--p = '-';
|
|
|
|
}
|
|
|
|
return p;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2017-11-09 16:19:25 +01:00
|
|
|
/**
|
|
|
|
* virFormatIntPretty
|
|
|
|
*
|
|
|
|
* @val: Value in bytes to be shortened
|
|
|
|
* @unit: unit to be used
|
|
|
|
*
|
|
|
|
* Similar to vshPrettyCapacity, but operates on integers and not doubles
|
|
|
|
*
|
2018-09-27 18:49:41 -04:00
|
|
|
* NB: Since using unsigned long long, we are limited to at most a "PiB"
|
|
|
|
* to make pretty. This is because a PiB is 1152921504606846976 bytes,
|
|
|
|
* but that value * 1024 > ULLONG_MAX value 18446744073709551615 bytes.
|
|
|
|
*
|
2017-11-09 16:19:25 +01:00
|
|
|
* Returns shortened value that can be used with @unit.
|
|
|
|
*/
|
|
|
|
unsigned long long
|
|
|
|
virFormatIntPretty(unsigned long long val,
|
|
|
|
const char **unit)
|
|
|
|
{
|
|
|
|
unsigned long long limit = 1024;
|
|
|
|
|
|
|
|
if (val % limit || val == 0) {
|
|
|
|
*unit = "B";
|
|
|
|
return val;
|
|
|
|
}
|
|
|
|
limit *= 1024;
|
|
|
|
if (val % limit) {
|
|
|
|
*unit = "KiB";
|
|
|
|
return val / (limit / 1024);
|
|
|
|
}
|
|
|
|
limit *= 1024;
|
|
|
|
if (val % limit) {
|
|
|
|
*unit = "MiB";
|
|
|
|
return val / (limit / 1024);
|
|
|
|
}
|
|
|
|
limit *= 1024;
|
|
|
|
if (val % limit) {
|
|
|
|
*unit = "GiB";
|
|
|
|
return val / (limit / 1024);
|
|
|
|
}
|
|
|
|
limit *= 1024;
|
|
|
|
if (val % limit) {
|
|
|
|
*unit = "TiB";
|
|
|
|
return val / (limit / 1024);
|
|
|
|
}
|
|
|
|
limit *= 1024;
|
2018-09-27 18:49:41 -04:00
|
|
|
*unit = "PiB";
|
2017-11-09 16:19:25 +01:00
|
|
|
return val / (limit / 1024);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2010-03-19 18:26:09 +01:00
|
|
|
/* Translates a device name of the form (regex) /^[fhv]d[a-z]+[0-9]*$/
|
2015-11-13 13:14:44 +00:00
|
|
|
* into the corresponding index and partition number
|
|
|
|
* (e.g. sda0 => (0,0), hdz2 => (25,2), vdaa12 => (26,12))
|
2008-05-09 16:41:19 +00:00
|
|
|
* @param name The name of the device
|
2015-11-13 13:14:44 +00:00
|
|
|
* @param disk The disk index to be returned
|
|
|
|
* @param partition The partition index to be returned
|
|
|
|
* @return 0 on success, or -1 on failure
|
2008-05-09 16:41:19 +00:00
|
|
|
*/
|
2015-11-13 13:14:44 +00:00
|
|
|
int virDiskNameParse(const char *name, int *disk, int *partition)
|
2014-03-18 09:14:35 +01:00
|
|
|
{
|
2008-05-09 16:41:19 +00:00
|
|
|
const char *ptr = NULL;
|
2015-11-13 13:14:44 +00:00
|
|
|
char *rem;
|
2008-05-09 16:41:19 +00:00
|
|
|
int idx = 0;
|
2010-08-10 13:46:46 +02:00
|
|
|
static char const* const drive_prefix[] = {"fd", "hd", "vd", "sd", "xvd", "ubd"};
|
Convert 'int i' to 'size_t i' in src/util/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 15:09:33 +01:00
|
|
|
size_t i;
|
2008-05-09 16:41:19 +00:00
|
|
|
|
2019-10-15 13:55:26 +02:00
|
|
|
for (i = 0; i < G_N_ELEMENTS(drive_prefix); i++) {
|
2008-05-15 16:05:41 +00:00
|
|
|
if (STRPREFIX(name, drive_prefix[i])) {
|
|
|
|
ptr = name + strlen(drive_prefix[i]);
|
2008-05-09 16:41:19 +00:00
|
|
|
break;
|
2008-05-15 16:05:41 +00:00
|
|
|
}
|
2008-05-09 16:41:19 +00:00
|
|
|
}
|
|
|
|
|
2019-11-18 15:16:54 +01:00
|
|
|
if (!ptr || !g_ascii_islower(*ptr))
|
2008-05-09 16:41:19 +00:00
|
|
|
return -1;
|
|
|
|
|
2008-10-10 08:37:35 +00:00
|
|
|
for (i = 0; *ptr; i++) {
|
2019-11-18 15:16:54 +01:00
|
|
|
if (!g_ascii_islower(*ptr))
|
2010-03-19 18:26:09 +01:00
|
|
|
break;
|
2008-05-09 16:41:19 +00:00
|
|
|
|
2012-11-22 14:56:08 +00:00
|
|
|
idx = (idx + (i < 1 ? 0 : 1)) * 26;
|
2008-05-09 16:41:19 +00:00
|
|
|
idx += *ptr - 'a';
|
|
|
|
ptr++;
|
|
|
|
}
|
|
|
|
|
2010-03-19 18:26:09 +01:00
|
|
|
/* Count the trailing digits. */
|
|
|
|
size_t n_digits = strspn(ptr, "0123456789");
|
|
|
|
if (ptr[n_digits] != '\0')
|
|
|
|
return -1;
|
|
|
|
|
2015-11-13 13:14:44 +00:00
|
|
|
*disk = idx;
|
|
|
|
|
|
|
|
/* Convert trailing digits into our partition index */
|
|
|
|
if (partition) {
|
|
|
|
*partition = 0;
|
|
|
|
|
|
|
|
/* Shouldn't start by zero */
|
|
|
|
if (n_digits > 1 && *ptr == '0')
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (n_digits && virStrToLong_i(ptr, &rem, 10, partition) < 0)
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Translates a device name of the form (regex) /^[fhv]d[a-z]+[0-9]*$/
|
|
|
|
* into the corresponding index (e.g. sda => 0, hdz => 25, vdaa => 26)
|
|
|
|
* Note that any trailing string of digits is simply ignored.
|
|
|
|
* @param name The name of the device
|
|
|
|
* @return name's index, or -1 on failure
|
|
|
|
*/
|
|
|
|
int virDiskNameToIndex(const char *name)
|
|
|
|
{
|
|
|
|
int idx;
|
|
|
|
|
2017-11-01 10:30:04 +01:00
|
|
|
if (virDiskNameParse(name, &idx, NULL) < 0)
|
2015-11-13 13:14:44 +00:00
|
|
|
idx = -1;
|
|
|
|
|
2008-05-09 16:41:19 +00:00
|
|
|
return idx;
|
|
|
|
}
|
2009-01-06 17:46:46 +00:00
|
|
|
|
2009-12-03 17:17:40 +01:00
|
|
|
char *virIndexToDiskName(int idx, const char *prefix)
|
|
|
|
{
|
|
|
|
char *name = NULL;
|
Convert 'int i' to 'size_t i' in src/util/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 15:09:33 +01:00
|
|
|
size_t i;
|
|
|
|
int ctr;
|
|
|
|
int offset;
|
2009-12-03 17:17:40 +01:00
|
|
|
|
|
|
|
if (idx < 0) {
|
2012-07-18 11:26:24 +01:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("Disk index %d is negative"), idx);
|
2009-12-03 17:17:40 +01:00
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
Convert 'int i' to 'size_t i' in src/util/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 15:09:33 +01:00
|
|
|
for (i = 0, ctr = idx; ctr >= 0; ++i, ctr = ctr / 26 - 1) { }
|
2009-12-03 17:17:40 +01:00
|
|
|
|
|
|
|
offset = strlen(prefix);
|
|
|
|
|
2013-07-04 12:17:18 +02:00
|
|
|
if (VIR_ALLOC_N(name, offset + i + 1))
|
2009-12-03 17:17:40 +01:00
|
|
|
return NULL;
|
|
|
|
|
|
|
|
strcpy(name, prefix);
|
|
|
|
name[offset + i] = '\0';
|
|
|
|
|
2014-11-13 15:28:18 +01:00
|
|
|
for (i = i - 1, ctr = idx; ctr >= 0; --i, ctr = ctr / 26 - 1)
|
Convert 'int i' to 'size_t i' in src/util/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 15:09:33 +01:00
|
|
|
name[offset + i] = 'a' + (ctr % 26);
|
2009-12-03 17:17:40 +01:00
|
|
|
|
|
|
|
return name;
|
|
|
|
}
|
|
|
|
|
2009-01-07 10:43:16 +00:00
|
|
|
#ifndef AI_CANONIDN
|
2010-03-09 19:22:22 +01:00
|
|
|
# define AI_CANONIDN 0
|
2009-01-07 10:43:16 +00:00
|
|
|
#endif
|
|
|
|
|
2017-07-05 11:19:43 +01:00
|
|
|
#ifndef HOST_NAME_MAX
|
|
|
|
# define HOST_NAME_MAX 256
|
|
|
|
#endif
|
|
|
|
|
2010-05-20 13:16:30 -04:00
|
|
|
/* Who knew getting a hostname could be so delicate. In Linux (and Unices
|
|
|
|
* in general), many things depend on "hostname" returning a value that will
|
|
|
|
* resolve one way or another. In the modern world where networks frequently
|
|
|
|
* come and go this is often being hard-coded to resolve to "localhost". If
|
|
|
|
* it *doesn't* resolve to localhost, then we would prefer to have the FQDN.
|
|
|
|
* That leads us to 3 possibilities:
|
|
|
|
*
|
|
|
|
* 1) gethostname() returns an FQDN (not localhost) - we return the string
|
|
|
|
* as-is, it's all of the information we want
|
|
|
|
* 2) gethostname() returns "localhost" - we return localhost; doing further
|
|
|
|
* work to try to resolve it is pointless
|
|
|
|
* 3) gethostname() returns a shortened hostname - in this case, we want to
|
|
|
|
* try to resolve this to a fully-qualified name. Therefore we pass it
|
|
|
|
* to getaddrinfo(). There are two possible responses:
|
|
|
|
* a) getaddrinfo() resolves to a FQDN - return the FQDN
|
2011-10-14 16:25:50 +02:00
|
|
|
* b) getaddrinfo() fails or resolves to localhost - in this case, the
|
2011-10-13 16:19:37 +02:00
|
|
|
* data we got from gethostname() is actually more useful than what
|
|
|
|
* we got from getaddrinfo(). Return the value from gethostname()
|
|
|
|
* and hope for the best.
|
2010-05-20 13:16:30 -04:00
|
|
|
*/
|
2015-12-04 17:35:54 +00:00
|
|
|
static char *
|
|
|
|
virGetHostnameImpl(bool quiet)
|
2009-01-07 10:43:16 +00:00
|
|
|
{
|
|
|
|
int r;
|
2015-12-04 17:35:54 +00:00
|
|
|
char hostname[HOST_NAME_MAX+1], *result = NULL;
|
2010-05-20 13:16:30 -04:00
|
|
|
struct addrinfo hints, *info;
|
2009-01-07 10:43:16 +00:00
|
|
|
|
2012-10-17 10:23:12 +01:00
|
|
|
r = gethostname(hostname, sizeof(hostname));
|
2009-10-23 13:01:22 -04:00
|
|
|
if (r == -1) {
|
2015-12-04 17:35:54 +00:00
|
|
|
if (!quiet)
|
|
|
|
virReportSystemError(errno,
|
|
|
|
"%s", _("failed to determine host name"));
|
2009-01-07 10:43:16 +00:00
|
|
|
return NULL;
|
2009-10-23 13:01:22 -04:00
|
|
|
}
|
2009-01-07 10:43:16 +00:00
|
|
|
NUL_TERMINATE(hostname);
|
|
|
|
|
2010-05-20 13:16:30 -04:00
|
|
|
if (STRPREFIX(hostname, "localhost") || strchr(hostname, '.')) {
|
|
|
|
/* in this case, gethostname returned localhost (meaning we can't
|
|
|
|
* do any further canonicalization), or it returned an FQDN (and
|
|
|
|
* we don't need to do any further canonicalization). Return the
|
|
|
|
* string as-is; it's up to callers to check whether "localhost"
|
|
|
|
* is allowed.
|
|
|
|
*/
|
2019-10-18 13:27:03 +02:00
|
|
|
result = g_strdup(hostname);
|
2013-05-24 09:19:51 +02:00
|
|
|
goto cleanup;
|
2010-05-20 13:16:30 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
/* otherwise, it's a shortened, non-localhost, hostname. Attempt to
|
|
|
|
* canonicalize the hostname by running it through getaddrinfo
|
|
|
|
*/
|
|
|
|
|
2009-01-07 10:43:16 +00:00
|
|
|
memset(&hints, 0, sizeof(hints));
|
|
|
|
hints.ai_flags = AI_CANONNAME|AI_CANONIDN;
|
|
|
|
hints.ai_family = AF_UNSPEC;
|
|
|
|
r = getaddrinfo(hostname, NULL, &hints, &info);
|
2009-10-23 13:01:22 -04:00
|
|
|
if (r != 0) {
|
2015-12-04 17:35:54 +00:00
|
|
|
if (!quiet)
|
|
|
|
VIR_WARN("getaddrinfo failed for '%s': %s",
|
|
|
|
hostname, gai_strerror(r));
|
2019-10-18 13:27:03 +02:00
|
|
|
result = g_strdup(hostname);
|
2013-05-24 09:19:51 +02:00
|
|
|
goto cleanup;
|
2009-10-23 13:01:22 -04:00
|
|
|
}
|
2010-02-19 16:15:21 +01:00
|
|
|
|
2010-04-07 17:23:24 +02:00
|
|
|
/* Tell static analyzers about getaddrinfo semantics. */
|
2012-10-17 10:23:12 +01:00
|
|
|
sa_assert(info);
|
2010-04-07 17:23:24 +02:00
|
|
|
|
2010-05-20 13:16:30 -04:00
|
|
|
if (info->ai_canonname == NULL ||
|
|
|
|
STRPREFIX(info->ai_canonname, "localhost"))
|
|
|
|
/* in this case, we tried to canonicalize and we ended up back with
|
|
|
|
* localhost. Ignore the canonicalized name and just return the
|
|
|
|
* original hostname
|
|
|
|
*/
|
2019-10-18 13:27:03 +02:00
|
|
|
result = g_strdup(hostname);
|
2010-05-20 13:16:30 -04:00
|
|
|
else
|
|
|
|
/* Caller frees this string. */
|
2019-10-18 13:27:03 +02:00
|
|
|
result = g_strdup(info->ai_canonname);
|
2010-02-19 16:15:21 +01:00
|
|
|
|
2010-05-20 13:16:30 -04:00
|
|
|
freeaddrinfo(info);
|
2009-01-07 10:43:16 +00:00
|
|
|
|
2014-03-25 07:53:22 +01:00
|
|
|
cleanup:
|
2015-12-04 17:35:54 +00:00
|
|
|
if (!result)
|
|
|
|
virReportOOMError();
|
2009-01-07 10:43:16 +00:00
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2013-07-30 15:55:44 -04:00
|
|
|
|
2015-12-04 17:35:54 +00:00
|
|
|
char *
|
|
|
|
virGetHostname(void)
|
|
|
|
{
|
|
|
|
return virGetHostnameImpl(false);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
char *
|
|
|
|
virGetHostnameQuiet(void)
|
|
|
|
{
|
|
|
|
return virGetHostnameImpl(true);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2013-07-30 15:55:44 -04:00
|
|
|
char *
|
|
|
|
virGetUserDirectory(void)
|
|
|
|
{
|
2019-12-17 16:24:38 +01:00
|
|
|
return g_strdup(g_get_home_dir());
|
2013-07-30 15:55:44 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2019-12-17 16:31:11 +01:00
|
|
|
char *virGetUserConfigDirectory(void)
|
|
|
|
{
|
|
|
|
#ifdef WIN32
|
|
|
|
return g_strdup(g_get_user_config_dir());
|
|
|
|
#else
|
|
|
|
return g_build_filename(g_get_user_config_dir(), "libvirt", NULL);
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2019-12-17 16:34:28 +01:00
|
|
|
char *virGetUserCacheDirectory(void)
|
|
|
|
{
|
|
|
|
#ifdef WIN32
|
|
|
|
return g_strdup(g_get_user_cache_dir());
|
|
|
|
#else
|
|
|
|
return g_build_filename(g_get_user_cache_dir(), "libvirt", NULL);
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2019-12-17 16:42:09 +01:00
|
|
|
char *virGetUserRuntimeDirectory(void)
|
|
|
|
{
|
|
|
|
#ifdef WIN32
|
|
|
|
return g_strdup(g_get_user_runtime_dir());
|
|
|
|
#else
|
|
|
|
return g_build_filename(g_get_user_runtime_dir(), "libvirt", NULL);
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2009-01-22 19:41:48 +00:00
|
|
|
#ifdef HAVE_GETPWUID_R
|
2013-07-09 17:57:48 -06:00
|
|
|
/* Look up fields from the user database for the given user. On
|
2016-06-17 13:54:52 +02:00
|
|
|
* error, set errno, report the error if not instructed otherwise via @quiet,
|
|
|
|
* and return -1. */
|
2013-07-09 17:57:48 -06:00
|
|
|
static int
|
2016-06-17 13:54:52 +02:00
|
|
|
virGetUserEnt(uid_t uid, char **name, gid_t *group, char **dir, char **shell, bool quiet)
|
2009-01-22 19:41:48 +00:00
|
|
|
{
|
|
|
|
char *strbuf;
|
|
|
|
struct passwd pwbuf;
|
2009-01-30 15:43:05 +00:00
|
|
|
struct passwd *pw = NULL;
|
2010-01-28 13:37:05 +01:00
|
|
|
long val = sysconf(_SC_GETPW_R_SIZE_MAX);
|
|
|
|
size_t strbuflen = val;
|
2011-05-16 15:37:15 -06:00
|
|
|
int rc;
|
2013-07-09 17:57:48 -06:00
|
|
|
int ret = -1;
|
|
|
|
|
|
|
|
if (name)
|
|
|
|
*name = NULL;
|
|
|
|
if (dir)
|
|
|
|
*dir = NULL;
|
2016-04-12 18:11:20 +01:00
|
|
|
if (shell)
|
|
|
|
*shell = NULL;
|
2010-01-28 13:37:05 +01:00
|
|
|
|
2011-05-16 15:37:15 -06:00
|
|
|
/* sysconf is a hint; if it fails, fall back to a reasonable size */
|
|
|
|
if (val < 0)
|
|
|
|
strbuflen = 1024;
|
2009-01-22 19:41:48 +00:00
|
|
|
|
2013-07-04 12:17:18 +02:00
|
|
|
if (VIR_ALLOC_N(strbuf, strbuflen) < 0)
|
2013-07-09 17:57:48 -06:00
|
|
|
return -1;
|
2009-01-22 19:41:48 +00:00
|
|
|
|
2009-01-30 15:43:05 +00:00
|
|
|
/*
|
|
|
|
* From the manpage (terrifying but true):
|
|
|
|
*
|
|
|
|
* ERRORS
|
|
|
|
* 0 or ENOENT or ESRCH or EBADF or EPERM or ...
|
|
|
|
* The given name or uid was not found.
|
|
|
|
*/
|
2011-05-16 15:37:15 -06:00
|
|
|
while ((rc = getpwuid_r(uid, &pwbuf, strbuf, strbuflen, &pw)) == ERANGE) {
|
2013-07-04 12:17:18 +02:00
|
|
|
if (VIR_RESIZE_N(strbuf, strbuflen, strbuflen, strbuflen) < 0)
|
2013-07-09 17:57:48 -06:00
|
|
|
goto cleanup;
|
2011-05-16 15:37:15 -06:00
|
|
|
}
|
2016-06-17 13:54:52 +02:00
|
|
|
|
2013-09-04 11:15:34 -05:00
|
|
|
if (rc != 0) {
|
2016-06-17 13:54:52 +02:00
|
|
|
if (quiet)
|
|
|
|
goto cleanup;
|
|
|
|
|
2011-05-16 15:37:15 -06:00
|
|
|
virReportSystemError(rc,
|
2010-04-28 21:36:03 -06:00
|
|
|
_("Failed to find user record for uid '%u'"),
|
|
|
|
(unsigned int) uid);
|
2013-07-09 17:57:48 -06:00
|
|
|
goto cleanup;
|
2013-09-04 11:15:34 -05:00
|
|
|
} else if (pw == NULL) {
|
2016-06-17 13:54:52 +02:00
|
|
|
if (quiet)
|
|
|
|
goto cleanup;
|
|
|
|
|
2013-09-04 11:15:34 -05:00
|
|
|
virReportError(VIR_ERR_SYSTEM_ERROR,
|
|
|
|
_("Failed to find user record for uid '%u'"),
|
|
|
|
(unsigned int) uid);
|
|
|
|
goto cleanup;
|
2013-07-09 17:57:48 -06:00
|
|
|
}
|
|
|
|
|
2019-10-20 13:49:46 +02:00
|
|
|
if (name)
|
|
|
|
*name = g_strdup(pw->pw_name);
|
2013-07-09 17:57:48 -06:00
|
|
|
if (group)
|
|
|
|
*group = pw->pw_gid;
|
2019-10-20 13:49:46 +02:00
|
|
|
if (dir)
|
|
|
|
*dir = g_strdup(pw->pw_dir);
|
|
|
|
if (shell)
|
|
|
|
*shell = g_strdup(pw->pw_shell);
|
2009-01-22 19:41:48 +00:00
|
|
|
|
2013-07-09 17:57:48 -06:00
|
|
|
ret = 0;
|
2014-03-25 07:53:22 +01:00
|
|
|
cleanup:
|
2016-04-12 18:11:20 +01:00
|
|
|
if (ret < 0) {
|
|
|
|
if (name)
|
|
|
|
VIR_FREE(*name);
|
|
|
|
if (dir)
|
|
|
|
VIR_FREE(*dir);
|
|
|
|
if (shell)
|
|
|
|
VIR_FREE(*shell);
|
|
|
|
}
|
2009-01-22 19:41:48 +00:00
|
|
|
VIR_FREE(strbuf);
|
|
|
|
return ret;
|
|
|
|
}
|
2009-07-15 22:25:01 +01:00
|
|
|
|
2011-12-16 00:55:19 +00:00
|
|
|
static char *virGetGroupEnt(gid_t gid)
|
|
|
|
{
|
|
|
|
char *strbuf;
|
|
|
|
char *ret;
|
|
|
|
struct group grbuf;
|
|
|
|
struct group *gr = NULL;
|
|
|
|
long val = sysconf(_SC_GETGR_R_SIZE_MAX);
|
|
|
|
size_t strbuflen = val;
|
|
|
|
int rc;
|
|
|
|
|
|
|
|
/* sysconf is a hint; if it fails, fall back to a reasonable size */
|
|
|
|
if (val < 0)
|
|
|
|
strbuflen = 1024;
|
|
|
|
|
2013-07-04 12:17:18 +02:00
|
|
|
if (VIR_ALLOC_N(strbuf, strbuflen) < 0)
|
2011-12-16 00:55:19 +00:00
|
|
|
return NULL;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* From the manpage (terrifying but true):
|
|
|
|
*
|
|
|
|
* ERRORS
|
|
|
|
* 0 or ENOENT or ESRCH or EBADF or EPERM or ...
|
|
|
|
* The given name or gid was not found.
|
|
|
|
*/
|
|
|
|
while ((rc = getgrgid_r(gid, &grbuf, strbuf, strbuflen, &gr)) == ERANGE) {
|
|
|
|
if (VIR_RESIZE_N(strbuf, strbuflen, strbuflen, strbuflen) < 0) {
|
|
|
|
VIR_FREE(strbuf);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (rc != 0 || gr == NULL) {
|
2013-09-04 11:15:34 -05:00
|
|
|
if (rc != 0) {
|
|
|
|
virReportSystemError(rc,
|
|
|
|
_("Failed to find group record for gid '%u'"),
|
|
|
|
(unsigned int) gid);
|
|
|
|
} else {
|
|
|
|
virReportError(VIR_ERR_SYSTEM_ERROR,
|
|
|
|
_("Failed to find group record for gid '%u'"),
|
|
|
|
(unsigned int) gid);
|
|
|
|
}
|
|
|
|
|
2011-12-16 00:55:19 +00:00
|
|
|
VIR_FREE(strbuf);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2019-10-18 13:27:03 +02:00
|
|
|
ret = g_strdup(gr->gr_name);
|
2011-12-16 00:55:19 +00:00
|
|
|
VIR_FREE(strbuf);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2013-07-30 15:55:44 -04:00
|
|
|
|
|
|
|
char *
|
|
|
|
virGetUserDirectoryByUID(uid_t uid)
|
2009-07-10 11:40:04 +01:00
|
|
|
{
|
2013-07-09 17:57:48 -06:00
|
|
|
char *ret;
|
2016-06-17 13:54:52 +02:00
|
|
|
virGetUserEnt(uid, NULL, NULL, &ret, NULL, false);
|
2016-04-12 18:11:20 +01:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
char *virGetUserShell(uid_t uid)
|
|
|
|
{
|
|
|
|
char *ret;
|
2016-06-17 13:54:52 +02:00
|
|
|
virGetUserEnt(uid, NULL, NULL, NULL, &ret, false);
|
2013-07-09 17:57:48 -06:00
|
|
|
return ret;
|
2009-07-10 11:40:04 +01:00
|
|
|
}
|
|
|
|
|
2013-07-30 15:55:44 -04:00
|
|
|
|
2010-02-04 23:41:52 +01:00
|
|
|
char *virGetUserName(uid_t uid)
|
2009-07-10 11:40:04 +01:00
|
|
|
{
|
2013-07-09 17:57:48 -06:00
|
|
|
char *ret;
|
2016-06-17 13:54:52 +02:00
|
|
|
virGetUserEnt(uid, &ret, NULL, NULL, NULL, false);
|
2013-07-09 17:57:48 -06:00
|
|
|
return ret;
|
2009-07-10 11:40:04 +01:00
|
|
|
}
|
|
|
|
|
2011-12-16 00:55:19 +00:00
|
|
|
char *virGetGroupName(gid_t gid)
|
|
|
|
{
|
|
|
|
return virGetGroupEnt(gid);
|
|
|
|
}
|
|
|
|
|
2012-10-08 17:37:01 -03:00
|
|
|
/* Search in the password database for a user id that matches the user name
|
|
|
|
* `name`. Returns 0 on success, -1 on failure or 1 if name cannot be found.
|
2018-09-12 16:24:30 +02:00
|
|
|
*
|
|
|
|
* Warns if @missing_ok is false
|
2012-10-08 17:37:01 -03:00
|
|
|
*/
|
|
|
|
static int
|
2018-09-12 16:24:30 +02:00
|
|
|
virGetUserIDByName(const char *name, uid_t *uid, bool missing_ok)
|
2009-07-15 22:25:01 +01:00
|
|
|
{
|
2012-10-08 17:37:01 -03:00
|
|
|
char *strbuf = NULL;
|
2009-07-15 22:25:01 +01:00
|
|
|
struct passwd pwbuf;
|
|
|
|
struct passwd *pw = NULL;
|
2010-02-01 21:45:06 +01:00
|
|
|
long val = sysconf(_SC_GETPW_R_SIZE_MAX);
|
|
|
|
size_t strbuflen = val;
|
2011-05-16 15:37:15 -06:00
|
|
|
int rc;
|
2012-10-08 17:37:01 -03:00
|
|
|
int ret = -1;
|
2010-02-01 21:45:06 +01:00
|
|
|
|
2011-05-16 15:37:15 -06:00
|
|
|
/* sysconf is a hint; if it fails, fall back to a reasonable size */
|
|
|
|
if (val < 0)
|
|
|
|
strbuflen = 1024;
|
2009-07-15 22:25:01 +01:00
|
|
|
|
2013-07-04 12:17:18 +02:00
|
|
|
if (VIR_ALLOC_N(strbuf, strbuflen) < 0)
|
2012-10-08 17:37:01 -03:00
|
|
|
goto cleanup;
|
2009-07-15 22:25:01 +01:00
|
|
|
|
2011-05-16 15:37:15 -06:00
|
|
|
while ((rc = getpwnam_r(name, &pwbuf, strbuf, strbuflen, &pw)) == ERANGE) {
|
2013-07-04 12:17:18 +02:00
|
|
|
if (VIR_RESIZE_N(strbuf, strbuflen, strbuflen, strbuflen) < 0)
|
2012-10-08 17:37:01 -03:00
|
|
|
goto cleanup;
|
2011-05-16 15:37:15 -06:00
|
|
|
}
|
2012-10-08 17:37:01 -03:00
|
|
|
|
|
|
|
if (!pw) {
|
2018-09-12 16:24:30 +02:00
|
|
|
if (rc != 0 && !missing_ok) {
|
2012-12-11 21:26:52 +01:00
|
|
|
char buf[1024];
|
|
|
|
/* log the possible error from getpwnam_r. Unfortunately error
|
|
|
|
* reporting from this function is bad and we can't really
|
|
|
|
* rely on it, so we just report that the user wasn't found */
|
2012-12-12 14:19:03 +01:00
|
|
|
VIR_WARN("User record for user '%s' was not found: %s",
|
2012-12-11 21:26:52 +01:00
|
|
|
name, virStrerror(rc, buf, sizeof(buf)));
|
|
|
|
}
|
|
|
|
|
2012-10-08 17:37:01 -03:00
|
|
|
ret = 1;
|
|
|
|
goto cleanup;
|
2009-07-15 22:25:01 +01:00
|
|
|
}
|
|
|
|
|
2018-09-12 16:24:30 +02:00
|
|
|
if (uid)
|
|
|
|
*uid = pw->pw_uid;
|
2012-10-08 17:37:01 -03:00
|
|
|
ret = 0;
|
2009-07-15 22:25:01 +01:00
|
|
|
|
2014-03-25 07:53:22 +01:00
|
|
|
cleanup:
|
2009-07-15 22:25:01 +01:00
|
|
|
VIR_FREE(strbuf);
|
|
|
|
|
2012-10-08 17:37:01 -03:00
|
|
|
return ret;
|
2009-07-15 22:25:01 +01:00
|
|
|
}
|
|
|
|
|
2012-10-08 17:37:01 -03:00
|
|
|
/* Try to match a user id based on `user`. The default behavior is to parse
|
|
|
|
* `user` first as a user name and then as a user id. However if `user`
|
|
|
|
* contains a leading '+', the rest of the string is always parsed as a uid.
|
|
|
|
*
|
|
|
|
* Returns 0 on success and -1 otherwise.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
virGetUserID(const char *user, uid_t *uid)
|
|
|
|
{
|
|
|
|
unsigned int uint_uid;
|
|
|
|
|
|
|
|
if (*user == '+') {
|
|
|
|
user++;
|
|
|
|
} else {
|
2018-09-12 16:24:30 +02:00
|
|
|
int rc = virGetUserIDByName(user, uid, false);
|
2012-10-08 17:37:01 -03:00
|
|
|
if (rc <= 0)
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (virStrToLong_ui(user, NULL, 10, &uint_uid) < 0 ||
|
|
|
|
((uid_t) uint_uid) != uint_uid) {
|
|
|
|
virReportError(VIR_ERR_INVALID_ARG, _("Failed to parse user '%s'"),
|
|
|
|
user);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
*uid = uint_uid;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
2009-07-15 22:25:01 +01:00
|
|
|
|
2012-10-08 17:37:01 -03:00
|
|
|
/* Search in the group database for a group id that matches the group name
|
|
|
|
* `name`. Returns 0 on success, -1 on failure or 1 if name cannot be found.
|
2018-09-12 16:24:30 +02:00
|
|
|
*
|
|
|
|
* Warns if @missing_ok is false
|
2012-10-08 17:37:01 -03:00
|
|
|
*/
|
|
|
|
static int
|
2018-09-12 16:24:30 +02:00
|
|
|
virGetGroupIDByName(const char *name, gid_t *gid, bool missing_ok)
|
2009-07-15 22:25:01 +01:00
|
|
|
{
|
2012-10-08 17:37:01 -03:00
|
|
|
char *strbuf = NULL;
|
2009-07-15 22:25:01 +01:00
|
|
|
struct group grbuf;
|
|
|
|
struct group *gr = NULL;
|
2010-02-01 21:45:06 +01:00
|
|
|
long val = sysconf(_SC_GETGR_R_SIZE_MAX);
|
|
|
|
size_t strbuflen = val;
|
2011-05-16 15:37:15 -06:00
|
|
|
int rc;
|
2012-10-08 17:37:01 -03:00
|
|
|
int ret = -1;
|
2010-02-01 21:45:06 +01:00
|
|
|
|
2011-05-16 15:37:15 -06:00
|
|
|
/* sysconf is a hint; if it fails, fall back to a reasonable size */
|
|
|
|
if (val < 0)
|
|
|
|
strbuflen = 1024;
|
2009-07-15 22:25:01 +01:00
|
|
|
|
2013-07-04 12:17:18 +02:00
|
|
|
if (VIR_ALLOC_N(strbuf, strbuflen) < 0)
|
2012-10-08 17:37:01 -03:00
|
|
|
goto cleanup;
|
2009-07-15 22:25:01 +01:00
|
|
|
|
2011-05-16 15:37:15 -06:00
|
|
|
while ((rc = getgrnam_r(name, &grbuf, strbuf, strbuflen, &gr)) == ERANGE) {
|
2013-07-04 12:17:18 +02:00
|
|
|
if (VIR_RESIZE_N(strbuf, strbuflen, strbuflen, strbuflen) < 0)
|
2012-10-08 17:37:01 -03:00
|
|
|
goto cleanup;
|
2011-05-16 15:37:15 -06:00
|
|
|
}
|
2012-10-08 17:37:01 -03:00
|
|
|
|
|
|
|
if (!gr) {
|
2018-09-12 16:24:30 +02:00
|
|
|
if (rc != 0 && !missing_ok) {
|
2012-12-11 21:26:52 +01:00
|
|
|
char buf[1024];
|
|
|
|
/* log the possible error from getgrnam_r. Unfortunately error
|
|
|
|
* reporting from this function is bad and we can't really
|
|
|
|
* rely on it, so we just report that the user wasn't found */
|
2012-12-12 14:19:03 +01:00
|
|
|
VIR_WARN("Group record for user '%s' was not found: %s",
|
2012-12-11 21:26:52 +01:00
|
|
|
name, virStrerror(rc, buf, sizeof(buf)));
|
|
|
|
}
|
|
|
|
|
2012-10-08 17:37:01 -03:00
|
|
|
ret = 1;
|
|
|
|
goto cleanup;
|
2009-07-15 22:25:01 +01:00
|
|
|
}
|
|
|
|
|
2018-09-12 16:24:30 +02:00
|
|
|
if (gid)
|
|
|
|
*gid = gr->gr_gid;
|
2012-10-08 17:37:01 -03:00
|
|
|
ret = 0;
|
2009-07-15 22:25:01 +01:00
|
|
|
|
2014-03-25 07:53:22 +01:00
|
|
|
cleanup:
|
2009-07-15 22:25:01 +01:00
|
|
|
VIR_FREE(strbuf);
|
|
|
|
|
2012-10-08 17:37:01 -03:00
|
|
|
return ret;
|
2009-07-15 22:25:01 +01:00
|
|
|
}
|
2010-03-17 01:06:31 +01:00
|
|
|
|
2012-10-08 17:37:01 -03:00
|
|
|
/* Try to match a group id based on `group`. The default behavior is to parse
|
|
|
|
* `group` first as a group name and then as a group id. However if `group`
|
|
|
|
* contains a leading '+', the rest of the string is always parsed as a guid.
|
|
|
|
*
|
|
|
|
* Returns 0 on success and -1 otherwise.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
virGetGroupID(const char *group, gid_t *gid)
|
|
|
|
{
|
|
|
|
unsigned int uint_gid;
|
|
|
|
|
|
|
|
if (*group == '+') {
|
|
|
|
group++;
|
|
|
|
} else {
|
2018-09-12 16:24:30 +02:00
|
|
|
int rc = virGetGroupIDByName(group, gid, false);
|
2012-10-08 17:37:01 -03:00
|
|
|
if (rc <= 0)
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (virStrToLong_ui(group, NULL, 10, &uint_gid) < 0 ||
|
|
|
|
((gid_t) uint_gid) != uint_gid) {
|
|
|
|
virReportError(VIR_ERR_INVALID_ARG, _("Failed to parse group '%s'"),
|
|
|
|
group);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
*gid = uint_gid;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
2010-12-23 01:44:02 -05:00
|
|
|
|
2018-09-12 16:24:30 +02:00
|
|
|
/* Silently checks if User @name exists.
|
|
|
|
* Returns if the user exists and fallbacks to false on error.
|
|
|
|
*/
|
2018-11-19 22:31:01 +01:00
|
|
|
bool
|
2018-09-12 16:24:30 +02:00
|
|
|
virDoesUserExist(const char *name)
|
|
|
|
{
|
|
|
|
return virGetUserIDByName(name, NULL, true) == 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Silently checks if Group @name exists.
|
|
|
|
* Returns if the group exists and fallbacks to false on error.
|
|
|
|
*/
|
2018-11-19 22:31:01 +01:00
|
|
|
bool
|
2018-09-12 16:24:30 +02:00
|
|
|
virDoesGroupExist(const char *name)
|
|
|
|
{
|
|
|
|
return virGetGroupIDByName(name, NULL, true) == 0;
|
|
|
|
}
|
|
|
|
|
2013-05-21 17:47:48 -06:00
|
|
|
|
2013-08-05 11:07:27 +02:00
|
|
|
/* Compute the list of primary and supplementary groups associated
|
|
|
|
* with @uid, and including @gid in the list (unless it is -1),
|
2016-06-17 15:32:58 +02:00
|
|
|
* storing a malloc'd result into @list. If uid is -1 or doesn't exist in the
|
|
|
|
* system database querying of the supplementary groups is skipped.
|
|
|
|
*
|
|
|
|
* Returns the size of the list on success, or -1 on failure with error
|
|
|
|
* reported and errno set. May not be called between fork and exec.
|
|
|
|
* */
|
2013-05-21 17:47:48 -06:00
|
|
|
int
|
|
|
|
virGetGroupList(uid_t uid, gid_t gid, gid_t **list)
|
|
|
|
{
|
2016-06-17 15:32:58 +02:00
|
|
|
int ret = 0;
|
2013-05-21 17:47:48 -06:00
|
|
|
char *user = NULL;
|
2013-08-05 11:07:27 +02:00
|
|
|
gid_t primary;
|
2013-05-21 17:47:48 -06:00
|
|
|
|
|
|
|
*list = NULL;
|
|
|
|
|
2016-06-17 15:32:58 +02:00
|
|
|
/* invalid users have no supplementary groups */
|
|
|
|
if (uid != (uid_t)-1 &&
|
|
|
|
virGetUserEnt(uid, &user, &primary, NULL, NULL, true) >= 0) {
|
|
|
|
if ((ret = mgetgroups(user, primary, list)) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("cannot get group list for '%s'"), user);
|
|
|
|
ret = -1;
|
|
|
|
goto cleanup;
|
|
|
|
}
|
2013-08-05 11:07:27 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
if (gid != (gid_t)-1) {
|
2013-08-07 16:44:58 -06:00
|
|
|
size_t i;
|
2013-08-05 11:07:27 +02:00
|
|
|
|
2013-08-07 16:44:58 -06:00
|
|
|
for (i = 0; i < ret; i++) {
|
2013-08-05 11:07:27 +02:00
|
|
|
if ((*list)[i] == gid)
|
|
|
|
goto cleanup;
|
|
|
|
}
|
2013-08-07 16:44:58 -06:00
|
|
|
if (VIR_APPEND_ELEMENT(*list, i, gid) < 0) {
|
2013-08-05 11:07:27 +02:00
|
|
|
ret = -1;
|
|
|
|
VIR_FREE(*list);
|
|
|
|
goto cleanup;
|
|
|
|
} else {
|
2013-08-07 16:44:58 -06:00
|
|
|
ret = i;
|
2013-08-05 11:07:27 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-03-25 07:53:22 +01:00
|
|
|
cleanup:
|
2013-05-21 17:47:48 -06:00
|
|
|
VIR_FREE(user);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
util: make virSetUIDGID async-signal-safe
https://bugzilla.redhat.com/show_bug.cgi?id=964358
POSIX states that multi-threaded apps should not use functions
that are not async-signal-safe between fork and exec, yet we
were using getpwuid_r and initgroups. Although rare, it is
possible to hit deadlock in the child, when it tries to grab
a mutex that was already held by another thread in the parent.
I actually hit this deadlock when testing multiple domains
being started in parallel with a command hook, with the following
backtrace in the child:
Thread 1 (Thread 0x7fd56bbf2700 (LWP 3212)):
#0 __lll_lock_wait ()
at ../nptl/sysdeps/unix/sysv/linux/x86_64/lowlevellock.S:136
#1 0x00007fd5761e7388 in _L_lock_854 () from /lib64/libpthread.so.0
#2 0x00007fd5761e7257 in __pthread_mutex_lock (mutex=0x7fd56be00360)
at pthread_mutex_lock.c:61
#3 0x00007fd56bbf9fc5 in _nss_files_getpwuid_r (uid=0, result=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, errnop=0x7fd56bbf25b8)
at nss_files/files-pwd.c:40
#4 0x00007fd575aeff1d in __getpwuid_r (uid=0, resbuf=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, result=0x7fd56bbf0cb0)
at ../nss/getXXbyYY_r.c:253
#5 0x00007fd578aebafc in virSetUIDGID (uid=0, gid=0) at util/virutil.c:1031
#6 0x00007fd578aebf43 in virSetUIDGIDWithCaps (uid=0, gid=0, capBits=0,
clearExistingCaps=true) at util/virutil.c:1388
#7 0x00007fd578a9a20b in virExec (cmd=0x7fd55c231f10) at util/vircommand.c:654
#8 0x00007fd578a9dfa2 in virCommandRunAsync (cmd=0x7fd55c231f10, pid=0x0)
at util/vircommand.c:2247
#9 0x00007fd578a9d74e in virCommandRun (cmd=0x7fd55c231f10, exitstatus=0x0)
at util/vircommand.c:2100
#10 0x00007fd56326fde5 in qemuProcessStart (conn=0x7fd53c000df0,
driver=0x7fd55c0dc4f0, vm=0x7fd54800b100, migrateFrom=0x0, stdin_fd=-1,
stdin_path=0x0, snapshot=0x0, vmop=VIR_NETDEV_VPORT_PROFILE_OP_CREATE,
flags=1) at qemu/qemu_process.c:3694
...
The solution is to split the work of getpwuid_r/initgroups into the
unsafe portions (getgrouplist, called pre-fork) and safe portions
(setgroups, called post-fork).
* src/util/virutil.h (virSetUIDGID, virSetUIDGIDWithCaps): Adjust
signature.
* src/util/virutil.c (virSetUIDGID): Add parameters.
(virSetUIDGIDWithCaps): Adjust clients.
* src/util/vircommand.c (virExec): Likewise.
* src/util/virfile.c (virFileAccessibleAs, virFileOpenForked)
(virDirCreate): Likewise.
* src/security/security_dac.c (virSecurityDACSetProcessLabel):
Likewise.
* src/lxc/lxc_container.c (lxcContainerSetID): Likewise.
* configure.ac (AC_CHECK_FUNCS_ONCE): Check for setgroups, not
initgroups.
Signed-off-by: Eric Blake <eblake@redhat.com>
2013-05-21 20:59:10 -06:00
|
|
|
/* Set the real and effective uid and gid to the given values, as well
|
|
|
|
* as all the supplementary groups, so that the process has all the
|
|
|
|
* assumed group membership of that uid. Return 0 on success, -1 on
|
|
|
|
* failure (the original system error remains in errno).
|
2010-12-23 01:44:02 -05:00
|
|
|
*/
|
|
|
|
int
|
2019-10-14 14:45:33 +02:00
|
|
|
virSetUIDGID(uid_t uid, gid_t gid, gid_t *groups G_GNUC_UNUSED,
|
|
|
|
int ngroups G_GNUC_UNUSED)
|
2010-12-23 01:44:02 -05:00
|
|
|
{
|
util: make virSetUIDGID async-signal-safe
https://bugzilla.redhat.com/show_bug.cgi?id=964358
POSIX states that multi-threaded apps should not use functions
that are not async-signal-safe between fork and exec, yet we
were using getpwuid_r and initgroups. Although rare, it is
possible to hit deadlock in the child, when it tries to grab
a mutex that was already held by another thread in the parent.
I actually hit this deadlock when testing multiple domains
being started in parallel with a command hook, with the following
backtrace in the child:
Thread 1 (Thread 0x7fd56bbf2700 (LWP 3212)):
#0 __lll_lock_wait ()
at ../nptl/sysdeps/unix/sysv/linux/x86_64/lowlevellock.S:136
#1 0x00007fd5761e7388 in _L_lock_854 () from /lib64/libpthread.so.0
#2 0x00007fd5761e7257 in __pthread_mutex_lock (mutex=0x7fd56be00360)
at pthread_mutex_lock.c:61
#3 0x00007fd56bbf9fc5 in _nss_files_getpwuid_r (uid=0, result=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, errnop=0x7fd56bbf25b8)
at nss_files/files-pwd.c:40
#4 0x00007fd575aeff1d in __getpwuid_r (uid=0, resbuf=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, result=0x7fd56bbf0cb0)
at ../nss/getXXbyYY_r.c:253
#5 0x00007fd578aebafc in virSetUIDGID (uid=0, gid=0) at util/virutil.c:1031
#6 0x00007fd578aebf43 in virSetUIDGIDWithCaps (uid=0, gid=0, capBits=0,
clearExistingCaps=true) at util/virutil.c:1388
#7 0x00007fd578a9a20b in virExec (cmd=0x7fd55c231f10) at util/vircommand.c:654
#8 0x00007fd578a9dfa2 in virCommandRunAsync (cmd=0x7fd55c231f10, pid=0x0)
at util/vircommand.c:2247
#9 0x00007fd578a9d74e in virCommandRun (cmd=0x7fd55c231f10, exitstatus=0x0)
at util/vircommand.c:2100
#10 0x00007fd56326fde5 in qemuProcessStart (conn=0x7fd53c000df0,
driver=0x7fd55c0dc4f0, vm=0x7fd54800b100, migrateFrom=0x0, stdin_fd=-1,
stdin_path=0x0, snapshot=0x0, vmop=VIR_NETDEV_VPORT_PROFILE_OP_CREATE,
flags=1) at qemu/qemu_process.c:3694
...
The solution is to split the work of getpwuid_r/initgroups into the
unsafe portions (getgrouplist, called pre-fork) and safe portions
(setgroups, called post-fork).
* src/util/virutil.h (virSetUIDGID, virSetUIDGIDWithCaps): Adjust
signature.
* src/util/virutil.c (virSetUIDGID): Add parameters.
(virSetUIDGIDWithCaps): Adjust clients.
* src/util/vircommand.c (virExec): Likewise.
* src/util/virfile.c (virFileAccessibleAs, virFileOpenForked)
(virDirCreate): Likewise.
* src/security/security_dac.c (virSecurityDACSetProcessLabel):
Likewise.
* src/lxc/lxc_container.c (lxcContainerSetID): Likewise.
* configure.ac (AC_CHECK_FUNCS_ONCE): Check for setgroups, not
initgroups.
Signed-off-by: Eric Blake <eblake@redhat.com>
2013-05-21 20:59:10 -06:00
|
|
|
if (gid != (gid_t)-1 && setregid(gid, gid) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("cannot change to '%u' group"),
|
|
|
|
(unsigned int) gid);
|
|
|
|
return -1;
|
2010-12-23 01:44:02 -05:00
|
|
|
}
|
|
|
|
|
util: make virSetUIDGID async-signal-safe
https://bugzilla.redhat.com/show_bug.cgi?id=964358
POSIX states that multi-threaded apps should not use functions
that are not async-signal-safe between fork and exec, yet we
were using getpwuid_r and initgroups. Although rare, it is
possible to hit deadlock in the child, when it tries to grab
a mutex that was already held by another thread in the parent.
I actually hit this deadlock when testing multiple domains
being started in parallel with a command hook, with the following
backtrace in the child:
Thread 1 (Thread 0x7fd56bbf2700 (LWP 3212)):
#0 __lll_lock_wait ()
at ../nptl/sysdeps/unix/sysv/linux/x86_64/lowlevellock.S:136
#1 0x00007fd5761e7388 in _L_lock_854 () from /lib64/libpthread.so.0
#2 0x00007fd5761e7257 in __pthread_mutex_lock (mutex=0x7fd56be00360)
at pthread_mutex_lock.c:61
#3 0x00007fd56bbf9fc5 in _nss_files_getpwuid_r (uid=0, result=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, errnop=0x7fd56bbf25b8)
at nss_files/files-pwd.c:40
#4 0x00007fd575aeff1d in __getpwuid_r (uid=0, resbuf=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, result=0x7fd56bbf0cb0)
at ../nss/getXXbyYY_r.c:253
#5 0x00007fd578aebafc in virSetUIDGID (uid=0, gid=0) at util/virutil.c:1031
#6 0x00007fd578aebf43 in virSetUIDGIDWithCaps (uid=0, gid=0, capBits=0,
clearExistingCaps=true) at util/virutil.c:1388
#7 0x00007fd578a9a20b in virExec (cmd=0x7fd55c231f10) at util/vircommand.c:654
#8 0x00007fd578a9dfa2 in virCommandRunAsync (cmd=0x7fd55c231f10, pid=0x0)
at util/vircommand.c:2247
#9 0x00007fd578a9d74e in virCommandRun (cmd=0x7fd55c231f10, exitstatus=0x0)
at util/vircommand.c:2100
#10 0x00007fd56326fde5 in qemuProcessStart (conn=0x7fd53c000df0,
driver=0x7fd55c0dc4f0, vm=0x7fd54800b100, migrateFrom=0x0, stdin_fd=-1,
stdin_path=0x0, snapshot=0x0, vmop=VIR_NETDEV_VPORT_PROFILE_OP_CREATE,
flags=1) at qemu/qemu_process.c:3694
...
The solution is to split the work of getpwuid_r/initgroups into the
unsafe portions (getgrouplist, called pre-fork) and safe portions
(setgroups, called post-fork).
* src/util/virutil.h (virSetUIDGID, virSetUIDGIDWithCaps): Adjust
signature.
* src/util/virutil.c (virSetUIDGID): Add parameters.
(virSetUIDGIDWithCaps): Adjust clients.
* src/util/vircommand.c (virExec): Likewise.
* src/util/virfile.c (virFileAccessibleAs, virFileOpenForked)
(virDirCreate): Likewise.
* src/security/security_dac.c (virSecurityDACSetProcessLabel):
Likewise.
* src/lxc/lxc_container.c (lxcContainerSetID): Likewise.
* configure.ac (AC_CHECK_FUNCS_ONCE): Check for setgroups, not
initgroups.
Signed-off-by: Eric Blake <eblake@redhat.com>
2013-05-21 20:59:10 -06:00
|
|
|
# if HAVE_SETGROUPS
|
2015-06-23 13:48:42 +02:00
|
|
|
if (gid != (gid_t)-1 && setgroups(ngroups, groups) < 0) {
|
util: make virSetUIDGID async-signal-safe
https://bugzilla.redhat.com/show_bug.cgi?id=964358
POSIX states that multi-threaded apps should not use functions
that are not async-signal-safe between fork and exec, yet we
were using getpwuid_r and initgroups. Although rare, it is
possible to hit deadlock in the child, when it tries to grab
a mutex that was already held by another thread in the parent.
I actually hit this deadlock when testing multiple domains
being started in parallel with a command hook, with the following
backtrace in the child:
Thread 1 (Thread 0x7fd56bbf2700 (LWP 3212)):
#0 __lll_lock_wait ()
at ../nptl/sysdeps/unix/sysv/linux/x86_64/lowlevellock.S:136
#1 0x00007fd5761e7388 in _L_lock_854 () from /lib64/libpthread.so.0
#2 0x00007fd5761e7257 in __pthread_mutex_lock (mutex=0x7fd56be00360)
at pthread_mutex_lock.c:61
#3 0x00007fd56bbf9fc5 in _nss_files_getpwuid_r (uid=0, result=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, errnop=0x7fd56bbf25b8)
at nss_files/files-pwd.c:40
#4 0x00007fd575aeff1d in __getpwuid_r (uid=0, resbuf=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, result=0x7fd56bbf0cb0)
at ../nss/getXXbyYY_r.c:253
#5 0x00007fd578aebafc in virSetUIDGID (uid=0, gid=0) at util/virutil.c:1031
#6 0x00007fd578aebf43 in virSetUIDGIDWithCaps (uid=0, gid=0, capBits=0,
clearExistingCaps=true) at util/virutil.c:1388
#7 0x00007fd578a9a20b in virExec (cmd=0x7fd55c231f10) at util/vircommand.c:654
#8 0x00007fd578a9dfa2 in virCommandRunAsync (cmd=0x7fd55c231f10, pid=0x0)
at util/vircommand.c:2247
#9 0x00007fd578a9d74e in virCommandRun (cmd=0x7fd55c231f10, exitstatus=0x0)
at util/vircommand.c:2100
#10 0x00007fd56326fde5 in qemuProcessStart (conn=0x7fd53c000df0,
driver=0x7fd55c0dc4f0, vm=0x7fd54800b100, migrateFrom=0x0, stdin_fd=-1,
stdin_path=0x0, snapshot=0x0, vmop=VIR_NETDEV_VPORT_PROFILE_OP_CREATE,
flags=1) at qemu/qemu_process.c:3694
...
The solution is to split the work of getpwuid_r/initgroups into the
unsafe portions (getgrouplist, called pre-fork) and safe portions
(setgroups, called post-fork).
* src/util/virutil.h (virSetUIDGID, virSetUIDGIDWithCaps): Adjust
signature.
* src/util/virutil.c (virSetUIDGID): Add parameters.
(virSetUIDGIDWithCaps): Adjust clients.
* src/util/vircommand.c (virExec): Likewise.
* src/util/virfile.c (virFileAccessibleAs, virFileOpenForked)
(virDirCreate): Likewise.
* src/security/security_dac.c (virSecurityDACSetProcessLabel):
Likewise.
* src/lxc/lxc_container.c (lxcContainerSetID): Likewise.
* configure.ac (AC_CHECK_FUNCS_ONCE): Check for setgroups, not
initgroups.
Signed-off-by: Eric Blake <eblake@redhat.com>
2013-05-21 20:59:10 -06:00
|
|
|
virReportSystemError(errno, "%s",
|
|
|
|
_("cannot set supplemental groups"));
|
|
|
|
return -1;
|
|
|
|
}
|
2010-12-23 01:44:02 -05:00
|
|
|
# endif
|
util: make virSetUIDGID async-signal-safe
https://bugzilla.redhat.com/show_bug.cgi?id=964358
POSIX states that multi-threaded apps should not use functions
that are not async-signal-safe between fork and exec, yet we
were using getpwuid_r and initgroups. Although rare, it is
possible to hit deadlock in the child, when it tries to grab
a mutex that was already held by another thread in the parent.
I actually hit this deadlock when testing multiple domains
being started in parallel with a command hook, with the following
backtrace in the child:
Thread 1 (Thread 0x7fd56bbf2700 (LWP 3212)):
#0 __lll_lock_wait ()
at ../nptl/sysdeps/unix/sysv/linux/x86_64/lowlevellock.S:136
#1 0x00007fd5761e7388 in _L_lock_854 () from /lib64/libpthread.so.0
#2 0x00007fd5761e7257 in __pthread_mutex_lock (mutex=0x7fd56be00360)
at pthread_mutex_lock.c:61
#3 0x00007fd56bbf9fc5 in _nss_files_getpwuid_r (uid=0, result=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, errnop=0x7fd56bbf25b8)
at nss_files/files-pwd.c:40
#4 0x00007fd575aeff1d in __getpwuid_r (uid=0, resbuf=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, result=0x7fd56bbf0cb0)
at ../nss/getXXbyYY_r.c:253
#5 0x00007fd578aebafc in virSetUIDGID (uid=0, gid=0) at util/virutil.c:1031
#6 0x00007fd578aebf43 in virSetUIDGIDWithCaps (uid=0, gid=0, capBits=0,
clearExistingCaps=true) at util/virutil.c:1388
#7 0x00007fd578a9a20b in virExec (cmd=0x7fd55c231f10) at util/vircommand.c:654
#8 0x00007fd578a9dfa2 in virCommandRunAsync (cmd=0x7fd55c231f10, pid=0x0)
at util/vircommand.c:2247
#9 0x00007fd578a9d74e in virCommandRun (cmd=0x7fd55c231f10, exitstatus=0x0)
at util/vircommand.c:2100
#10 0x00007fd56326fde5 in qemuProcessStart (conn=0x7fd53c000df0,
driver=0x7fd55c0dc4f0, vm=0x7fd54800b100, migrateFrom=0x0, stdin_fd=-1,
stdin_path=0x0, snapshot=0x0, vmop=VIR_NETDEV_VPORT_PROFILE_OP_CREATE,
flags=1) at qemu/qemu_process.c:3694
...
The solution is to split the work of getpwuid_r/initgroups into the
unsafe portions (getgrouplist, called pre-fork) and safe portions
(setgroups, called post-fork).
* src/util/virutil.h (virSetUIDGID, virSetUIDGIDWithCaps): Adjust
signature.
* src/util/virutil.c (virSetUIDGID): Add parameters.
(virSetUIDGIDWithCaps): Adjust clients.
* src/util/vircommand.c (virExec): Likewise.
* src/util/virfile.c (virFileAccessibleAs, virFileOpenForked)
(virDirCreate): Likewise.
* src/security/security_dac.c (virSecurityDACSetProcessLabel):
Likewise.
* src/lxc/lxc_container.c (lxcContainerSetID): Likewise.
* configure.ac (AC_CHECK_FUNCS_ONCE): Check for setgroups, not
initgroups.
Signed-off-by: Eric Blake <eblake@redhat.com>
2013-05-21 20:59:10 -06:00
|
|
|
|
|
|
|
if (uid != (uid_t)-1 && setreuid(uid, uid) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("cannot change to uid to '%u'"),
|
|
|
|
(unsigned int) uid);
|
|
|
|
return -1;
|
2010-12-23 01:44:02 -05:00
|
|
|
}
|
2012-08-28 16:51:05 +02:00
|
|
|
|
2010-12-23 01:44:02 -05:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2012-05-24 14:37:54 +01:00
|
|
|
#else /* ! HAVE_GETPWUID_R */
|
|
|
|
|
2013-07-29 08:04:35 -06:00
|
|
|
int
|
2019-10-14 14:45:33 +02:00
|
|
|
virGetGroupList(uid_t uid G_GNUC_UNUSED, gid_t gid G_GNUC_UNUSED,
|
2013-07-29 08:04:35 -06:00
|
|
|
gid_t **list)
|
|
|
|
{
|
|
|
|
*list = NULL;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2018-11-19 22:31:01 +01:00
|
|
|
bool
|
2019-10-14 14:45:33 +02:00
|
|
|
virDoesUserExist(const char *name G_GNUC_UNUSED)
|
2018-09-14 08:18:54 +02:00
|
|
|
{
|
2018-11-19 22:31:01 +01:00
|
|
|
return false;
|
2018-09-14 08:18:54 +02:00
|
|
|
}
|
|
|
|
|
2018-11-19 22:31:01 +01:00
|
|
|
bool
|
2019-10-14 14:45:33 +02:00
|
|
|
virDoesGroupExist(const char *name G_GNUC_UNUSED)
|
2018-09-14 08:18:54 +02:00
|
|
|
{
|
2018-11-19 22:31:01 +01:00
|
|
|
return false;
|
2018-09-14 08:18:54 +02:00
|
|
|
}
|
|
|
|
|
2012-05-24 14:37:54 +01:00
|
|
|
# ifdef WIN32
|
|
|
|
char *
|
2019-10-14 14:45:33 +02:00
|
|
|
virGetUserDirectoryByUID(uid_t uid G_GNUC_UNUSED)
|
2012-05-24 14:37:54 +01:00
|
|
|
{
|
2013-07-30 15:55:44 -04:00
|
|
|
/* Since Windows lacks setuid binaries, and since we already fake
|
|
|
|
* geteuid(), we can safely assume that this is only called when
|
|
|
|
* querying about the current user */
|
2012-05-24 14:37:54 +01:00
|
|
|
|
2019-12-17 22:44:12 +01:00
|
|
|
return g_strdup(g_get_home_dir());
|
2012-05-24 14:37:54 +01:00
|
|
|
}
|
|
|
|
|
2016-04-12 18:11:20 +01:00
|
|
|
char *
|
2019-10-14 14:45:33 +02:00
|
|
|
virGetUserShell(uid_t uid G_GNUC_UNUSED)
|
2016-04-12 18:11:20 +01:00
|
|
|
{
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("virGetUserShell is not available"));
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2012-05-24 14:37:54 +01:00
|
|
|
# else /* !HAVE_GETPWUID_R && !WIN32 */
|
2010-03-17 01:06:31 +01:00
|
|
|
char *
|
2019-10-14 14:45:33 +02:00
|
|
|
virGetUserDirectoryByUID(uid_t uid G_GNUC_UNUSED)
|
2010-03-17 01:06:31 +01:00
|
|
|
{
|
2012-07-18 11:26:24 +01:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("virGetUserDirectory is not available"));
|
2010-03-17 01:06:31 +01:00
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2016-04-12 18:11:20 +01:00
|
|
|
char *
|
2019-10-14 14:45:33 +02:00
|
|
|
virGetUserShell(uid_t uid G_GNUC_UNUSED)
|
2016-04-12 18:11:20 +01:00
|
|
|
{
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("virGetUserShell is not available"));
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
2012-05-24 14:37:54 +01:00
|
|
|
# endif /* ! HAVE_GETPWUID_R && ! WIN32 */
|
|
|
|
|
2010-03-17 01:06:31 +01:00
|
|
|
char *
|
2019-10-14 14:45:33 +02:00
|
|
|
virGetUserName(uid_t uid G_GNUC_UNUSED)
|
2010-03-17 01:06:31 +01:00
|
|
|
{
|
2012-07-18 11:26:24 +01:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("virGetUserName is not available"));
|
2010-03-17 01:06:31 +01:00
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2019-10-14 14:45:33 +02:00
|
|
|
int virGetUserID(const char *name G_GNUC_UNUSED,
|
|
|
|
uid_t *uid G_GNUC_UNUSED)
|
2010-03-17 01:06:31 +01:00
|
|
|
{
|
2012-07-18 11:26:24 +01:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("virGetUserID is not available"));
|
2010-03-17 01:06:31 +01:00
|
|
|
|
2015-06-08 09:32:24 +02:00
|
|
|
return -1;
|
2010-03-17 01:06:31 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2019-10-14 14:45:33 +02:00
|
|
|
int virGetGroupID(const char *name G_GNUC_UNUSED,
|
|
|
|
gid_t *gid G_GNUC_UNUSED)
|
2010-03-17 01:06:31 +01:00
|
|
|
{
|
2012-07-18 11:26:24 +01:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("virGetGroupID is not available"));
|
2010-03-17 01:06:31 +01:00
|
|
|
|
2015-06-08 09:32:24 +02:00
|
|
|
return -1;
|
2010-03-17 01:06:31 +01:00
|
|
|
}
|
2010-12-23 01:44:02 -05:00
|
|
|
|
|
|
|
int
|
2019-10-14 14:45:33 +02:00
|
|
|
virSetUIDGID(uid_t uid G_GNUC_UNUSED,
|
|
|
|
gid_t gid G_GNUC_UNUSED,
|
|
|
|
gid_t *groups G_GNUC_UNUSED,
|
|
|
|
int ngroups G_GNUC_UNUSED)
|
2010-12-23 01:44:02 -05:00
|
|
|
{
|
2012-07-18 11:26:24 +01:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("virSetUIDGID is not available"));
|
2010-12-23 01:44:02 -05:00
|
|
|
return -1;
|
|
|
|
}
|
2012-01-25 19:54:43 +01:00
|
|
|
|
|
|
|
char *
|
2019-10-14 14:45:33 +02:00
|
|
|
virGetGroupName(gid_t gid G_GNUC_UNUSED)
|
2012-01-25 19:54:43 +01:00
|
|
|
{
|
2012-07-18 11:26:24 +01:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
"%s", _("virGetGroupName is not available"));
|
2012-01-25 19:54:43 +01:00
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
2010-03-17 01:06:31 +01:00
|
|
|
#endif /* HAVE_GETPWUID_R */
|
Support configuration of huge pages in guests
Add option to domain XML for
<memoryBacking>
<hugepages/>
</memoryBacking>
* configure.in: Add check for mntent.h
* qemud/libvirtd_qemu.aug, qemud/test_libvirtd_qemu.aug, src/qemu.conf
Add 'hugetlbfs_mount' config parameter
* src/qemu_conf.c, src/qemu_conf.h: Check for -mem-path flag in QEMU,
and pass it when hugepages are requested.
Load hugetlbfs_mount config parameter, search for mount if not given.
* src/qemu_driver.c: Free hugetlbfs_mount/path parameter in driver shutdown.
Create directory for QEMU hugepage usage, chowning if required.
* docs/formatdomain.html.in: Document memoryBacking/hugepages elements
* docs/schemas/domain.rng: Add memoryBacking/hugepages elements to schema
* src/util.c, src/util.h, src/libvirt_private.syms: Add virFileFindMountPoint
helper API
* tests/qemuhelptest.c: Add -mem-path constants
* tests/qemuxml2argvtest.c, tests/qemuxml2xmltest.c: Add tests for hugepage
handling
* tests/qemuxml2argvdata/qemuxml2argv-hugepages.xml,
tests/qemuxml2argvdata/qemuxml2argv-hugepages.args: Data files for
hugepage tests
2009-08-25 15:05:18 +01:00
|
|
|
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
#if WITH_CAPNG
|
|
|
|
/* Set the real and effective uid and gid to the given values, while
|
|
|
|
* maintaining the capabilities indicated by bits in @capBits. Return
|
|
|
|
* 0 on success, -1 on failure (the original system error remains in
|
|
|
|
* errno).
|
|
|
|
*/
|
|
|
|
int
|
util: make virSetUIDGID async-signal-safe
https://bugzilla.redhat.com/show_bug.cgi?id=964358
POSIX states that multi-threaded apps should not use functions
that are not async-signal-safe between fork and exec, yet we
were using getpwuid_r and initgroups. Although rare, it is
possible to hit deadlock in the child, when it tries to grab
a mutex that was already held by another thread in the parent.
I actually hit this deadlock when testing multiple domains
being started in parallel with a command hook, with the following
backtrace in the child:
Thread 1 (Thread 0x7fd56bbf2700 (LWP 3212)):
#0 __lll_lock_wait ()
at ../nptl/sysdeps/unix/sysv/linux/x86_64/lowlevellock.S:136
#1 0x00007fd5761e7388 in _L_lock_854 () from /lib64/libpthread.so.0
#2 0x00007fd5761e7257 in __pthread_mutex_lock (mutex=0x7fd56be00360)
at pthread_mutex_lock.c:61
#3 0x00007fd56bbf9fc5 in _nss_files_getpwuid_r (uid=0, result=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, errnop=0x7fd56bbf25b8)
at nss_files/files-pwd.c:40
#4 0x00007fd575aeff1d in __getpwuid_r (uid=0, resbuf=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, result=0x7fd56bbf0cb0)
at ../nss/getXXbyYY_r.c:253
#5 0x00007fd578aebafc in virSetUIDGID (uid=0, gid=0) at util/virutil.c:1031
#6 0x00007fd578aebf43 in virSetUIDGIDWithCaps (uid=0, gid=0, capBits=0,
clearExistingCaps=true) at util/virutil.c:1388
#7 0x00007fd578a9a20b in virExec (cmd=0x7fd55c231f10) at util/vircommand.c:654
#8 0x00007fd578a9dfa2 in virCommandRunAsync (cmd=0x7fd55c231f10, pid=0x0)
at util/vircommand.c:2247
#9 0x00007fd578a9d74e in virCommandRun (cmd=0x7fd55c231f10, exitstatus=0x0)
at util/vircommand.c:2100
#10 0x00007fd56326fde5 in qemuProcessStart (conn=0x7fd53c000df0,
driver=0x7fd55c0dc4f0, vm=0x7fd54800b100, migrateFrom=0x0, stdin_fd=-1,
stdin_path=0x0, snapshot=0x0, vmop=VIR_NETDEV_VPORT_PROFILE_OP_CREATE,
flags=1) at qemu/qemu_process.c:3694
...
The solution is to split the work of getpwuid_r/initgroups into the
unsafe portions (getgrouplist, called pre-fork) and safe portions
(setgroups, called post-fork).
* src/util/virutil.h (virSetUIDGID, virSetUIDGIDWithCaps): Adjust
signature.
* src/util/virutil.c (virSetUIDGID): Add parameters.
(virSetUIDGIDWithCaps): Adjust clients.
* src/util/vircommand.c (virExec): Likewise.
* src/util/virfile.c (virFileAccessibleAs, virFileOpenForked)
(virDirCreate): Likewise.
* src/security/security_dac.c (virSecurityDACSetProcessLabel):
Likewise.
* src/lxc/lxc_container.c (lxcContainerSetID): Likewise.
* configure.ac (AC_CHECK_FUNCS_ONCE): Check for setgroups, not
initgroups.
Signed-off-by: Eric Blake <eblake@redhat.com>
2013-05-21 20:59:10 -06:00
|
|
|
virSetUIDGIDWithCaps(uid_t uid, gid_t gid, gid_t *groups, int ngroups,
|
|
|
|
unsigned long long capBits, bool clearExistingCaps)
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
{
|
Convert 'int i' to 'size_t i' in src/util/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 15:09:33 +01:00
|
|
|
size_t i;
|
2019-10-21 15:19:04 -03:00
|
|
|
int capng_ret;
|
2019-01-24 10:33:01 +01:00
|
|
|
bool need_setgid = false;
|
|
|
|
bool need_setuid = false;
|
2013-03-25 15:25:28 +01:00
|
|
|
bool need_setpcap = false;
|
2019-01-24 10:33:01 +01:00
|
|
|
const char *capstr = NULL;
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
|
2013-03-13 15:26:35 -04:00
|
|
|
/* First drop all caps (unless the requested uid is "unchanged" or
|
|
|
|
* root and clearExistingCaps wasn't requested), then add back
|
|
|
|
* those in capBits + the extra ones we need to change uid/gid and
|
|
|
|
* change the capabilities bounding set.
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
*/
|
|
|
|
|
2013-03-14 16:28:29 -06:00
|
|
|
if (clearExistingCaps || (uid != (uid_t)-1 && uid != 0))
|
2019-01-24 10:33:01 +01:00
|
|
|
capng_clear(CAPNG_SELECT_BOTH);
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
|
Convert 'int i' to 'size_t i' in src/util/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 15:09:33 +01:00
|
|
|
for (i = 0; i <= CAP_LAST_CAP; i++) {
|
2019-01-24 10:33:01 +01:00
|
|
|
capstr = capng_capability_to_name(i);
|
|
|
|
|
Convert 'int i' to 'size_t i' in src/util/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 15:09:33 +01:00
|
|
|
if (capBits & (1ULL << i)) {
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
capng_update(CAPNG_ADD,
|
|
|
|
CAPNG_EFFECTIVE|CAPNG_INHERITABLE|
|
|
|
|
CAPNG_PERMITTED|CAPNG_BOUNDING_SET,
|
Convert 'int i' to 'size_t i' in src/util/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 15:09:33 +01:00
|
|
|
i);
|
2019-01-24 10:33:01 +01:00
|
|
|
|
|
|
|
VIR_DEBUG("Added '%s' to child capabilities' set", capstr);
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (gid != (gid_t)-1 &&
|
|
|
|
!capng_have_capability(CAPNG_EFFECTIVE, CAP_SETGID)) {
|
|
|
|
need_setgid = true;
|
|
|
|
capng_update(CAPNG_ADD, CAPNG_EFFECTIVE|CAPNG_PERMITTED, CAP_SETGID);
|
|
|
|
}
|
|
|
|
if (uid != (uid_t)-1 &&
|
|
|
|
!capng_have_capability(CAPNG_EFFECTIVE, CAP_SETUID)) {
|
|
|
|
need_setuid = true;
|
|
|
|
capng_update(CAPNG_ADD, CAPNG_EFFECTIVE|CAPNG_PERMITTED, CAP_SETUID);
|
|
|
|
}
|
|
|
|
# ifdef PR_CAPBSET_DROP
|
|
|
|
/* If newer kernel, we need also need setpcap to change the bounding set */
|
|
|
|
if ((capBits || need_setgid || need_setuid) &&
|
|
|
|
!capng_have_capability(CAPNG_EFFECTIVE, CAP_SETPCAP)) {
|
|
|
|
need_setpcap = true;
|
|
|
|
}
|
|
|
|
if (need_setpcap)
|
|
|
|
capng_update(CAPNG_ADD, CAPNG_EFFECTIVE|CAPNG_PERMITTED, CAP_SETPCAP);
|
|
|
|
# endif
|
|
|
|
|
|
|
|
/* Tell system we want to keep caps across uid change */
|
2013-03-25 15:25:28 +01:00
|
|
|
if (prctl(PR_SET_KEEPCAPS, 1, 0, 0, 0)) {
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
virReportSystemError(errno, "%s",
|
|
|
|
_("prctl failed to set KEEPCAPS"));
|
2019-10-21 15:19:04 -03:00
|
|
|
return -1;
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Change to the temp capabilities */
|
2013-03-25 15:25:28 +01:00
|
|
|
if ((capng_ret = capng_apply(CAPNG_SELECT_CAPS)) < 0) {
|
2013-03-25 15:25:29 +01:00
|
|
|
/* Failed. If we are running unprivileged, and the arguments make sense
|
|
|
|
* for this scenario, assume we're starting some kind of setuid helper:
|
|
|
|
* do not set any of capBits in the permitted or effective sets, and let
|
|
|
|
* the program get them on its own.
|
|
|
|
*
|
|
|
|
* (Too bad we cannot restrict the bounding set to the capabilities we
|
|
|
|
* would like the helper to have!).
|
|
|
|
*/
|
|
|
|
if (getuid() > 0 && clearExistingCaps && !need_setuid && !need_setgid) {
|
|
|
|
capng_clear(CAPNG_SELECT_CAPS);
|
|
|
|
} else {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("cannot apply process capabilities %d"), capng_ret);
|
2019-10-21 15:19:04 -03:00
|
|
|
return -1;
|
2013-03-25 15:25:29 +01:00
|
|
|
}
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
}
|
|
|
|
|
util: make virSetUIDGID async-signal-safe
https://bugzilla.redhat.com/show_bug.cgi?id=964358
POSIX states that multi-threaded apps should not use functions
that are not async-signal-safe between fork and exec, yet we
were using getpwuid_r and initgroups. Although rare, it is
possible to hit deadlock in the child, when it tries to grab
a mutex that was already held by another thread in the parent.
I actually hit this deadlock when testing multiple domains
being started in parallel with a command hook, with the following
backtrace in the child:
Thread 1 (Thread 0x7fd56bbf2700 (LWP 3212)):
#0 __lll_lock_wait ()
at ../nptl/sysdeps/unix/sysv/linux/x86_64/lowlevellock.S:136
#1 0x00007fd5761e7388 in _L_lock_854 () from /lib64/libpthread.so.0
#2 0x00007fd5761e7257 in __pthread_mutex_lock (mutex=0x7fd56be00360)
at pthread_mutex_lock.c:61
#3 0x00007fd56bbf9fc5 in _nss_files_getpwuid_r (uid=0, result=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, errnop=0x7fd56bbf25b8)
at nss_files/files-pwd.c:40
#4 0x00007fd575aeff1d in __getpwuid_r (uid=0, resbuf=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, result=0x7fd56bbf0cb0)
at ../nss/getXXbyYY_r.c:253
#5 0x00007fd578aebafc in virSetUIDGID (uid=0, gid=0) at util/virutil.c:1031
#6 0x00007fd578aebf43 in virSetUIDGIDWithCaps (uid=0, gid=0, capBits=0,
clearExistingCaps=true) at util/virutil.c:1388
#7 0x00007fd578a9a20b in virExec (cmd=0x7fd55c231f10) at util/vircommand.c:654
#8 0x00007fd578a9dfa2 in virCommandRunAsync (cmd=0x7fd55c231f10, pid=0x0)
at util/vircommand.c:2247
#9 0x00007fd578a9d74e in virCommandRun (cmd=0x7fd55c231f10, exitstatus=0x0)
at util/vircommand.c:2100
#10 0x00007fd56326fde5 in qemuProcessStart (conn=0x7fd53c000df0,
driver=0x7fd55c0dc4f0, vm=0x7fd54800b100, migrateFrom=0x0, stdin_fd=-1,
stdin_path=0x0, snapshot=0x0, vmop=VIR_NETDEV_VPORT_PROFILE_OP_CREATE,
flags=1) at qemu/qemu_process.c:3694
...
The solution is to split the work of getpwuid_r/initgroups into the
unsafe portions (getgrouplist, called pre-fork) and safe portions
(setgroups, called post-fork).
* src/util/virutil.h (virSetUIDGID, virSetUIDGIDWithCaps): Adjust
signature.
* src/util/virutil.c (virSetUIDGID): Add parameters.
(virSetUIDGIDWithCaps): Adjust clients.
* src/util/vircommand.c (virExec): Likewise.
* src/util/virfile.c (virFileAccessibleAs, virFileOpenForked)
(virDirCreate): Likewise.
* src/security/security_dac.c (virSecurityDACSetProcessLabel):
Likewise.
* src/lxc/lxc_container.c (lxcContainerSetID): Likewise.
* configure.ac (AC_CHECK_FUNCS_ONCE): Check for setgroups, not
initgroups.
Signed-off-by: Eric Blake <eblake@redhat.com>
2013-05-21 20:59:10 -06:00
|
|
|
if (virSetUIDGID(uid, gid, groups, ngroups) < 0)
|
2019-10-21 15:19:04 -03:00
|
|
|
return -1;
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
|
|
|
|
/* Tell it we are done keeping capabilities */
|
2013-03-25 15:25:28 +01:00
|
|
|
if (prctl(PR_SET_KEEPCAPS, 0, 0, 0, 0)) {
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
virReportSystemError(errno, "%s",
|
|
|
|
_("prctl failed to reset KEEPCAPS"));
|
2019-10-21 15:19:04 -03:00
|
|
|
return -1;
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
}
|
|
|
|
|
2019-01-24 10:33:01 +01:00
|
|
|
# ifdef PR_CAP_AMBIENT
|
|
|
|
/* we couldn't do this in the loop earlier above, because the capabilities
|
|
|
|
* were not applied yet, since in order to add a capability into the AMBIENT
|
|
|
|
* set, it has to be present in both the PERMITTED and INHERITABLE sets
|
|
|
|
* (capabilities(7))
|
|
|
|
*/
|
|
|
|
for (i = 0; i <= CAP_LAST_CAP; i++) {
|
|
|
|
capstr = capng_capability_to_name(i);
|
|
|
|
|
|
|
|
if (capBits & (1ULL << i)) {
|
|
|
|
if (prctl(PR_CAP_AMBIENT, PR_CAP_AMBIENT_RAISE, i, 0, 0) < 0) {
|
|
|
|
virReportSystemError(errno,
|
|
|
|
_("prctl failed to enable '%s' in the "
|
|
|
|
"AMBIENT set"),
|
|
|
|
capstr);
|
2019-10-21 15:19:04 -03:00
|
|
|
return -1;
|
2019-01-24 10:33:01 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
# endif
|
|
|
|
|
2013-03-25 15:25:28 +01:00
|
|
|
/* Set bounding set while we have CAP_SETPCAP. Unfortunately we cannot
|
|
|
|
* do this if we failed to get the capability above, so ignore the
|
|
|
|
* return value.
|
|
|
|
*/
|
|
|
|
capng_apply(CAPNG_SELECT_BOUNDS);
|
|
|
|
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
/* Drop the caps that allow setuid/gid (unless they were requested) */
|
|
|
|
if (need_setgid)
|
|
|
|
capng_update(CAPNG_DROP, CAPNG_EFFECTIVE|CAPNG_PERMITTED, CAP_SETGID);
|
|
|
|
if (need_setuid)
|
|
|
|
capng_update(CAPNG_DROP, CAPNG_EFFECTIVE|CAPNG_PERMITTED, CAP_SETUID);
|
|
|
|
/* Throw away CAP_SETPCAP so no more changes */
|
|
|
|
if (need_setpcap)
|
|
|
|
capng_update(CAPNG_DROP, CAPNG_EFFECTIVE|CAPNG_PERMITTED, CAP_SETPCAP);
|
|
|
|
|
2013-03-25 15:25:28 +01:00
|
|
|
if (((capng_ret = capng_apply(CAPNG_SELECT_CAPS)) < 0)) {
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("cannot apply process capabilities %d"), capng_ret);
|
2019-10-21 15:19:04 -03:00
|
|
|
return -1;
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
}
|
|
|
|
|
2019-10-21 15:19:04 -03:00
|
|
|
return 0;
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
#else
|
|
|
|
/*
|
|
|
|
* On platforms without libcapng, the capabilities setting is treated
|
|
|
|
* as a NOP.
|
|
|
|
*/
|
|
|
|
|
|
|
|
int
|
util: make virSetUIDGID async-signal-safe
https://bugzilla.redhat.com/show_bug.cgi?id=964358
POSIX states that multi-threaded apps should not use functions
that are not async-signal-safe between fork and exec, yet we
were using getpwuid_r and initgroups. Although rare, it is
possible to hit deadlock in the child, when it tries to grab
a mutex that was already held by another thread in the parent.
I actually hit this deadlock when testing multiple domains
being started in parallel with a command hook, with the following
backtrace in the child:
Thread 1 (Thread 0x7fd56bbf2700 (LWP 3212)):
#0 __lll_lock_wait ()
at ../nptl/sysdeps/unix/sysv/linux/x86_64/lowlevellock.S:136
#1 0x00007fd5761e7388 in _L_lock_854 () from /lib64/libpthread.so.0
#2 0x00007fd5761e7257 in __pthread_mutex_lock (mutex=0x7fd56be00360)
at pthread_mutex_lock.c:61
#3 0x00007fd56bbf9fc5 in _nss_files_getpwuid_r (uid=0, result=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, errnop=0x7fd56bbf25b8)
at nss_files/files-pwd.c:40
#4 0x00007fd575aeff1d in __getpwuid_r (uid=0, resbuf=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, result=0x7fd56bbf0cb0)
at ../nss/getXXbyYY_r.c:253
#5 0x00007fd578aebafc in virSetUIDGID (uid=0, gid=0) at util/virutil.c:1031
#6 0x00007fd578aebf43 in virSetUIDGIDWithCaps (uid=0, gid=0, capBits=0,
clearExistingCaps=true) at util/virutil.c:1388
#7 0x00007fd578a9a20b in virExec (cmd=0x7fd55c231f10) at util/vircommand.c:654
#8 0x00007fd578a9dfa2 in virCommandRunAsync (cmd=0x7fd55c231f10, pid=0x0)
at util/vircommand.c:2247
#9 0x00007fd578a9d74e in virCommandRun (cmd=0x7fd55c231f10, exitstatus=0x0)
at util/vircommand.c:2100
#10 0x00007fd56326fde5 in qemuProcessStart (conn=0x7fd53c000df0,
driver=0x7fd55c0dc4f0, vm=0x7fd54800b100, migrateFrom=0x0, stdin_fd=-1,
stdin_path=0x0, snapshot=0x0, vmop=VIR_NETDEV_VPORT_PROFILE_OP_CREATE,
flags=1) at qemu/qemu_process.c:3694
...
The solution is to split the work of getpwuid_r/initgroups into the
unsafe portions (getgrouplist, called pre-fork) and safe portions
(setgroups, called post-fork).
* src/util/virutil.h (virSetUIDGID, virSetUIDGIDWithCaps): Adjust
signature.
* src/util/virutil.c (virSetUIDGID): Add parameters.
(virSetUIDGIDWithCaps): Adjust clients.
* src/util/vircommand.c (virExec): Likewise.
* src/util/virfile.c (virFileAccessibleAs, virFileOpenForked)
(virDirCreate): Likewise.
* src/security/security_dac.c (virSecurityDACSetProcessLabel):
Likewise.
* src/lxc/lxc_container.c (lxcContainerSetID): Likewise.
* configure.ac (AC_CHECK_FUNCS_ONCE): Check for setgroups, not
initgroups.
Signed-off-by: Eric Blake <eblake@redhat.com>
2013-05-21 20:59:10 -06:00
|
|
|
virSetUIDGIDWithCaps(uid_t uid, gid_t gid, gid_t *groups, int ngroups,
|
2019-10-14 14:45:33 +02:00
|
|
|
unsigned long long capBits G_GNUC_UNUSED,
|
|
|
|
bool clearExistingCaps G_GNUC_UNUSED)
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
{
|
util: make virSetUIDGID async-signal-safe
https://bugzilla.redhat.com/show_bug.cgi?id=964358
POSIX states that multi-threaded apps should not use functions
that are not async-signal-safe between fork and exec, yet we
were using getpwuid_r and initgroups. Although rare, it is
possible to hit deadlock in the child, when it tries to grab
a mutex that was already held by another thread in the parent.
I actually hit this deadlock when testing multiple domains
being started in parallel with a command hook, with the following
backtrace in the child:
Thread 1 (Thread 0x7fd56bbf2700 (LWP 3212)):
#0 __lll_lock_wait ()
at ../nptl/sysdeps/unix/sysv/linux/x86_64/lowlevellock.S:136
#1 0x00007fd5761e7388 in _L_lock_854 () from /lib64/libpthread.so.0
#2 0x00007fd5761e7257 in __pthread_mutex_lock (mutex=0x7fd56be00360)
at pthread_mutex_lock.c:61
#3 0x00007fd56bbf9fc5 in _nss_files_getpwuid_r (uid=0, result=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, errnop=0x7fd56bbf25b8)
at nss_files/files-pwd.c:40
#4 0x00007fd575aeff1d in __getpwuid_r (uid=0, resbuf=0x7fd56bbf0c70,
buffer=0x7fd55c2a65f0 "", buflen=1024, result=0x7fd56bbf0cb0)
at ../nss/getXXbyYY_r.c:253
#5 0x00007fd578aebafc in virSetUIDGID (uid=0, gid=0) at util/virutil.c:1031
#6 0x00007fd578aebf43 in virSetUIDGIDWithCaps (uid=0, gid=0, capBits=0,
clearExistingCaps=true) at util/virutil.c:1388
#7 0x00007fd578a9a20b in virExec (cmd=0x7fd55c231f10) at util/vircommand.c:654
#8 0x00007fd578a9dfa2 in virCommandRunAsync (cmd=0x7fd55c231f10, pid=0x0)
at util/vircommand.c:2247
#9 0x00007fd578a9d74e in virCommandRun (cmd=0x7fd55c231f10, exitstatus=0x0)
at util/vircommand.c:2100
#10 0x00007fd56326fde5 in qemuProcessStart (conn=0x7fd53c000df0,
driver=0x7fd55c0dc4f0, vm=0x7fd54800b100, migrateFrom=0x0, stdin_fd=-1,
stdin_path=0x0, snapshot=0x0, vmop=VIR_NETDEV_VPORT_PROFILE_OP_CREATE,
flags=1) at qemu/qemu_process.c:3694
...
The solution is to split the work of getpwuid_r/initgroups into the
unsafe portions (getgrouplist, called pre-fork) and safe portions
(setgroups, called post-fork).
* src/util/virutil.h (virSetUIDGID, virSetUIDGIDWithCaps): Adjust
signature.
* src/util/virutil.c (virSetUIDGID): Add parameters.
(virSetUIDGIDWithCaps): Adjust clients.
* src/util/vircommand.c (virExec): Likewise.
* src/util/virfile.c (virFileAccessibleAs, virFileOpenForked)
(virDirCreate): Likewise.
* src/security/security_dac.c (virSecurityDACSetProcessLabel):
Likewise.
* src/lxc/lxc_container.c (lxcContainerSetID): Likewise.
* configure.ac (AC_CHECK_FUNCS_ONCE): Check for setgroups, not
initgroups.
Signed-off-by: Eric Blake <eblake@redhat.com>
2013-05-21 20:59:10 -06:00
|
|
|
return virSetUIDGID(uid, gid, groups, ngroups);
|
util: virSetUIDGIDWithCaps - change uid while keeping caps
Normally when a process' uid is changed to non-0, all the capabilities
bits are cleared, even those explicitly set with calls to
capng_update()/capng_apply() made immediately before setuid. And
*after* the process' uid has been changed, it no longer has the
necessary privileges to add capabilities back to the process.
In order to set a non-0 uid while still maintaining any capabilities
bits, it is necessary to either call capng_change_id() (which
unfortunately doesn't currently call initgroups to setup auxiliary
group membership), or to perform the small amount of calisthenics
contained in the new utility function virSetUIDGIDWithCaps().
Another very important difference between the capabilities
setting/clearing in virSetUIDGIDWithCaps() and virCommand's
virSetCapabilities() (which it will replace in the next patch) is that
the new function properly clears the capabilities bounding set, so it
will not be possible for a child process to set any new
capabilities.
A short description of what is done by virSetUIDGIDWithCaps():
1) clear all capabilities then set all those desired by the caller (in
capBits) plus CAP_SETGID, CAP_SETUID, and CAP_SETPCAP (which is needed
to change the capabilities bounding set).
2) call prctl(), telling it that we want to maintain current
capabilities across an upcoming setuid().
3) switch to the new uid/gid
4) again call prctl(), telling it we will no longer want capabilities
maintained if this process does another setuid().
5) clear the capabilities that we added to allow us to
setuid/setgid/change the bounding set (unless they were also requested
by the caller via the virCommand API).
Because the modification/maintaining of capabilities is intermingled
with setting the uid, this is necessarily done in a single function,
rather than having two independent functions.
Note that, due to the way that effective capabilities are computed (at
time of execve) for a process that has uid != 0, the *file*
capabilities of the binary being executed must also have the desired
capabilities bit(s) set (see "man 7 capabilities"). This can be done
with the "filecap" command. (e.g. "filecap /usr/bin/qemu-kvm sys_rawio").
2013-02-05 10:30:32 -05:00
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
Support configuration of huge pages in guests
Add option to domain XML for
<memoryBacking>
<hugepages/>
</memoryBacking>
* configure.in: Add check for mntent.h
* qemud/libvirtd_qemu.aug, qemud/test_libvirtd_qemu.aug, src/qemu.conf
Add 'hugetlbfs_mount' config parameter
* src/qemu_conf.c, src/qemu_conf.h: Check for -mem-path flag in QEMU,
and pass it when hugepages are requested.
Load hugetlbfs_mount config parameter, search for mount if not given.
* src/qemu_driver.c: Free hugetlbfs_mount/path parameter in driver shutdown.
Create directory for QEMU hugepage usage, chowning if required.
* docs/formatdomain.html.in: Document memoryBacking/hugepages elements
* docs/schemas/domain.rng: Add memoryBacking/hugepages elements to schema
* src/util.c, src/util.h, src/libvirt_private.syms: Add virFileFindMountPoint
helper API
* tests/qemuhelptest.c: Add -mem-path constants
* tests/qemuxml2argvtest.c, tests/qemuxml2xmltest.c: Add tests for hugepage
handling
* tests/qemuxml2argvdata/qemuxml2argv-hugepages.xml,
tests/qemuxml2argvdata/qemuxml2argv-hugepages.args: Data files for
hugepage tests
2009-08-25 15:05:18 +01:00
|
|
|
|
2017-02-20 07:00:51 -05:00
|
|
|
void virWaitForDevices(void)
|
2009-09-10 14:21:10 +01:00
|
|
|
{
|
2019-10-15 14:47:50 +02:00
|
|
|
g_autoptr(virCommand) cmd = NULL;
|
2019-10-15 15:16:31 +02:00
|
|
|
g_autofree char *udev = NULL;
|
2009-09-10 14:21:10 +01:00
|
|
|
int exitstatus;
|
|
|
|
|
2019-05-17 11:09:45 +02:00
|
|
|
if (!(udev = virFindFileInPath(UDEVADM)))
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (!(cmd = virCommandNewArgList(udev, "settle", NULL)))
|
2009-09-10 14:21:10 +01:00
|
|
|
return;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* NOTE: we ignore errors here; this is just to make sure that any device
|
|
|
|
* nodes that are being created finish before we try to scan them.
|
|
|
|
*/
|
2019-05-17 11:09:45 +02:00
|
|
|
ignore_value(virCommandRun(cmd, &exitstatus));
|
2009-09-10 14:21:10 +01:00
|
|
|
}
|
2009-11-12 22:48:24 +01:00
|
|
|
|
2016-12-12 13:33:42 +01:00
|
|
|
#if WITH_DEVMAPPER
|
2011-02-17 15:29:07 +08:00
|
|
|
bool
|
2011-09-16 14:05:58 +02:00
|
|
|
virIsDevMapperDevice(const char *dev_name)
|
2011-02-17 15:29:07 +08:00
|
|
|
{
|
|
|
|
struct stat buf;
|
|
|
|
|
2011-09-16 14:05:58 +02:00
|
|
|
if (!stat(dev_name, &buf) &&
|
2011-02-17 15:29:07 +08:00
|
|
|
S_ISBLK(buf.st_mode) &&
|
|
|
|
dm_is_dm_major(major(buf.st_rdev)))
|
|
|
|
return true;
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
2011-02-18 12:00:47 -07:00
|
|
|
#else
|
2019-10-14 14:45:33 +02:00
|
|
|
bool virIsDevMapperDevice(const char *dev_name G_GNUC_UNUSED)
|
2011-02-18 12:00:47 -07:00
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
#endif
|
2012-09-11 16:57:02 +08:00
|
|
|
|
|
|
|
bool
|
2014-03-18 09:14:35 +01:00
|
|
|
virValidateWWN(const char *wwn)
|
|
|
|
{
|
Convert 'int i' to 'size_t i' in src/util/ files
Convert the type of loop iterators named 'i', 'j', k',
'ii', 'jj', 'kk', to be 'size_t' instead of 'int' or
'unsigned int', also santizing 'ii', 'jj', 'kk' to use
the normal 'i', 'j', 'k' naming
Signed-off-by: Daniel P. Berrange <berrange@redhat.com>
2013-07-08 15:09:33 +01:00
|
|
|
size_t i;
|
qemu: Allow the disk wwn to have "0x" prefix
The recent qemu requires "0x" prefix for the disk wwn, this patch
changes virValidateWWN to allow the prefix, and prepend "0x" if
it's not specified. E.g.
qemu-kvm: -device scsi-hd,bus=scsi0.0,channel=0,scsi-id=0,lun=0,\
drive=drive-scsi0-0-0-0,id=scsi0-0-0-0,wwn=6000c60016ea71ad:
Property 'scsi-hd.wwn' doesn't take value '6000c60016ea71ad'
Though it's a qemu regression, but it's nice to allow the prefix,
and doesn't hurt for us to always output "0x".
2013-04-17 21:23:44 +08:00
|
|
|
const char *p = wwn;
|
2012-09-11 16:57:02 +08:00
|
|
|
|
2014-11-13 15:28:18 +01:00
|
|
|
if (STRPREFIX(wwn, "0x"))
|
qemu: Allow the disk wwn to have "0x" prefix
The recent qemu requires "0x" prefix for the disk wwn, this patch
changes virValidateWWN to allow the prefix, and prepend "0x" if
it's not specified. E.g.
qemu-kvm: -device scsi-hd,bus=scsi0.0,channel=0,scsi-id=0,lun=0,\
drive=drive-scsi0-0-0-0,id=scsi0-0-0-0,wwn=6000c60016ea71ad:
Property 'scsi-hd.wwn' doesn't take value '6000c60016ea71ad'
Though it's a qemu regression, but it's nice to allow the prefix,
and doesn't hurt for us to always output "0x".
2013-04-17 21:23:44 +08:00
|
|
|
p += 2;
|
|
|
|
|
|
|
|
for (i = 0; p[i]; i++) {
|
2019-11-18 15:16:00 +01:00
|
|
|
if (!g_ascii_isxdigit(p[i]))
|
2012-09-11 16:57:02 +08:00
|
|
|
break;
|
qemu: Allow the disk wwn to have "0x" prefix
The recent qemu requires "0x" prefix for the disk wwn, this patch
changes virValidateWWN to allow the prefix, and prepend "0x" if
it's not specified. E.g.
qemu-kvm: -device scsi-hd,bus=scsi0.0,channel=0,scsi-id=0,lun=0,\
drive=drive-scsi0-0-0-0,id=scsi0-0-0-0,wwn=6000c60016ea71ad:
Property 'scsi-hd.wwn' doesn't take value '6000c60016ea71ad'
Though it's a qemu regression, but it's nice to allow the prefix,
and doesn't hurt for us to always output "0x".
2013-04-17 21:23:44 +08:00
|
|
|
}
|
2012-09-11 16:57:02 +08:00
|
|
|
|
qemu: Allow the disk wwn to have "0x" prefix
The recent qemu requires "0x" prefix for the disk wwn, this patch
changes virValidateWWN to allow the prefix, and prepend "0x" if
it's not specified. E.g.
qemu-kvm: -device scsi-hd,bus=scsi0.0,channel=0,scsi-id=0,lun=0,\
drive=drive-scsi0-0-0-0,id=scsi0-0-0-0,wwn=6000c60016ea71ad:
Property 'scsi-hd.wwn' doesn't take value '6000c60016ea71ad'
Though it's a qemu regression, but it's nice to allow the prefix,
and doesn't hurt for us to always output "0x".
2013-04-17 21:23:44 +08:00
|
|
|
if (i != 16 || p[i]) {
|
2014-11-11 10:12:20 +08:00
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("Malformed wwn: %s"), wwn);
|
2012-09-11 16:57:02 +08:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
2012-12-06 18:23:02 +08:00
|
|
|
|
2013-01-02 22:37:06 +08:00
|
|
|
#if defined(major) && defined(minor)
|
|
|
|
int
|
|
|
|
virGetDeviceID(const char *path, int *maj, int *min)
|
|
|
|
{
|
|
|
|
struct stat sb;
|
|
|
|
|
2013-01-09 16:34:15 -07:00
|
|
|
if (stat(path, &sb) < 0)
|
2013-01-02 22:37:06 +08:00
|
|
|
return -errno;
|
|
|
|
|
2013-01-09 16:34:15 -07:00
|
|
|
if (!S_ISBLK(sb.st_mode))
|
2013-01-02 22:37:06 +08:00
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
if (maj)
|
|
|
|
*maj = major(sb.st_rdev);
|
|
|
|
if (min)
|
|
|
|
*min = minor(sb.st_rdev);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
#else
|
|
|
|
int
|
2019-10-14 14:45:33 +02:00
|
|
|
virGetDeviceID(const char *path G_GNUC_UNUSED,
|
|
|
|
int *maj G_GNUC_UNUSED,
|
|
|
|
int *min G_GNUC_UNUSED)
|
2013-01-02 22:37:06 +08:00
|
|
|
{
|
|
|
|
return -ENOSYS;
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#define SYSFS_DEV_BLOCK_PATH "/sys/dev/block"
|
|
|
|
|
2013-01-02 22:37:10 +08:00
|
|
|
char *
|
2013-01-02 22:37:06 +08:00
|
|
|
virGetUnprivSGIOSysfsPath(const char *path,
|
|
|
|
const char *sysfs_dir)
|
|
|
|
{
|
|
|
|
int maj, min;
|
|
|
|
char *sysfs_path = NULL;
|
|
|
|
int rc;
|
|
|
|
|
|
|
|
if ((rc = virGetDeviceID(path, &maj, &min)) < 0) {
|
|
|
|
virReportSystemError(-rc,
|
|
|
|
_("Unable to get device ID '%s'"),
|
|
|
|
path);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2019-10-22 15:26:14 +02:00
|
|
|
sysfs_path = g_strdup_printf("%s/%d:%d/queue/unpriv_sgio",
|
|
|
|
sysfs_dir ? sysfs_dir : SYSFS_DEV_BLOCK_PATH,
|
|
|
|
maj, min);
|
2013-01-02 22:37:06 +08:00
|
|
|
return sysfs_path;
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
|
|
|
virSetDeviceUnprivSGIO(const char *path,
|
|
|
|
const char *sysfs_dir,
|
|
|
|
int unpriv_sgio)
|
|
|
|
{
|
|
|
|
char *sysfs_path = NULL;
|
|
|
|
char *val = NULL;
|
|
|
|
int ret = -1;
|
|
|
|
int rc;
|
|
|
|
|
|
|
|
if (!(sysfs_path = virGetUnprivSGIOSysfsPath(path, sysfs_dir)))
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (!virFileExists(sysfs_path)) {
|
|
|
|
virReportError(VIR_ERR_OPERATION_INVALID, "%s",
|
|
|
|
_("unpriv_sgio is not supported by this kernel"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
2019-10-22 15:26:14 +02:00
|
|
|
val = g_strdup_printf("%d", unpriv_sgio);
|
2013-01-02 22:37:06 +08:00
|
|
|
|
|
|
|
if ((rc = virFileWriteStr(sysfs_path, val, 0)) < 0) {
|
|
|
|
virReportSystemError(-rc, _("failed to set %s"), sysfs_path);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = 0;
|
2014-03-25 07:53:22 +01:00
|
|
|
cleanup:
|
2013-01-02 22:37:06 +08:00
|
|
|
VIR_FREE(sysfs_path);
|
|
|
|
VIR_FREE(val);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
|
|
|
virGetDeviceUnprivSGIO(const char *path,
|
|
|
|
const char *sysfs_dir,
|
|
|
|
int *unpriv_sgio)
|
|
|
|
{
|
|
|
|
char *sysfs_path = NULL;
|
|
|
|
char *buf = NULL;
|
|
|
|
char *tmp = NULL;
|
|
|
|
int ret = -1;
|
|
|
|
|
|
|
|
if (!(sysfs_path = virGetUnprivSGIOSysfsPath(path, sysfs_dir)))
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (!virFileExists(sysfs_path)) {
|
|
|
|
virReportError(VIR_ERR_OPERATION_INVALID, "%s",
|
|
|
|
_("unpriv_sgio is not supported by this kernel"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (virFileReadAll(sysfs_path, 1024, &buf) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if ((tmp = strchr(buf, '\n')))
|
|
|
|
*tmp = '\0';
|
|
|
|
|
|
|
|
if (virStrToLong_i(buf, NULL, 10, unpriv_sgio) < 0) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR,
|
|
|
|
_("failed to parse value of %s"), sysfs_path);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = 0;
|
2014-03-25 07:53:22 +01:00
|
|
|
cleanup:
|
2013-01-02 22:37:06 +08:00
|
|
|
VIR_FREE(sysfs_path);
|
|
|
|
VIR_FREE(buf);
|
|
|
|
return ret;
|
|
|
|
}
|
2013-01-08 01:05:29 +08:00
|
|
|
|
2013-04-17 17:50:56 +02:00
|
|
|
|
2013-05-24 17:35:01 +02:00
|
|
|
/**
|
|
|
|
* virParseOwnershipIds:
|
|
|
|
*
|
|
|
|
* Parse the usual "uid:gid" ownership specification into uid_t and
|
|
|
|
* gid_t passed as parameters. NULL value for those parameters mean
|
|
|
|
* the information is not needed. Also, none of those values are
|
|
|
|
* changed in case of any error.
|
|
|
|
*
|
|
|
|
* Returns -1 on error, 0 otherwise.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
virParseOwnershipIds(const char *label, uid_t *uidPtr, gid_t *gidPtr)
|
|
|
|
{
|
|
|
|
int rc = -1;
|
|
|
|
uid_t theuid;
|
|
|
|
gid_t thegid;
|
|
|
|
char *tmp_label = NULL;
|
|
|
|
char *sep = NULL;
|
|
|
|
char *owner = NULL;
|
|
|
|
char *group = NULL;
|
|
|
|
|
2019-10-20 13:49:46 +02:00
|
|
|
tmp_label = g_strdup(label);
|
2013-05-24 17:35:01 +02:00
|
|
|
|
|
|
|
/* Split label */
|
|
|
|
sep = strchr(tmp_label, ':');
|
|
|
|
if (sep == NULL) {
|
|
|
|
virReportError(VIR_ERR_INVALID_ARG,
|
|
|
|
_("Failed to parse uid and gid from '%s'"),
|
|
|
|
label);
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
*sep = '\0';
|
|
|
|
owner = tmp_label;
|
|
|
|
group = sep + 1;
|
|
|
|
|
|
|
|
/* Parse owner and group, error message is defined by
|
|
|
|
* virGetUserID or virGetGroupID.
|
|
|
|
*/
|
|
|
|
if (virGetUserID(owner, &theuid) < 0 ||
|
|
|
|
virGetGroupID(group, &thegid) < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
if (uidPtr)
|
|
|
|
*uidPtr = theuid;
|
|
|
|
if (gidPtr)
|
|
|
|
*gidPtr = thegid;
|
|
|
|
|
|
|
|
rc = 0;
|
|
|
|
|
2014-03-25 07:53:22 +01:00
|
|
|
cleanup:
|
2013-05-24 17:35:01 +02:00
|
|
|
VIR_FREE(tmp_label);
|
|
|
|
|
|
|
|
return rc;
|
|
|
|
}
|
2013-10-09 10:52:39 +01:00
|
|
|
|
2014-03-05 17:20:50 +00:00
|
|
|
static time_t selfLastChanged;
|
|
|
|
|
|
|
|
time_t virGetSelfLastChanged(void)
|
|
|
|
{
|
|
|
|
return selfLastChanged;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void virUpdateSelfLastChanged(const char *path)
|
|
|
|
{
|
|
|
|
struct stat sb;
|
|
|
|
|
|
|
|
if (stat(path, &sb) < 0)
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (sb.st_ctime > selfLastChanged) {
|
|
|
|
VIR_DEBUG("Setting self last changed to %lld for '%s'",
|
|
|
|
(long long)sb.st_ctime, path);
|
|
|
|
selfLastChanged = sb.st_ctime;
|
|
|
|
}
|
|
|
|
}
|
2014-07-15 14:34:13 +02:00
|
|
|
|
2015-02-02 05:26:49 -05:00
|
|
|
|
2015-02-03 14:20:25 +01:00
|
|
|
#ifndef WIN32
|
2015-02-02 05:26:49 -05:00
|
|
|
long virGetSystemPageSize(void)
|
|
|
|
{
|
|
|
|
return sysconf(_SC_PAGESIZE);
|
|
|
|
}
|
2015-02-03 14:20:25 +01:00
|
|
|
#else /* WIN32 */
|
|
|
|
long virGetSystemPageSize(void)
|
|
|
|
{
|
|
|
|
errno = ENOSYS;
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
#endif /* WIN32 */
|
2015-02-02 05:26:49 -05:00
|
|
|
|
|
|
|
long virGetSystemPageSizeKB(void)
|
|
|
|
{
|
|
|
|
long val = virGetSystemPageSize();
|
|
|
|
if (val < 0)
|
|
|
|
return val;
|
|
|
|
return val / 1024;
|
|
|
|
}
|
2015-03-04 15:08:09 +01:00
|
|
|
|
|
|
|
/**
|
|
|
|
* virMemoryLimitTruncate
|
|
|
|
*
|
|
|
|
* Return truncated memory limit to VIR_DOMAIN_MEMORY_PARAM_UNLIMITED as maximum
|
|
|
|
* which means that the limit is not set => unlimited.
|
|
|
|
*/
|
|
|
|
unsigned long long
|
|
|
|
virMemoryLimitTruncate(unsigned long long value)
|
|
|
|
{
|
|
|
|
return value < VIR_DOMAIN_MEMORY_PARAM_UNLIMITED ? value :
|
|
|
|
VIR_DOMAIN_MEMORY_PARAM_UNLIMITED;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* virMemoryLimitIsSet
|
|
|
|
*
|
|
|
|
* Returns true if the limit is set and false for unlimited value.
|
|
|
|
*/
|
|
|
|
bool
|
|
|
|
virMemoryLimitIsSet(unsigned long long value)
|
|
|
|
{
|
|
|
|
return value < VIR_DOMAIN_MEMORY_PARAM_UNLIMITED;
|
|
|
|
}
|
2015-05-05 17:58:49 +02:00
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* virMemoryMaxValue
|
|
|
|
*
|
2015-05-21 16:50:19 +02:00
|
|
|
* @capped: whether the value must fit into unsigned long
|
2015-05-05 17:58:49 +02:00
|
|
|
* (long long is assumed otherwise)
|
|
|
|
*
|
2015-12-10 14:36:51 +01:00
|
|
|
* Note: This function is mocked in tests/qemuxml2argvmock.c for test stability
|
|
|
|
*
|
2015-05-05 17:58:49 +02:00
|
|
|
* Returns the maximum possible memory value in bytes.
|
|
|
|
*/
|
|
|
|
unsigned long long
|
2015-05-21 16:50:19 +02:00
|
|
|
virMemoryMaxValue(bool capped)
|
2015-05-05 17:58:49 +02:00
|
|
|
{
|
|
|
|
/* On 32-bit machines, our bound is 0xffffffff * KiB. On 64-bit
|
|
|
|
* machines, our bound is off_t (2^63). */
|
2015-05-21 16:50:19 +02:00
|
|
|
if (capped && sizeof(unsigned long) < sizeof(long long))
|
2015-05-05 17:58:49 +02:00
|
|
|
return 1024ull * ULONG_MAX;
|
|
|
|
else
|
|
|
|
return LLONG_MAX;
|
|
|
|
}
|
2018-06-01 10:15:58 +02:00
|
|
|
|
|
|
|
|
|
|
|
bool
|
|
|
|
virHostHasIOMMU(void)
|
|
|
|
{
|
|
|
|
DIR *iommuDir = NULL;
|
|
|
|
struct dirent *iommuGroup = NULL;
|
|
|
|
bool ret = false;
|
|
|
|
int direrr;
|
|
|
|
|
|
|
|
if (virDirOpenQuiet(&iommuDir, "/sys/kernel/iommu_groups/") < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
while ((direrr = virDirRead(iommuDir, &iommuGroup, NULL)) > 0)
|
|
|
|
break;
|
|
|
|
|
|
|
|
if (direrr < 0 || !iommuGroup)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
ret = true;
|
|
|
|
|
|
|
|
cleanup:
|
|
|
|
VIR_DIR_CLOSE(iommuDir);
|
|
|
|
return ret;
|
|
|
|
}
|
2018-11-08 11:47:09 +01:00
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* virHostGetDRMRenderNode:
|
|
|
|
*
|
|
|
|
* Picks the first DRM render node available. Missing DRI or missing DRM render
|
|
|
|
* nodes in the system results in an error.
|
|
|
|
*
|
|
|
|
* Returns an absolute path to the first render node available or NULL in case
|
|
|
|
* of an error with the error being reported.
|
|
|
|
* Caller is responsible for freeing the result string.
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
char *
|
|
|
|
virHostGetDRMRenderNode(void)
|
|
|
|
{
|
|
|
|
char *ret = NULL;
|
|
|
|
DIR *driDir = NULL;
|
|
|
|
const char *driPath = "/dev/dri";
|
|
|
|
struct dirent *ent = NULL;
|
|
|
|
int dirErr = 0;
|
|
|
|
bool have_rendernode = false;
|
|
|
|
|
|
|
|
if (virDirOpen(&driDir, driPath) < 0)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
while ((dirErr = virDirRead(driDir, &ent, driPath)) > 0) {
|
|
|
|
if (STRPREFIX(ent->d_name, "renderD")) {
|
|
|
|
have_rendernode = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (dirErr < 0)
|
|
|
|
goto cleanup;
|
|
|
|
|
|
|
|
/* even if /dev/dri exists, there might be no renderDX nodes available */
|
|
|
|
if (!have_rendernode) {
|
|
|
|
virReportError(VIR_ERR_INTERNAL_ERROR, "%s",
|
|
|
|
_("No DRM render nodes available"));
|
|
|
|
goto cleanup;
|
|
|
|
}
|
|
|
|
|
2019-10-22 15:26:14 +02:00
|
|
|
ret = g_strdup_printf("%s/%s", driPath, ent->d_name);
|
2018-11-08 11:47:09 +01:00
|
|
|
|
|
|
|
cleanup:
|
|
|
|
VIR_DIR_CLOSE(driDir);
|
|
|
|
return ret;
|
|
|
|
}
|