blob: a335e2d20017c9d8ac3bc25ea3161bb946c0279d [file] [log] [blame]
/*
nsjail - CLONE_NEWUSER routines
-----------------------------------------
Copyright 2014 Google Inc. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
#include "user.h"
#include <errno.h>
#include <fcntl.h>
#include <grp.h>
#include <limits.h>
#include <linux/securebits.h>
#include <pwd.h>
#include <stdbool.h>
#include <stddef.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <sys/prctl.h>
#include <sys/syscall.h>
#include <sys/types.h>
#include <unistd.h>
#include "logs.h"
#include "macros.h"
#include "subproc.h"
#include "util.h"
#define STR_(x) #x
#define STR(x) STR_(x)
constexpr char kNewUidPath[] =
#ifdef NEWUIDMAP_PATH
STR(NEWUIDMAP_PATH);
#else
"/usr/bin/newuidmap";
#endif
constexpr char kNewGidPath[] =
#ifdef NEWGIDMAP_PATH
STR(NEWGIDMAP_PATH);
#else
"/usr/bin/newgidmap";
#endif
namespace user {
static bool setResGid(gid_t gid) {
LOG_D("setresgid(%d)", gid);
#if defined(__NR_setresgid32)
if (util::syscall(__NR_setresgid32, (uintptr_t)gid, (uintptr_t)gid, (uintptr_t)gid) == -1) {
PLOG_W("setresgid32(%d)", (int)gid);
return false;
}
#else /* defined(__NR_setresgid32) */
if (util::syscall(__NR_setresgid, (uintptr_t)gid, (uintptr_t)gid, (uintptr_t)gid) == -1) {
PLOG_W("setresgid(%d)", gid);
return false;
}
#endif /* defined(__NR_setresuid32) */
return true;
}
static bool setResUid(uid_t uid) {
LOG_D("setresuid(%d)", uid);
#if defined(__NR_setresuid32)
if (util::syscall(__NR_setresuid32, (uintptr_t)uid, (uintptr_t)uid, (uintptr_t)uid) == -1) {
PLOG_W("setresuid32(%d)", (int)uid);
return false;
}
#else /* defined(__NR_setresuid32) */
if (util::syscall(__NR_setresuid, (uintptr_t)uid, (uintptr_t)uid, (uintptr_t)uid) == -1) {
PLOG_W("setresuid(%d)", uid);
return false;
}
#endif /* defined(__NR_setresuid32) */
return true;
}
static bool hasGidMapSelf(nsjconf_t* nsjconf) {
for (const auto& gid : nsjconf->gids) {
if (!gid.is_newidmap) {
return true;
}
}
return false;
}
static bool setGroupsDeny(nsjconf_t* nsjconf, pid_t pid) {
/*
* No need to write 'deny' to /proc/pid/setgroups if our euid==0, as writing to
* uid_map/gid_map will succeed anyway
*/
if (!nsjconf->clone_newuser || nsjconf->orig_euid == 0 || !hasGidMapSelf(nsjconf)) {
return true;
}
char fname[PATH_MAX];
snprintf(fname, sizeof(fname), "/proc/%d/setgroups", pid);
const char* const denystr = "deny";
if (!util::writeBufToFile(fname, denystr, strlen(denystr), O_WRONLY | O_CLOEXEC)) {
LOG_E("util::writeBufToFile('%s', '%s') failed", fname, denystr);
return false;
}
return true;
}
static bool uidMapSelf(nsjconf_t* nsjconf, pid_t pid) {
std::string map;
for (const auto& uid : nsjconf->uids) {
if (uid.is_newidmap) {
continue;
}
map.append(std::to_string(uid.inside_id));
map.append(" ");
map.append(std::to_string(uid.outside_id));
map.append(" ");
map.append(std::to_string(uid.count));
map.append("\n");
}
if (map.empty()) {
return true;
}
char fname[PATH_MAX];
snprintf(fname, sizeof(fname), "/proc/%d/uid_map", pid);
LOG_D("Writing '%s' to '%s'", map.c_str(), fname);
if (!util::writeBufToFile(fname, map.data(), map.length(), O_WRONLY | O_CLOEXEC)) {
LOG_E("util::writeBufToFile('%s', '%s') failed", fname, map.c_str());
return false;
}
return true;
}
static bool gidMapSelf(nsjconf_t* nsjconf, pid_t pid) {
std::string map;
for (const auto& gid : nsjconf->gids) {
if (gid.is_newidmap) {
continue;
}
map.append(std::to_string(gid.inside_id));
map.append(" ");
map.append(std::to_string(gid.outside_id));
map.append(" ");
map.append(std::to_string(gid.count));
map.append("\n");
}
if (map.empty()) {
return true;
}
char fname[PATH_MAX];
snprintf(fname, sizeof(fname), "/proc/%d/gid_map", pid);
LOG_D("Writing '%s' to '%s'", map.c_str(), fname);
if (!util::writeBufToFile(fname, map.data(), map.length(), O_WRONLY | O_CLOEXEC)) {
LOG_E("util::writeBufToFile('%s', '%s') failed", fname, map.c_str());
return false;
}
return true;
}
/* Use newgidmap for writing the gid map */
static bool gidMapExternal(nsjconf_t* nsjconf, pid_t pid) {
bool use = false;
std::vector<std::string> argv = {kNewGidPath, std::to_string(pid)};
for (const auto& gid : nsjconf->gids) {
if (!gid.is_newidmap) {
continue;
}
use = true;
argv.push_back(std::to_string(gid.inside_id));
argv.push_back(std::to_string(gid.outside_id));
argv.push_back(std::to_string(gid.count));
}
if (!use) {
return true;
}
if (subproc::systemExe(argv, environ) != 0) {
LOG_E("'%s' failed", kNewGidPath);
return false;
}
return true;
}
/* Use newuidmap for writing the uid map */
static bool uidMapExternal(nsjconf_t* nsjconf, pid_t pid) {
bool use = false;
std::vector<std::string> argv = {kNewUidPath, std::to_string(pid)};
for (const auto& uid : nsjconf->uids) {
if (!uid.is_newidmap) {
continue;
}
use = true;
argv.push_back(std::to_string(uid.inside_id));
argv.push_back(std::to_string(uid.outside_id));
argv.push_back(std::to_string(uid.count));
}
if (!use) {
return true;
}
if (subproc::systemExe(argv, environ) != 0) {
LOG_E("'%s' failed", kNewUidPath);
return false;
}
return true;
}
static bool uidGidMap(nsjconf_t* nsjconf, pid_t pid) {
RETURN_ON_FAILURE(gidMapSelf(nsjconf, pid));
RETURN_ON_FAILURE(gidMapExternal(nsjconf, pid));
RETURN_ON_FAILURE(uidMapSelf(nsjconf, pid));
RETURN_ON_FAILURE(uidMapExternal(nsjconf, pid));
return true;
}
bool initNsFromParent(nsjconf_t* nsjconf, pid_t pid) {
if (!setGroupsDeny(nsjconf, pid)) {
return false;
}
if (!nsjconf->clone_newuser) {
return true;
}
if (!uidGidMap(nsjconf, pid)) {
return false;
}
return true;
}
bool initNsFromChild(nsjconf_t* nsjconf) {
if (!nsjconf->clone_newuser && nsjconf->orig_euid != 0) {
return true;
}
/*
* Make sure all capabilities are retained after the subsequent setuid/setgid, as they will
* be needed for privileged operations: mounts, uts change etc.
*/
if (prctl(PR_SET_SECUREBITS, SECBIT_KEEP_CAPS | SECBIT_NO_SETUID_FIXUP, 0UL, 0UL, 0UL) ==
-1) {
PLOG_E("prctl(PR_SET_SECUREBITS, SECBIT_KEEP_CAPS | SECBIT_NO_SETUID_FIXUP)");
return false;
}
/*
* Best effort because of /proc/self/setgroups. We deny
* setgroups(2) calls only if user namespaces are in use.
*/
std::vector<gid_t> groups;
std::string groupsString = "[";
if (!nsjconf->clone_newuser && nsjconf->gids.size() > 1) {
for (auto it = nsjconf->gids.begin() + 1; it != nsjconf->gids.end(); it++) {
groups.push_back(it->inside_id);
groupsString += std::to_string(it->inside_id);
if (it < nsjconf->gids.end() - 1) groupsString += ", ";
}
}
groupsString += "]";
if (!setResGid(nsjconf->gids[0].inside_id)) {
PLOG_E("setresgid(%lu)", (unsigned long)nsjconf->gids[0].inside_id);
return false;
}
LOG_D("setgroups(%zu, %s)", groups.size(), groupsString.c_str());
if (setgroups(groups.size(), groups.data()) == -1) {
/* Indicate error if specific groups were requested */
if (groups.size() > 0) {
PLOG_E("setgroups(%zu, %s) failed", groups.size(), groupsString.c_str());
return false;
}
PLOG_D("setgroups(%zu, %s) failed", groups.size(), groupsString.c_str());
}
if (!setResUid(nsjconf->uids[0].inside_id)) {
PLOG_E("setresuid(%lu)", (unsigned long)nsjconf->uids[0].inside_id);
return false;
}
/*
* Disable securebits again to avoid spawned programs
* unexpectedly retaining capabilities after a UID/GID
* change.
*/
if (prctl(PR_SET_SECUREBITS, 0UL, 0UL, 0UL, 0UL) == -1) {
PLOG_E("prctl(PR_SET_SECUREBITS, 0)");
return false;
}
return true;
}
static uid_t parseUid(const std::string& id) {
if (id.empty()) {
return getuid();
}
struct passwd* pw = getpwnam(id.c_str());
if (pw != NULL) {
return pw->pw_uid;
}
if (util::isANumber(id.c_str())) {
return (uid_t)strtoimax(id.c_str(), NULL, 0);
}
return (uid_t)-1;
}
static gid_t parseGid(const std::string& id) {
if (id.empty()) {
return getgid();
}
struct group* gr = getgrnam(id.c_str());
if (gr != NULL) {
return gr->gr_gid;
}
if (util::isANumber(id.c_str())) {
return (gid_t)strtoimax(id.c_str(), NULL, 0);
}
return (gid_t)-1;
}
bool parseId(nsjconf_t* nsjconf, const std::string& i_id, const std::string& o_id, size_t cnt,
bool is_gid, bool is_newidmap) {
if (cnt < 1) {
cnt = 1;
}
uid_t inside_id;
uid_t outside_id;
if (is_gid) {
inside_id = parseGid(i_id);
if (inside_id == (uid_t)-1) {
LOG_W("Cannot parse '%s' as GID", i_id.c_str());
return false;
}
outside_id = parseGid(o_id);
if (outside_id == (uid_t)-1) {
LOG_W("Cannot parse '%s' as GID", o_id.c_str());
return false;
}
} else {
inside_id = parseUid(i_id);
if (inside_id == (uid_t)-1) {
LOG_W("Cannot parse '%s' as UID", i_id.c_str());
return false;
}
outside_id = parseUid(o_id);
if (outside_id == (uid_t)-1) {
LOG_W("Cannot parse '%s' as UID", o_id.c_str());
return false;
}
}
idmap_t id;
id.inside_id = inside_id;
id.outside_id = outside_id;
id.count = cnt;
id.is_newidmap = is_newidmap;
if (is_gid) {
nsjconf->gids.push_back(id);
} else {
nsjconf->uids.push_back(id);
}
return true;
}
} // namespace user