proc_file = fopen(proc_fn, "r");
if (!proc_file) {
- SYSERROR("Could not open %s.", proc_fn);
+ SYSERROR("Could not open %s", proc_fn);
goto on_error;
}
info = calloc(1, sizeof(*info));
if (!info) {
- SYSERROR("Could not allocate memory.");
+ SYSERROR("Could not allocate memory");
fclose(proc_file);
return NULL;
}
found = false;
+
while (getline(&line, &line_bufsz, proc_file) != -1) {
ret = sscanf(line, "CapBnd: %llx", &info->capability_mask);
if (ret != EOF && ret == 1) {
fclose(proc_file);
if (!found) {
- SYSERROR("Could not read capability bounding set from %s.",
- proc_fn);
- errno = ENOENT;
+ ERROR("Could not read capability bounding set from %s",
+ proc_fn);
goto on_error;
}
for (i = 0; i < LXC_NS_MAX; i++) {
if (ctx->ns_fd[i] < 0)
continue;
+
close(ctx->ns_fd[i]);
ctx->ns_fd[i] = -EBADF;
}
static int in_same_namespace(pid_t pid1, pid_t pid2, const char *ns)
{
int ns_fd1 = -1, ns_fd2 = -1, ret = -1;
+ int saved_errno = errno;
struct stat ns_st1, ns_st2;
ns_fd1 = lxc_preserve_ns(pid1, ns);
if (errno == ENOENT)
return -EINVAL;
+ saved_errno = errno;
goto out;
}
ns_fd2 = lxc_preserve_ns(pid2, ns);
- if (ns_fd2 < 0)
+ if (ns_fd2 < 0) {
+ saved_errno = errno;
goto out;
+ }
ret = fstat(ns_fd1, &ns_st1);
- if (ret < 0)
+ if (ret < 0) {
+ saved_errno = errno;
goto out;
+ }
ret = fstat(ns_fd2, &ns_st2);
- if (ret < 0)
+ if (ret < 0) {
+ saved_errno = errno;
goto out;
+ }
/* processes are in the same namespace */
- ret = -EINVAL;
- if ((ns_st1.st_dev == ns_st2.st_dev ) && (ns_st1.st_ino == ns_st2.st_ino))
+ if ((ns_st1.st_dev == ns_st2.st_dev ) && (ns_st1.st_ino == ns_st2.st_ino)) {
+ ret = -EINVAL;
goto out;
+ }
/* processes are in different namespaces */
ret = ns_fd2;
ns_fd2 = -1;
out:
-
if (ns_fd1 >= 0)
close(ns_fd1);
+
if (ns_fd2 >= 0)
close(ns_fd2);
+ errno = saved_errno;
return ret;
}
static int lxc_attach_to_ns(pid_t pid, struct lxc_proc_context_info *ctx)
{
- int i, ret;
+ int i;
for (i = 0; i < LXC_NS_MAX; i++) {
if (ctx->ns_fd[i] < 0)
continue;
- ret = setns(ctx->ns_fd[i], ns_info[i].clone_flag);
- if (ret < 0) {
+ if (setns(ctx->ns_fd[i], ns_info[i].clone_flag) < 0) {
SYSERROR("Failed to attach to %s namespace of %d",
- ns_info[i].proc_name, pid);
+ ns_info[i].proc_name, pid);
return -1;
}
ret = unshare(CLONE_NEWNS);
if (ret < 0) {
- SYSERROR("Failed to unshare mount namespace.");
+ SYSERROR("Failed to unshare mount namespace");
return -1;
}
if (detect_shared_rootfs()) {
if (mount(NULL, "/", NULL, MS_SLAVE | MS_REC, NULL)) {
- SYSERROR("Failed to make / rslave.");
+ SYSERROR("Failed to make / rslave");
ERROR("Continuing...");
}
}
/* Assume /proc is always mounted, so remount it. */
ret = umount2("/proc", MNT_DETACH);
if (ret < 0) {
- SYSERROR("Failed to unmount /proc.");
+ SYSERROR("Failed to unmount /proc");
return -1;
}
ret = mount("none", "/proc", "proc", 0, NULL);
if (ret < 0) {
- SYSERROR("Failed to remount /proc.");
+ SYSERROR("Failed to remount /proc");
return -1;
}
*/
ret = umount2("/sys", MNT_DETACH);
if (ret < 0 && errno != EINVAL) {
- SYSERROR("Failed to unmount /sys.");
+ SYSERROR("Failed to unmount /sys");
return -1;
} else if (ret == 0) {
/* Remount it. */
ret = mount("none", "/sys", "sysfs", 0, NULL);
if (ret < 0) {
- SYSERROR("Failed to remount /sys.");
+ SYSERROR("Failed to remount /sys");
return -1;
}
}
SYSERROR("Failed to drop capability %d", cap);
return -1;
}
+
TRACE("Dropped capability %d", cap);
}
if (!extra_keep_store[i]) {
while (i > 0)
free(extra_keep_store[--i]);
+
free(extra_keep_store);
return -1;
}
free(extra_keep_store);
}
- SYSERROR("Failed to clear environment");
+ ERROR("Failed to clear environment");
return -1;
}
if (ret < 0)
SYSWARN("Failed to set environment variable");
}
+
free(extra_keep_store[i]);
}
+
free(extra_keep_store);
}
if (extra_env) {
for (; *extra_env; extra_env++) {
char *p;
+
/* We just assume the user knows what they are doing, so
* we don't do any checks.
*/
ret = dup2(pipes[1], STDOUT_FILENO);
close(pipes[1]);
if (ret < 0)
- exit(EXIT_FAILURE);
+ _exit(EXIT_FAILURE);
/* Get rid of stdin/stderr, so we try to associate it with
* /dev/null.
/* Finish argument list. */
ret = snprintf(uid_buf, sizeof(uid_buf), "%ld", (long)uid);
if (ret <= 0 || ret >= sizeof(uid_buf))
- exit(EXIT_FAILURE);
+ _exit(EXIT_FAILURE);
/* Try to run getent program. */
(void)execvp("getent", arguments);
- exit(EXIT_FAILURE);
+ _exit(EXIT_FAILURE);
}
close(pipes[1]);
token = strtok_r(NULL, ":", &saveptr);
value = token ? strtol(token, &endptr, 10) : 0;
if (!token || !endptr || *endptr || value == LONG_MIN ||
- value == LONG_MAX)
+ value == LONG_MAX)
continue;
/* dummy sanity check: user id matches */
if (!token)
continue;
}
+
if (!token)
continue;
+
free(result);
result = strdup(token);
found = true;
}
+
free(line);
fclose(pipe_f);
if (ret != EOF && ret == 1)
gid = (gid_t)value;
}
+
if (uid != (uid_t)-1 && gid != (gid_t)-1)
break;
}
/* Only override arguments if we found something. */
if (uid != (uid_t)-1)
*init_uid = uid;
+
if (gid != (gid_t)-1)
*init_gid = gid;
/* Remove current setting. */
if (!c->set_config_item(c, "lxc.seccomp.profile", "") &&
- !c->set_config_item(c, "lxc.seccomp", "")) {
+ !c->set_config_item(c, "lxc.seccomp", ""))
return false;
- }
/* Fetch the current profile path over the cmd interface. */
path = c->get_running_config_item(c, "lxc.seccomp.profile");
if (!path) {
INFO("Failed to retrieve lxc.seccomp.profile");
+
path = c->get_running_config_item(c, "lxc.seccomp");
if (!path) {
INFO("Failed to retrieve lxc.seccomp");
ret = lxc_attach_remount_sys_proc();
if (ret < 0)
goto on_error;
+
TRACE("Remounted \"/proc\" and \"/sys\"");
}
new_personality = init_ctx->personality;
else
new_personality = options->personality;
+
ret = personality(new_personality);
if (ret < 0)
goto on_error;
+
TRACE("Set new personality");
}
#endif
ret = lxc_attach_drop_privs(init_ctx);
if (ret < 0)
goto on_error;
+
TRACE("Dropped capabilities");
}
options->extra_keep_env);
if (ret < 0)
goto on_error;
+
TRACE("Set up environment");
/* This remark only affects fully unprivileged containers:
/* Set {u,g}id. */
new_uid = 0;
new_gid = 0;
+
/* Ignore errors, we will fall back to root in that case (/proc was not
* mounted etc.).
*/
if (options->uid != (uid_t)-1)
new_uid = options->uid;
+
if (options->gid != (gid_t)-1)
new_gid = options->gid;
ret = prctl(PR_SET_NO_NEW_PRIVS, 1, 0, 0, 0);
if (ret < 0)
goto on_error;
+
TRACE("Set PR_SET_NO_NEW_PRIVS");
}
/* Change into our new LSM profile. */
on_exec = options->attach_flags & LXC_ATTACH_LSM_EXEC ? true : false;
+
ret = lsm_process_label_set_at(lsm_fd, init_ctx->lsm_label, on_exec);
close(lsm_fd);
if (ret < 0)
goto on_error;
+
TRACE("Set %s LSM label to \"%s\"", lsm_name(), init_ctx->lsm_label);
}
ret = lxc_seccomp_load(init_ctx->container->lxc_conf);
if (ret < 0)
goto on_error;
+
TRACE("Loaded seccomp profile");
}
+
shutdown(payload->ipc_socket, SHUT_RDWR);
close(payload->ipc_socket);
payload->ipc_socket = -EBADF;
SYSERROR("Failed to prepare terminal file descriptor %d", payload->terminal_slave_fd);
goto on_error;
}
+
TRACE("Prepared terminal file descriptor %d", payload->terminal_slave_fd);
}
ret = lxc_terminal_create(terminal);
if (ret < 0) {
- SYSERROR("Failed to create terminal");
+ ERROR("Failed to create terminal");
return -1;
}
ret = access("/proc/self/ns", X_OK);
if (ret) {
- ERROR("Does this kernel version support namespaces?");
+ SYSERROR("Does this kernel version support namespaces?");
return -1;
}
init_ctx->container->lxc_conf = lxc_conf_init();
if (!init_ctx->container->lxc_conf) {
lxc_proc_put_context_info(init_ctx);
- return -ENOMEM;
+ return -1;
}
}
conf = init_ctx->container->lxc_conf;
}
pid = lxc_raw_getpid();
+
for (i = 0; i < LXC_NS_MAX; i++) {
- int j, saved_errno;
+ int j;
if (options->namespaces & ns_info[i].clone_flag)
init_ctx->ns_fd[i] = lxc_preserve_ns(init_pid, ns_info[i].proc_name);
init_ctx->ns_fd[i] = in_same_namespace(pid, init_pid, ns_info[i].proc_name);
else
continue;
+
if (init_ctx->ns_fd[i] >= 0)
continue;
}
/* We failed to preserve the namespace. */
- saved_errno = errno;
+ SYSERROR("Failed to attach to %s namespace of %d",
+ ns_info[i].proc_name, pid);
+
/* Close all already opened file descriptors before we return an
* error, so we don't leak them.
*/
for (j = 0; j < i; j++)
close(init_ctx->ns_fd[j]);
- errno = saved_errno;
- SYSERROR("Failed to attach to %s namespace of %d",
- ns_info[i].proc_name, pid);
free(cwd);
lxc_proc_put_context_info(init_ctx);
return -1;
ret = lxc_attach_terminal_mainloop_init(&terminal, &descr);
if (ret < 0)
goto on_error;
+
TRACE("Initialized terminal mainloop");
}
ret = lxc_write_nointr(ipc_sockets[0], &status, sizeof(status));
if (ret != sizeof(status))
goto close_mainloop;
+
TRACE("Told intermediate process to start initializing");
/* Get pid of attached process from intermediate process. */
ret = lxc_read_nointr(ipc_sockets[0], &attached_pid, sizeof(attached_pid));
if (ret != sizeof(attached_pid))
goto close_mainloop;
+
TRACE("Received pid %d of attached process in parent pid namespace", attached_pid);
/* Ignore SIGINT (CTRL-C) and SIGQUIT (CTRL-\) - issue #313. */
ret = wait_for_pid(pid);
if (ret < 0)
goto close_mainloop;
+
TRACE("Intermediate process %d exited", pid);
/* We will always have to reap the attached process now. */
labelfd = lsm_process_label_fd_get(attached_pid, on_exec);
if (labelfd < 0)
goto close_mainloop;
+
TRACE("Opened LSM label file descriptor %d", labelfd);
/* Send child fd of the LSM security module to write to. */
ret_parent = 0;
to_cleanup_pid = -1;
+
if (options->attach_flags & LXC_ATTACH_TERMINAL) {
ret = lxc_mainloop(&descr, -1);
if (ret < 0) {
lxc_terminal_delete(&terminal);
lxc_terminal_conf_free(&terminal);
}
+
lxc_proc_put_context_info(init_ctx);
return ret_parent;
}
/* close unneeded file descriptors */
close(ipc_sockets[0]);
ipc_sockets[0] = -EBADF;
+
if (options->attach_flags & LXC_ATTACH_TERMINAL) {
lxc_attach_terminal_close_master(&terminal);
lxc_attach_terminal_close_peer(&terminal);
lxc_proc_put_context_info(init_ctx);
rexit(-1);
}
+
TRACE("Intermediate process starting to initialize");
/* Attach now, create another subprocess later, since pid namespaces
lxc_proc_put_context_info(init_ctx);
rexit(-1);
}
+
/* close namespace file descriptors */
lxc_proc_close_ns_fd(init_ctx);
ret = attach_child_main(&payload);
if (ret < 0)
ERROR("Failed to exec");
+
_exit(EXIT_FAILURE);
}
+
if (options->attach_flags & LXC_ATTACH_TERMINAL)
lxc_attach_terminal_close_slave(&terminal);
lxc_proc_put_context_info(init_ctx);
rexit(-1);
}
+
TRACE("Sending pid %d of attached process", pid);
/* The rest is in the hands of the initial and the attached process. */
lxc_attach_command_t* cmd = (lxc_attach_command_t*)payload;
execvp(cmd->program, cmd->argv);
- SYSERROR("Failed to exec \"%s\".", cmd->program);
+
+ SYSERROR("Failed to exec \"%s\"", cmd->program);
return -1;
}
ret = getpwuid_r(uid, &pwent, buf, bufsize, &pwentp);
if (!pwentp) {
if (ret == 0)
- WARN("Could not find matched password record.");
+ WARN("Could not find matched password record");
WARN("Failed to get password record - %u", uid);
}
user_shell = lxc_attach_getpwshell(uid);
else
user_shell = pwent.pw_shell;
+
if (user_shell)
execlp(user_shell, user_shell, (char *)NULL);
* on /bin/sh as a default shell.
*/
execlp("/bin/sh", "/bin/sh", (char *)NULL);
+
SYSERROR("Failed to execute shell");
if (!pwentp)
free(user_shell);
+
free(buf);
return -1;
}