]> git.proxmox.com Git - mirror_lxc.git/blame - src/lxc/utils.c
apparmor: use fopen_cloexec
[mirror_lxc.git] / src / lxc / utils.c
CommitLineData
e3642c43
DL
1/*
2 * lxc: linux Container library
3 *
4 * (C) Copyright IBM Corp. 2007, 2008
5 *
6 * Authors:
9afe19d6 7 * Daniel Lezcano <daniel.lezcano at free.fr>
e3642c43
DL
8 *
9 * This library is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU Lesser General Public
11 * License as published by the Free Software Foundation; either
12 * version 2.1 of the License, or (at your option) any later version.
13 *
14 * This library is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 * Lesser General Public License for more details.
18 *
19 * You should have received a copy of the GNU Lesser General Public
20 * License along with this library; if not, write to the Free Software
250b1eec 21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
e3642c43
DL
22 */
23
052616eb
ÇO
24#include "config.h"
25
7935833c 26#define __STDC_FORMAT_MACROS /* Required for PRIu64 to work. */
643c1984 27#include <ctype.h>
a1e5280d 28#include <dirent.h>
e3642c43 29#include <errno.h>
a1e5280d 30#include <fcntl.h>
dbaf55a3 31#include <grp.h>
7935833c 32#include <inttypes.h>
a1e5280d 33#include <libgen.h>
b467714b 34#include <pthread.h>
d983b93c 35#include <stddef.h>
a1e5280d
CB
36#include <stdio.h>
37#include <stdlib.h>
61a1d519 38#include <string.h>
981f6029 39#include <unistd.h>
e3642c43 40#include <sys/mman.h>
6e4bb2e0 41#include <sys/mount.h>
a1e5280d
CB
42#include <sys/param.h>
43#include <sys/prctl.h>
44#include <sys/stat.h>
9be53773
SH
45#include <sys/types.h>
46#include <sys/wait.h>
e3642c43
DL
47
48#include "log.h"
025ed0f3 49#include "lxclock.h"
51d0854c 50#include "namespace.h"
e3db0162 51#include "parse.h"
981f6029 52#include "utils.h"
e3642c43 53
43f984ea
DJ
54#ifndef HAVE_STRLCPY
55#include "include/strlcpy.h"
56#endif
57
bd583214
DJ
58#ifndef HAVE_STRLCAT
59#include "include/strlcat.h"
60#endif
61
4928c718
SG
62#ifndef O_PATH
63#define O_PATH 010000000
64#endif
65
66#ifndef O_NOFOLLOW
67#define O_NOFOLLOW 00400000
68#endif
69
ac2cecc4 70lxc_log_define(utils, lxc);
e3642c43 71
4295c5de
SH
72/*
73 * if path is btrfs, tries to remove it and any subvolumes beneath it
74 */
75extern bool btrfs_try_remove_subvol(const char *path);
76
/*
 * Delete everything below @dirname and finally @dirname itself.
 *
 * @dirname: directory to remove
 * @pdev:    st_dev of the top-level directory; only consulted when @onedev
 * @exclude: entry name that is treated specially at @level 0 (may be NULL)
 * @level:   recursion depth, 0 for the top-level call
 * @onedev:  when true, entries whose st_dev differs from @pdev are not
 *           descended into; a btrfs subvolume removal is attempted instead
 *
 * Returns 0 when nothing failed, -1 otherwise. Failures on individual
 * entries are recorded but do not stop the walk.
 */
static int _recursive_rmdir(const char *dirname, dev_t pdev,
			    const char *exclude, int level, bool onedev)
{
	char entry_path[MAXPATHLEN];
	struct dirent *entry;
	bool kept_excluded = false;
	int failed = 0;
	int ret;
	DIR *dir;

	dir = opendir(dirname);
	if (!dir) {
		ERROR("failed to open %s", dirname);
		return -1;
	}

	for (entry = readdir(dir); entry; entry = readdir(dir)) {
		struct stat st;
		int len;

		if (strcmp(entry->d_name, ".") == 0 ||
		    strcmp(entry->d_name, "..") == 0)
			continue;

		len = snprintf(entry_path, MAXPATHLEN, "%s/%s", dirname, entry->d_name);
		if (len < 0 || len >= MAXPATHLEN) {
			ERROR("pathname too long");
			failed = 1;
			continue;
		}

		/* The excluded entry is only removed if that is cheap: an
		 * empty directory or a plain file. A populated directory is
		 * left in place and remembered.
		 */
		if (level == 0 && exclude && strcmp(entry->d_name, exclude) == 0) {
			ret = rmdir(entry_path);
			if (ret >= 0)
				continue;

			if (errno == ENOTEMPTY) {
				INFO("Not deleting snapshot %s", entry_path);
				kept_excluded = true;
			} else if (errno == ENOTDIR) {
				ret = unlink(entry_path);
				if (ret)
					INFO("Failed to remove %s", entry_path);
			} else {
				SYSERROR("Failed to rmdir %s", entry_path);
				failed = 1;
			}
			continue;
		}

		ret = lstat(entry_path, &st);
		if (ret) {
			ERROR("Failed to stat %s", entry_path);
			failed = 1;
			continue;
		}

		if (onedev && st.st_dev != pdev) {
			/* TODO should we be checking /proc/self/mountinfo for
			 * pathname and not doing this if found? */
			if (btrfs_try_remove_subvol(entry_path))
				INFO("Removed btrfs subvolume at %s\n", entry_path);
			continue;
		}

		if (!S_ISDIR(st.st_mode)) {
			if (unlink(entry_path) < 0) {
				SYSERROR("Failed to delete %s", entry_path);
				failed = 1;
			}
			continue;
		}

		if (_recursive_rmdir(entry_path, pdev, exclude, level + 1, onedev) < 0)
			failed = 1;
	}

	/* A directory that still holds the excluded entry cannot be removed;
	 * that is not counted as a failure.
	 */
	if (rmdir(dirname) < 0 && !btrfs_try_remove_subvol(dirname) && !kept_excluded) {
		ERROR("Failed to delete %s", dirname);
		failed = 1;
	}

	ret = closedir(dir);
	if (ret) {
		ERROR("Failed to close directory %s", dirname);
		failed = 1;
	}

	if (failed)
		return -1;

	return 0;
}
168
29a11a7f
CB
169/* We have two different magic values for overlayfs, yay. */
170#ifndef OVERLAYFS_SUPER_MAGIC
0cc417b2 171#define OVERLAYFS_SUPER_MAGIC 0x794c764f
29a11a7f
CB
172#endif
173
174#ifndef OVERLAY_SUPER_MAGIC
0cc417b2 175#define OVERLAY_SUPER_MAGIC 0x794c7630
29a11a7f
CB
176#endif
177
178/* In overlayfs, st_dev is unreliable. So on overlayfs we don't do the
179 * lxc_rmdir_onedev()
0cc417b2
SH
180 */
181static bool is_native_overlayfs(const char *path)
182{
29a11a7f
CB
183 if (has_fs_type(path, OVERLAY_SUPER_MAGIC) ||
184 has_fs_type(path, OVERLAYFS_SUPER_MAGIC))
0cc417b2 185 return true;
29a11a7f 186
0cc417b2
SH
187 return false;
188}
189
/*
 * Recursively remove @path. Unless @path is on overlayfs, the walk stays on
 * the device @path itself lives on. @exclude is forwarded to
 * _recursive_rmdir().
 *
 * Returns 0 on success (a missing @path counts as success), -1 if there were
 * any failures.
 */
extern int lxc_rmdir_onedev(const char *path, const char *exclude)
{
	struct stat st;
	bool onedev = !is_native_overlayfs(path);

	if (lstat(path, &st) >= 0)
		return _recursive_rmdir(path, st.st_dev, exclude, 0, onedev);

	/* Nothing to delete. */
	if (errno == ENOENT)
		return 0;

	ERROR("Failed to stat %s", path);
	return -1;
}
209
/*
 * Parse @arg as an unsigned 16-bit integer in the given @base (borrowed from
 * iproute2).
 *
 * Returns 0 and stores the value in @val on success. Returns -1 if @arg is
 * NULL or empty, contains trailing characters, does not fit into 16 bits or
 * strtoul() reported an error.
 */
extern int get_u16(unsigned short *val, const char *arg, int base)
{
	char *end = NULL;
	unsigned long parsed;

	if (arg == NULL || arg[0] == '\0')
		return -1;

	errno = 0;
	parsed = strtoul(arg, &end, base);

	/* No digits consumed, or garbage after the number. */
	if (!end || end == arg || *end != '\0')
		return -1;

	if (parsed > 0xFFFF)
		return -1;

	if (errno != 0)
		return -1;

	*val = (unsigned short)parsed;
	return 0;
}
228
/*
 * Create @dir and all missing parent directories with @mode, like
 * "mkdir -p". Components that already exist are not an error.
 *
 * Returns 0 on success, -1 on failure (allocation failure or a mkdir() error
 * other than EEXIST).
 */
extern int mkdir_p(const char *dir, mode_t mode)
{
	const char *tmp = dir;
	const char *orig = dir;

	do {
		char *makeme;

		/* Skip the separator(s), then step over the next component. */
		dir = tmp + strspn(tmp, "/");
		tmp = dir + strcspn(dir, "/");

		/* Prefix of the original path up to the current component. */
		makeme = strndup(orig, dir - orig);
		if (!makeme)
			return -1;

		if (*makeme) {
			if (mkdir(makeme, mode) && errno != EEXIST) {
				SYSERROR("failed to create directory '%s'", makeme);
				free(makeme);
				return -1;
			}
		}
		free(makeme);
	} while (tmp != dir);

	return 0;
}
2a59a681 252
44b9ae4b 253char *get_rundir()
9e60f51d 254{
97a696c6
SG
255 char *rundir;
256 const char *homedir;
9650c735 257 struct stat sb;
9e60f51d 258
b14fc100 259 if (stat(RUNTIME_PATH, &sb) < 0)
9650c735 260 return NULL;
9650c735
TA
261
262 if (geteuid() == sb.st_uid || getegid() == sb.st_gid) {
c580b8d2 263 rundir = strdup(RUNTIME_PATH);
d6470e71
SG
264 return rundir;
265 }
97a696c6
SG
266
267 rundir = getenv("XDG_RUNTIME_DIR");
44b9ae4b
SG
268 if (rundir) {
269 rundir = strdup(rundir);
270 return rundir;
271 }
97a696c6 272
44b9ae4b
SG
273 INFO("XDG_RUNTIME_DIR isn't set in the environment.");
274 homedir = getenv("HOME");
275 if (!homedir) {
276 ERROR("HOME isn't set in the environment.");
277 return NULL;
97a696c6
SG
278 }
279
44b9ae4b 280 rundir = malloc(sizeof(char) * (17 + strlen(homedir)));
b14fc100 281 if (!rundir)
282 return NULL;
283
44b9ae4b
SG
284 sprintf(rundir, "%s/.cache/lxc/run/", homedir);
285
9e60f51d
DE
286 return rundir;
287}
288
9be53773
SH
/*
 * Wait for child @pid to terminate, restarting waitpid() when it is
 * interrupted by a signal.
 *
 * Returns 0 only if the child exited normally with status 0; -1 if waitpid()
 * failed or the child exited abnormally or with a non-zero status.
 */
int wait_for_pid(pid_t pid)
{
	int status;

	for (;;) {
		int reaped = waitpid(pid, &status, 0);

		if (reaped == -1) {
			if (errno == EINTR)
				continue;

			return -1;
		}

		if (reaped == pid)
			break;
	}

	if (WIFEXITED(status) && WEXITSTATUS(status) == 0)
		return 0;

	return -1;
}
c797a220
CS
310
/*
 * Wait for child @pid to terminate, restarting waitpid() when it is
 * interrupted by a signal.
 *
 * Returns the raw wait status as filled in by waitpid(), or -1 if waitpid()
 * failed for a reason other than EINTR.
 */
int lxc_wait_for_pid_status(pid_t pid)
{
	int status;

	for (;;) {
		int reaped = waitpid(pid, &status, 0);

		if (reaped == -1) {
			if (errno == EINTR)
				continue;

			return -1;
		}

		if (reaped == pid)
			return status;
	}
}
92f023dc 329
/*
 * write() wrapper that restarts the call when it fails with EINTR.
 * Returns whatever the final write() returned.
 */
ssize_t lxc_write_nointr(int fd, const void *buf, size_t count)
{
	ssize_t written;

	do {
		written = write(fd, buf, count);
	} while (written < 0 && errno == EINTR);

	return written;
}
340
/*
 * read() wrapper that restarts the call when it fails with EINTR.
 * Returns whatever the final read() returned.
 */
ssize_t lxc_read_nointr(int fd, void *buf, size_t count)
{
	ssize_t nread;

	do {
		nread = read(fd, buf, count);
	} while (nread < 0 && errno == EINTR);

	return nread;
}
351
/*
 * Read exactly @count bytes from @fd into @buf and, if @expected_buf is
 * given, verify that they match it.
 *
 * Returns @count on success. A read error or EOF is passed through (<= 0).
 * A short read returns -1; a content mismatch returns -1 with errno set to
 * EINVAL.
 */
ssize_t lxc_read_nointr_expect(int fd, void *buf, size_t count, const void *expected_buf)
{
	ssize_t nread = lxc_read_nointr(fd, buf, count);

	if (nread <= 0)
		return nread;

	if ((size_t)nread != count)
		return -1;

	if (!expected_buf || memcmp(buf, expected_buf, count) == 0)
		return nread;

	errno = EINVAL;
	return -1;
}
3ce74686
SH
370
371#if HAVE_LIBGNUTLS
372#include <gnutls/gnutls.h>
373#include <gnutls/crypto.h>
41246cee
DE
374
/* Constructor: calls gnutls_global_init() when the library is loaded. */
__attribute__((constructor)) static void gnutls_lxc_init(void)
{
	gnutls_global_init();
}
380
3ce74686
SH
381int sha1sum_file(char *fnam, unsigned char *digest)
382{
383 char *buf;
384 int ret;
385 FILE *f;
386 long flen;
387
388 if (!fnam)
389 return -1;
b14fc100 390
025ed0f3 391 f = fopen_cloexec(fnam, "r");
7be677a8 392 if (!f) {
3ce74686
SH
393 SYSERROR("Error opening template");
394 return -1;
395 }
b14fc100 396
3ce74686
SH
397 if (fseek(f, 0, SEEK_END) < 0) {
398 SYSERROR("Error seeking to end of template");
dd1d77f9 399 fclose(f);
3ce74686
SH
400 return -1;
401 }
b14fc100 402
3ce74686
SH
403 if ((flen = ftell(f)) < 0) {
404 SYSERROR("Error telling size of template");
dd1d77f9 405 fclose(f);
3ce74686
SH
406 return -1;
407 }
b14fc100 408
3ce74686
SH
409 if (fseek(f, 0, SEEK_SET) < 0) {
410 SYSERROR("Error seeking to start of template");
dd1d77f9 411 fclose(f);
3ce74686
SH
412 return -1;
413 }
b14fc100 414
3ce74686
SH
415 if ((buf = malloc(flen+1)) == NULL) {
416 SYSERROR("Out of memory");
dd1d77f9 417 fclose(f);
3ce74686
SH
418 return -1;
419 }
b14fc100 420
3ce74686
SH
421 if (fread(buf, 1, flen, f) != flen) {
422 SYSERROR("Failure reading template");
423 free(buf);
dd1d77f9 424 fclose(f);
3ce74686
SH
425 return -1;
426 }
b14fc100 427
dd1d77f9 428 if (fclose(f) < 0) {
3ce74686
SH
429 SYSERROR("Failre closing template");
430 free(buf);
431 return -1;
432 }
b14fc100 433
3ce74686
SH
434 buf[flen] = '\0';
435 ret = gnutls_hash_fast(GNUTLS_DIG_SHA1, buf, flen, (void *)digest);
436 free(buf);
437 return ret;
438}
439#endif
61a1d519
CS
440
/*
 * Turn a NULL-terminated va_list of strings into a NULL-terminated argv
 * style array.
 *
 * @ap:        argument list; consumed up to and including the NULL sentinel
 * @skip:      number of leading slots to leave empty (NULL) for the caller
 * @do_strdup: when non-zero each argument is strdup()ed, otherwise the
 *             original pointers are stored
 *
 * Returns the newly allocated array, or NULL on allocation failure.
 */
char** lxc_va_arg_list_to_argv(va_list ap, size_t skip, int do_strdup)
{
	va_list ap2;
	size_t count = 1 + skip;
	char **result;

	/* first determine size of argument list, we don't want to reallocate
	 * constantly...
	 */
	va_copy(ap2, ap);
	while (1) {
		char* arg = va_arg(ap2, char*);
		if (!arg)
			break;
		count++;
	}
	va_end(ap2);

	result = calloc(count, sizeof(char*));
	if (!result)
		return NULL;

	count = skip;
	while (1) {
		char* arg = va_arg(ap, char*);
		if (!arg)
			break;
		arg = do_strdup ? strdup(arg) : arg;
		if (!arg)
			goto oom;
		result[count++] = arg;
	}

	/* calloc has already set last element to NULL*/
	return result;

oom:
	/* Only reachable when do_strdup is set (strdup() failed), so every
	 * entry stored so far in [skip, count) is a copy we own.
	 */
	while (count > skip)
		free(result[--count]);
	free(result);
	return NULL;
}
481
/*
 * Same as lxc_va_arg_list_to_argv() without duplicating the strings; the
 * returned array holds the caller's original pointers.
 */
const char** lxc_va_arg_list_to_argv_const(va_list ap, size_t skip)
{
	char **argv = lxc_va_arg_list_to_argv(ap, skip, 0);

	return (const char **)argv;
}
db27c8d7 486
8bd8018e 487struct lxc_popen_FILE *lxc_popen(const char *command)
ebec9176 488{
3f323207 489 int ret;
ebec9176
AM
490 int pipe_fds[2];
491 pid_t child_pid;
8bd8018e 492 struct lxc_popen_FILE *fp = NULL;
ebec9176 493
8bd8018e
CB
494 ret = pipe2(pipe_fds, O_CLOEXEC);
495 if (ret < 0)
ebec9176 496 return NULL;
ebec9176
AM
497
498 child_pid = fork();
8bd8018e
CB
499 if (child_pid < 0)
500 goto on_error;
501
502 if (!child_pid) {
503 sigset_t mask;
504
505 close(pipe_fds[0]);
506
507 /* duplicate stdout */
508 if (pipe_fds[1] != STDOUT_FILENO)
509 ret = dup2(pipe_fds[1], STDOUT_FILENO);
510 else
511 ret = fcntl(pipe_fds[1], F_SETFD, 0);
512 if (ret < 0) {
513 close(pipe_fds[1]);
03f618af 514 _exit(EXIT_FAILURE);
3f323207
CB
515 }
516
8bd8018e
CB
517 /* duplicate stderr */
518 if (pipe_fds[1] != STDERR_FILENO)
519 ret = dup2(pipe_fds[1], STDERR_FILENO);
520 else
521 ret = fcntl(pipe_fds[1], F_SETFD, 0);
522 close(pipe_fds[1]);
523 if (ret < 0)
03f618af 524 _exit(EXIT_FAILURE);
8bd8018e
CB
525
526 /* unblock all signals */
527 ret = sigfillset(&mask);
528 if (ret < 0)
03f618af 529 _exit(EXIT_FAILURE);
8bd8018e 530
b467714b 531 ret = pthread_sigmask(SIG_UNBLOCK, &mask, NULL);
8bd8018e 532 if (ret < 0)
03f618af 533 _exit(EXIT_FAILURE);
8bd8018e
CB
534
535 execl("/bin/sh", "sh", "-c", command, (char *)NULL);
03f618af 536 _exit(127);
ebec9176
AM
537 }
538
8bd8018e
CB
539 close(pipe_fds[1]);
540 pipe_fds[1] = -1;
ebec9176 541
8bd8018e
CB
542 fp = malloc(sizeof(*fp));
543 if (!fp)
544 goto on_error;
b14fc100 545
7e50ec0b 546 memset(fp, 0, sizeof(*fp));
ebec9176
AM
547
548 fp->child_pid = child_pid;
8bd8018e 549 fp->pipe = pipe_fds[0];
ebec9176 550
7e50ec0b
CB
551 /* From now on, closing fp->f will also close fp->pipe. So only ever
552 * call fclose(fp->f).
553 */
8bd8018e
CB
554 fp->f = fdopen(pipe_fds[0], "r");
555 if (!fp->f)
556 goto on_error;
ebec9176 557
8bd8018e 558 return fp;
ebec9176 559
8bd8018e 560on_error:
7e50ec0b
CB
561 /* We can only close pipe_fds[0] if fdopen() didn't succeed or wasn't
562 * called yet. Otherwise the fd belongs to the file opened by fdopen()
563 * since it isn't dup()ed.
564 */
565 if (fp && !fp->f && pipe_fds[0] >= 0)
8bd8018e
CB
566 close(pipe_fds[0]);
567
568 if (pipe_fds[1] >= 0)
569 close(pipe_fds[1]);
ebec9176 570
7e50ec0b
CB
571 if (fp && fp->f)
572 fclose(fp->f);
573
574 if (fp)
575 free(fp);
576
ebec9176
AM
577 return NULL;
578}
579
8bd8018e 580int lxc_pclose(struct lxc_popen_FILE *fp)
ebec9176 581{
ebec9176 582 pid_t wait_pid;
8bd8018e 583 int wstatus = 0;
ebec9176 584
8bd8018e 585 if (!fp)
ebec9176 586 return -1;
ebec9176
AM
587
588 do {
8bd8018e
CB
589 wait_pid = waitpid(fp->child_pid, &wstatus, 0);
590 } while (wait_pid < 0 && errno == EINTR);
ebec9176 591
8bd8018e
CB
592 fclose(fp->f);
593 free(fp);
594
595 if (wait_pid < 0)
ebec9176 596 return -1;
ebec9176
AM
597
598 return wstatus;
599}
600
502657d5
CS
/*
 * Return a newly allocated copy of @haystack in which every non-overlapping
 * occurrence of @needle (searched left to right) is replaced by
 * @replacement.
 *
 * An empty @needle matches nothing, so a plain copy of @haystack is
 * returned.
 *
 * Returns NULL on allocation failure. The caller frees the result.
 */
char *lxc_string_replace(const char *needle, const char *replacement, const char *haystack)
{
	size_t needle_len = strlen(needle);
	size_t replacement_len = strlen(replacement);
	size_t hits = 0;
	size_t tail_len;
	size_t len;
	const char *cur, *hit;
	char *result, *out;

	/* First pass: count the matches to size the result exactly. The
	 * search must not run for an empty needle, strstr() would match at
	 * the same position forever.
	 */
	if (needle_len > 0) {
		for (cur = haystack; (hit = strstr(cur, needle)); cur = hit + needle_len)
			hits++;
	}

	len = strlen(haystack) - hits * needle_len + hits * replacement_len;

	result = malloc(len + 1);
	if (!result)
		return NULL;

	/* Second pass: copy the text between matches and the replacements. */
	out = result;
	cur = haystack;
	while (hits > 0 && (hit = strstr(cur, needle))) {
		size_t part_len = (size_t)(hit - cur);

		memcpy(out, cur, part_len);
		out += part_len;

		memcpy(out, replacement, replacement_len);
		out += replacement_len;

		cur = hit + needle_len;
		hits--;
	}

	/* Remainder after the last match, including the terminating NUL. */
	tail_len = strlen(cur);
	memcpy(out, cur, tail_len + 1);

	return result;
}
662
/*
 * Check whether @needle equals one of the strings in the NULL-terminated
 * array @haystack. A NULL @haystack contains nothing.
 */
bool lxc_string_in_array(const char *needle, const char **haystack)
{
	size_t i;

	if (!haystack)
		return false;

	for (i = 0; haystack[i] != NULL; i++) {
		if (strcmp(needle, haystack[i]) == 0)
			return true;
	}

	return false;
}
671
/*
 * Concatenate the NULL-terminated string array @parts, inserting @sep
 * between consecutive elements.
 *
 * @use_as_prefix: when true, @sep is additionally placed in front of the
 *                 first element (and is the whole result for empty @parts)
 *
 * Returns a newly allocated string the caller must free(), or NULL on
 * allocation failure.
 */
char *lxc_string_join(const char *sep, const char **parts, bool use_as_prefix)
{
	size_t sep_len = strlen(sep);
	size_t result_len = use_as_prefix ? sep_len : 0;
	const char **p;
	char *result, *out;

	/* calculate new string length */
	for (p = parts; *p; p++)
		result_len += (p > parts ? sep_len : 0) + strlen(*p);

	/* calloc() provides the terminating NUL. */
	result = calloc(result_len + 1, 1);
	if (!result)
		return NULL;

	/* Append through a moving write pointer so the buffer is not
	 * rescanned for every part.
	 */
	out = result;

	if (use_as_prefix) {
		memcpy(out, sep, sep_len);
		out += sep_len;
	}

	for (p = parts; *p; p++) {
		size_t part_len = strlen(*p);

		if (p > parts) {
			memcpy(out, sep, sep_len);
			out += sep_len;
		}

		memcpy(out, *p, part_len);
		out += part_len;
	}

	return result;
}
701
/*
 * Split @path at '/' and resolve "." and ".." components.
 *
 * "." is dropped, ".." removes itself together with the preceding component,
 * and a ".." with nothing in front of it is dropped.
 *
 * Returns the NULL-terminated array of remaining components, or NULL if
 * splitting failed.
 */
char **lxc_normalize_path(const char *path)
{
	char **parts;
	size_t count = 0;
	size_t idx = 0;

	parts = lxc_string_split(path, '/');
	if (!parts)
		return NULL;

	while (parts[count])
		count++;

	/* resolve '.' and '..' */
	while (idx < count) {
		bool is_dot = strcmp(parts[idx], ".") == 0;
		bool is_dotdot = strcmp(parts[idx], "..") == 0;

		if (is_dot || (is_dotdot && idx == 0)) {
			/* Drop this element; the move also carries the
			 * terminating NULL along.
			 */
			free(parts[idx]);
			memmove(&parts[idx], &parts[idx + 1], sizeof(char *) * (count - idx));
			count--;
			continue;
		}

		if (is_dotdot) {
			/* Drop this element and the one before it. */
			free(parts[idx - 1]);
			free(parts[idx]);
			memmove(&parts[idx - 1], &parts[idx + 1], sizeof(char *) * (count - idx));
			count -= 2;
			idx--;
			continue;
		}

		idx++;
	}

	return parts;
}
737
/*
 * Return a newly allocated, normalized copy of @path: components are
 * resolved with lxc_normalize_path() and re-joined with single slashes. A
 * leading slash is kept if @path had one.
 *
 * Returns NULL on allocation failure. The caller frees the result.
 */
char *lxc_deslashify(const char *path)
{
	char *copy, *joined;
	char **parts;

	copy = strdup(path);
	if (!copy)
		return NULL;

	parts = lxc_normalize_path(copy);
	if (!parts) {
		free(copy);
		return NULL;
	}

	/* No component survived normalization, e.g. path == "///" or
	 * path == "".
	 */
	if (parts[0] == NULL) {
		size_t len = strlen(copy);

		/* Empty input: hand back the (empty) copy itself. */
		if (len == 0) {
			lxc_free_array((void **)parts, free);
			return copy;
		}

		/* NOTE(review): strcspn() == len is true when the string
		 * contains no '/' at all (e.g. "."), which then yields "/".
		 * Confirm that this is the intended check.
		 */
		if (strcspn(copy, "/") == len) {
			free(copy);
			lxc_free_array((void **)parts, free);
			return strdup("/");
		}
	}

	joined = lxc_string_join("/", (const char **)parts, copy[0] == '/');
	free(copy);
	lxc_free_array((void **)parts, free);
	return joined;
}
780
24b51482
CS
781char *lxc_append_paths(const char *first, const char *second)
782{
e8eb3956
CB
783 int ret;
784 size_t len;
24b51482 785 char *result = NULL;
e8eb3956 786 const char *pattern = "%s%s";
24b51482 787
e8eb3956 788 len = strlen(first) + strlen(second) + 1;
24b51482
CS
789 if (second[0] != '/') {
790 len += 1;
791 pattern = "%s/%s";
792 }
793
794 result = calloc(1, len);
795 if (!result)
796 return NULL;
797
e8eb3956
CB
798 ret = snprintf(result, len, pattern, first, second);
799 if (ret < 0 || (size_t)ret >= len) {
800 free(result);
801 return NULL;
802 }
803
24b51482
CS
804 return result;
805}
806
502657d5
CS
/*
 * Check whether @needle is one of the elements of @haystack, a list whose
 * elements are separated by @_sep.
 *
 * Runs of separators are skipped, so the list has no empty elements and an
 * empty @needle never matches. Returns false if either argument is NULL.
 */
bool lxc_string_in_list(const char *needle, const char *haystack, char _sep)
{
	char sep[2] = { _sep, '\0' };
	size_t needle_len;
	const char *cur;

	if (!haystack || !needle)
		return false;

	needle_len = strlen(needle);

	/* Walk the list in place instead of tokenizing a stack copy; the
	 * input length is caller-controlled.
	 */
	cur = haystack;
	for (;;) {
		size_t token_len;

		cur += strspn(cur, sep);
		if (*cur == '\0')
			break;

		token_len = strcspn(cur, sep);
		if (token_len == needle_len && memcmp(cur, needle, token_len) == 0)
			return true;

		cur += token_len;
	}

	return false;
}
827
/*
 * Split @string at every @_sep into a NULL-terminated array of newly
 * allocated strings. Runs of separators are skipped, so no empty elements
 * are produced.
 *
 * A NULL @string yields an empty array. Returns NULL on allocation failure
 * with errno preserved. The caller frees the array and its elements.
 */
char **lxc_string_split(const char *string, char _sep)
{
	char sep[2] = {_sep, '\0'};
	char **tmp = NULL, **result = NULL;
	size_t result_capacity = 0;
	size_t result_count = 0;
	int r, saved_errno;
	const char *cur;

	if (!string)
		return calloc(1, sizeof(char *));

	/* Tokenize in place rather than on a stack copy; the input length is
	 * caller-controlled.
	 */
	for (cur = string + strspn(string, sep); *cur; cur += strspn(cur, sep)) {
		size_t token_len = strcspn(cur, sep);

		r = lxc_grow_array((void ***)&result, &result_capacity, result_count + 1, 16);
		if (r < 0)
			goto error_out;

		result[result_count] = strndup(cur, token_len);
		if (!result[result_count])
			goto error_out;

		result_count++;
		cur += token_len;
	}

	/* if we allocated too much, reduce it */
	tmp = realloc(result, (result_count + 1) * sizeof(char *));
	if (!tmp)
		goto error_out;

	result = tmp;

	/* Make sure we don't return uninitialized memory. */
	if (result_count == 0)
		*result = NULL;

	return result;

error_out:
	saved_errno = errno;
	lxc_free_array((void **)result, free);
	errno = saved_errno;
	return NULL;
}
876
3dca1af0
SH
877static bool complete_word(char ***result, char *start, char *end, size_t *cap, size_t *cnt)
878{
879 int r;
880
881 r = lxc_grow_array((void ***)result, cap, 2 + *cnt, 16);
882 if (r < 0)
883 return false;
b14fc100 884
3dca1af0
SH
885 (*result)[*cnt] = strndup(start, end - start);
886 if (!(*result)[*cnt])
887 return false;
b14fc100 888
3dca1af0
SH
889 (*cnt)++;
890
891 return true;
892}
893
/*
 * Given a string 'one two "three four"', split it into three words:
 * one, two, and three four (quotes removed).
 *
 * Words are separated by whitespace; single or double quotes group
 * characters, including whitespace, into one word. Escaped quotes are not
 * handled, and a quoted word whose closing quote is missing is dropped.
 *
 * Returns a NULL-terminated array of newly allocated strings (empty for a
 * NULL, empty or all-whitespace @string), or NULL on allocation failure.
 */
char **lxc_string_split_quoted(char *string)
{
	char *nextword = string, *p, state;
	char **result = NULL, **tmp;
	size_t result_capacity = 0;
	size_t result_count = 0;
	int saved_errno;

	if (!string || !*string)
		return calloc(1, sizeof(char *));

	/* State is ' ' between words, 'a' inside an unquoted word, or the
	 * opening quote character inside a quoted word.
	 */
	// TODO I'm *not* handling escaped quote
	state = ' ';
	for (p = string; *p; p++) {
		switch (state) {
		case ' ':
			/* isspace() requires an unsigned char value. */
			if (isspace((unsigned char)*p))
				break;

			nextword = p;
			state = (*p == '"' || *p == '\'') ? *p : 'a';
			break;
		case 'a':
			if (!isspace((unsigned char)*p))
				break;

			if (!complete_word(&result, nextword, p, &result_capacity, &result_count))
				goto on_error;

			state = ' ';
			break;
		case '"':
		case '\'':
			if (*p != state)
				break;

			/* Skip the opening quote when copying the word. */
			if (!complete_word(&result, nextword + 1, p, &result_capacity, &result_count))
				goto on_error;

			state = ' ';
			break;
		default:
			break;
		}
	}

	if (state == 'a' &&
	    !complete_word(&result, nextword, p, &result_capacity, &result_count))
		goto on_error;

	/* No word found: return a properly terminated empty array rather
	 * than the uninitialized block realloc(NULL, ...) would produce.
	 */
	if (result_count == 0) {
		free(result);
		return calloc(1, sizeof(char *));
	}

	/* if we allocated too much, reduce it */
	tmp = realloc(result, (result_count + 1) * sizeof(char *));
	if (!tmp)
		goto on_error;

	tmp[result_count] = NULL;
	return tmp;

on_error:
	saved_errno = errno;
	lxc_free_array((void **)result, free);
	errno = saved_errno;
	return NULL;
}
946
502657d5
CS
/*
 * Like lxc_string_split(), but additionally strips leading and trailing
 * spaces and tabs from every element. An element consisting only of spaces
 * and tabs becomes an empty string.
 *
 * A NULL @string yields an empty array. Returns NULL on allocation failure
 * with errno preserved. The caller frees the array and its elements.
 */
char **lxc_string_split_and_trim(const char *string, char _sep)
{
	char sep[2] = { _sep, '\0' };
	char **tmp = NULL, **result = NULL;
	size_t result_capacity = 0;
	size_t result_count = 0;
	int r, saved_errno;
	const char *cur;

	if (!string)
		return calloc(1, sizeof(char *));

	/* Tokenize in place rather than on a stack copy; the input length is
	 * caller-controlled.
	 */
	for (cur = string + strspn(string, sep); *cur; cur += strspn(cur, sep)) {
		const char *start = cur;
		const char *end = cur + strcspn(cur, sep);

		cur = end;

		while (start < end && (*start == ' ' || *start == '\t'))
			start++;

		while (end > start && (end[-1] == ' ' || end[-1] == '\t'))
			end--;

		r = lxc_grow_array((void ***)&result, &result_capacity, result_count + 1, 16);
		if (r < 0)
			goto error_out;

		result[result_count] = strndup(start, (size_t)(end - start));
		if (!result[result_count])
			goto error_out;

		result_count++;
	}

	/* if we allocated too much, reduce it */
	tmp = realloc(result, (result_count + 1) * sizeof(char *));
	if (!tmp)
		goto error_out;

	result = tmp;

	/* Make sure we don't return uninitialized memory. */
	if (result_count == 0)
		*result = NULL;

	return result;

error_out:
	saved_errno = errno;
	lxc_free_array((void **)result, free);
	errno = saved_errno;
	return NULL;
}
995
996void lxc_free_array(void **array, lxc_free_fn element_free_fn)
997{
998 void **p;
b14fc100 999
502657d5
CS
1000 for (p = array; p && *p; p++)
1001 element_free_fn(*p);
b14fc100 1002
502657d5
CS
1003 free((void*)array);
1004}
1005
/*
 * Make sure *@array can hold @new_size elements plus a terminating NULL.
 *
 * @array:              pointer to the array, may point to NULL
 * @capacity:           current number of allocated slots, updated on growth
 * @new_size:           number of elements the caller wants to store
 * @capacity_increment: step by which the capacity grows
 *
 * Newly added slots are zeroed. Returns 0 on success. Returns -1 if the
 * reallocation failed, or with errno set to EINVAL if growth is needed but
 * @capacity_increment is 0; the array is left untouched in both cases.
 */
int lxc_grow_array(void ***array, size_t *capacity, size_t new_size, size_t capacity_increment)
{
	size_t new_capacity;
	void **new_array;

	/* first time around, catch some trivial mistakes of the user
	 * only initializing one of these */
	if (!*array || !*capacity) {
		*array = NULL;
		*capacity = 0;
	}

	new_capacity = *capacity;

	/* A zero increment could never satisfy the request and would loop
	 * forever below.
	 */
	if (new_size + 1 > new_capacity && capacity_increment == 0) {
		errno = EINVAL;
		return -1;
	}

	while (new_size + 1 > new_capacity)
		new_capacity += capacity_increment;

	if (new_capacity != *capacity) {
		/* we have to reallocate */
		new_array = realloc(*array, new_capacity * sizeof(void *));
		if (!new_array)
			return -1;

		memset(&new_array[*capacity], 0, (new_capacity - (*capacity)) * sizeof(void *));
		*array = new_array;
		*capacity = new_capacity;
	}

	/* array has sufficient elements */
	return 0;
}
1036
/*
 * Count the elements of a NULL-terminated pointer array, not including the
 * terminator. A NULL @array has length 0.
 */
size_t lxc_array_len(void **array)
{
	size_t n = 0;

	if (!array)
		return 0;

	while (array[n])
		n++;

	return n;
}
1047
7cea5905
CB
1048int lxc_write_to_file(const char *filename, const void *buf, size_t count,
1049 bool add_newline, mode_t mode)
0e95426b
CS
1050{
1051 int fd, saved_errno;
1052 ssize_t ret;
1053
7cea5905 1054 fd = open(filename, O_WRONLY | O_TRUNC | O_CREAT | O_CLOEXEC, mode);
0e95426b
CS
1055 if (fd < 0)
1056 return -1;
b14fc100 1057
0e95426b
CS
1058 ret = lxc_write_nointr(fd, buf, count);
1059 if (ret < 0)
799f29ab 1060 goto out_error;
b14fc100 1061
0e95426b
CS
1062 if ((size_t)ret != count)
1063 goto out_error;
b14fc100 1064
0e95426b
CS
1065 if (add_newline) {
1066 ret = lxc_write_nointr(fd, "\n", 1);
1067 if (ret != 1)
1068 goto out_error;
1069 }
b14fc100 1070
0e95426b
CS
1071 close(fd);
1072 return 0;
1073
1074out_error:
1075 saved_errno = errno;
1076 close(fd);
1077 errno = saved_errno;
1078 return -1;
1079}
1080
b14fc100 1081int lxc_read_from_file(const char *filename, void *buf, size_t count)
0e95426b
CS
1082{
1083 int fd = -1, saved_errno;
1084 ssize_t ret;
1085
1086 fd = open(filename, O_RDONLY | O_CLOEXEC);
1087 if (fd < 0)
1088 return -1;
1089
1090 if (!buf || !count) {
1091 char buf2[100];
1092 size_t count2 = 0;
6d1400b5 1093
0e95426b
CS
1094 while ((ret = read(fd, buf2, 100)) > 0)
1095 count2 += ret;
6d1400b5 1096
0e95426b
CS
1097 if (ret >= 0)
1098 ret = count2;
1099 } else {
1100 memset(buf, 0, count);
1101 ret = read(fd, buf, count);
1102 }
1103
1104 if (ret < 0)
6d1400b5 1105 SYSERROR("Read %s", filename);
0e95426b
CS
1106
1107 saved_errno = errno;
1108 close(fd);
1109 errno = saved_errno;
1110 return ret;
1111}
799f29ab
ÇO
1112
/*
 * Grow @array, which holds @count elements, by one slot and store NULL in
 * it.
 *
 * With @count == 0 the array is returned unchanged. If the reallocation
 * fails, all @count elements and the array itself are freed and NULL is
 * returned.
 */
void **lxc_append_null_to_array(void **array, size_t count)
{
	void **grown;
	size_t i;

	if (count == 0)
		return array;

	grown = realloc(array, (count + 1) * sizeof(*array));
	if (grown) {
		grown[count] = NULL;
		return grown;
	}

	/* realloc() failed: the original block is still valid, drop it. */
	for (i = 0; i < count; i++)
		free(array[i]);
	free(array);

	return NULL;
}
508c263e
SH
1134
/*
 * Produce a seed for the C library random number generator.
 *
 * The seed is read from /dev/urandom; if that file cannot be opened the
 * seed is time + pid. When @srand_it is true the seed is also passed to
 * srand().
 *
 * Returns the seed.
 */
int randseed(bool srand_it)
{
	FILE *urandom;
	unsigned int seed;

	/* Fallback value, overwritten below when /dev/urandom is readable. */
	seed = time(NULL) + getpid();

	urandom = fopen("/dev/urandom", "r");
	if (urandom) {
		if (fread(&seed, sizeof(seed), 1, urandom) != 1)
			SYSDEBUG("unable to fread /dev/urandom, fallback to time+pid rand seed");

		fclose(urandom);
	}

	if (srand_it)
		srand(seed);

	return seed;
}
5d897655
SH
1157
/*
 * Translate the uid @orig through /proc/self/uid_map.
 *
 * Each line of the map is parsed as "<nsid> <hostid> <range>"; the first
 * line whose [hostid, hostid + range) interval contains @orig decides the
 * result.
 *
 * Returns the mapped id, or 0 if the map cannot be opened or no line
 * matches.
 */
uid_t get_ns_uid(uid_t orig)
{
	uid_t nsid, hostid, range;
	uid_t mapped = 0;
	char *line = NULL;
	size_t sz = 0;
	FILE *f;

	f = fopen("/proc/self/uid_map", "r");
	if (!f)
		return 0;

	while (getline(&line, &sz, f) != -1) {
		if (sscanf(line, "%u %u %u", &nsid, &hostid, &range) != 3)
			continue;

		if (hostid <= orig && hostid + range > orig) {
			mapped = nsid + (orig - hostid);
			break;
		}
	}

	fclose(f);
	free(line);
	return mapped;
}
c476bdce
SH
1184
/*
 * Report whether @path exists and is a directory (symlinks are followed,
 * since stat() is used). Any stat() failure is reported as "no".
 */
bool dir_exists(const char *path)
{
	struct stat sb;

	/* Could be something other than ENOENT, just say "no". */
	if (stat(path, &sb) < 0)
		return false;

	return S_ISDIR(sb.st_mode);
}
93c379f0
ÇO
1197
/* Note we don't use SHA-1 here as we don't want to depend on HAVE_GNUTLS.
 * FNV has good anti collision properties and we're not worried
 * about pre-image resistance or one-way-ness, we're just trying to make
 * the name unique in the 108 bytes of space we have.
 *
 * Folds the @len bytes at @buf into the running hash @hval: for every byte
 * the hash is XORed with the byte and then multiplied by the 64 bit FNV
 * prime. Returns the updated hash; with @len == 0 that is @hval itself.
 */
uint64_t fnv_64a_buf(void *buf, size_t len, uint64_t hval)
{
	/* 64 bit FNV prime: 2^40 + 2^8 + 0xb3. Multiplying by it modulo 2^64
	 * is the same as adding the shifted copies
	 * (<<1, <<4, <<5, <<7, <<8, <<40) to the value itself.
	 */
	const uint64_t fnv_prime = 0x100000001b3ULL;
	const unsigned char *bytes = buf;
	size_t i;

	for (i = 0; i < len; i++) {
		/* xor the bottom with the current octet */
		hval ^= (uint64_t)bytes[i];
		hval *= fnv_prime;
	}

	return hval;
}
2c6f3fc9 1221
/*
 * Return true if /proc/self/mountinfo lists a mount whose mount point is
 * exactly @path and whose optional fields contain a "shared:" tag.
 *
 * A mountinfo line looks like
 *   <id> <parent> <maj:min> <root> <mount point> <options> [optional...] - <fstype> <source> <super options>
 * Only the optional fields (everything between the mount options and the
 * " - " separator) are searched, so that a "shared:" substring in the
 * mount source or the super options cannot cause a false positive.
 *
 * Returns false if mountinfo cannot be opened or no matching entry exists.
 */
bool is_shared_mountpoint(const char *path)
{
	FILE *f;
	char *line = NULL;
	size_t len = 0;
	bool shared = false;

	f = fopen("/proc/self/mountinfo", "r");
	if (!f)
		return false;

	/* getline() grows the buffer, so long lines are never split. */
	while (getline(&line, &len, f) != -1) {
		char *mnt, *mnt_end, *opt, *sep;
		int i;

		/* Skip four fields; mnt ends up on the space before the
		 * mount point.
		 */
		for (mnt = line, i = 0; mnt && i < 4; i++)
			mnt = strchr(mnt + 1, ' ');
		if (!mnt)
			continue;

		mnt_end = strchr(mnt + 1, ' ');
		if (!mnt_end)
			continue;

		*mnt_end = '\0';
		if (strcmp(mnt + 1, path) != 0)
			continue;

		/* This is the path. Skip the mount options field. */
		opt = strchr(mnt_end + 1, ' ');
		if (!opt)
			continue;

		/* Cut the line at the separator that ends the optional
		 * fields.
		 */
		sep = strstr(opt, " - ");
		if (sep)
			*sep = '\0';

		if (strstr(opt, "shared:")) {
			shared = true;
			break;
		}
	}

	free(line);
	fclose(f);
	return shared;
}
1257
/*
 * Detect whether / is mounted MS_SHARED. The check is delegated to
 * is_shared_mountpoint(), which reads /proc/self/mountinfo.
 * Only '/' is examined. If the container rootfs or mount location is
 * MS_SHARED but is not '/', that is not detected here.
 *
 * Returns 1 if / is shared, 0 otherwise.
 */
int detect_shared_rootfs(void)
{
	return is_shared_mountpoint("/") ? 1 : 0;
}
0e6e3a41 1271
51d0854c
DY
/*
 * Move the calling process into namespace @ns of process @pid by opening
 * /proc/<pid>/ns/<ns> and passing the descriptor to setns().
 *
 * Returns true on success, false if the path does not fit, cannot be
 * opened, or setns() fails.
 */
bool switch_to_ns(pid_t pid, const char *ns)
{
	char nspath[MAXPATHLEN];
	int len, nsfd, rc;

	/* Switch to new ns */
	len = snprintf(nspath, MAXPATHLEN, "/proc/%d/ns/%s", pid, ns);
	if (len < 0 || len >= MAXPATHLEN)
		return false;

	nsfd = open(nspath, O_RDONLY);
	if (nsfd < 0) {
		SYSERROR("Failed to open %s", nspath);
		return false;
	}

	rc = setns(nsfd, 0);
	if (rc)
		SYSERROR("Failed to set process %d to %s of %d.", pid, ns, nsfd);

	/* The descriptor is only needed for the setns() call itself. */
	close(nsfd);
	return rc == 0;
}
1297
b7f954bb
SH
/*
 * Report whether the mount at "/" is the kernel's initial rootfs.
 *
 * Looking at fs/proc_namespace.c, it appears the rootfs entry can be
 * expected to very specifically contain
 *   " - rootfs rootfs "
 * IIUC, so long as we've chrooted so that rootfs is not our root,
 * the rootfs entry should always be skipped in mountinfo contents.
 *
 * Returns false if /proc/self/mountinfo cannot be opened.
 */
bool detect_ramfs_rootfs(void)
{
	FILE *mounts;
	char *buf = NULL;
	size_t cap = 0;
	bool found = false;

	mounts = fopen("/proc/self/mountinfo", "r");
	if (!mounts)
		return false;

	while (getline(&buf, &cap, mounts) != -1) {
		char *mnt = buf, *mnt_end, *dash;
		int skipped;

		/* Advance to the space in front of the mount point field. */
		for (skipped = 0; mnt && skipped < 4; skipped++)
			mnt = strchr(mnt + 1, ' ');
		if (!mnt)
			continue;

		mnt_end = strchr(mnt + 1, ' ');
		if (!mnt_end)
			continue;

		*mnt_end = '\0';
		if (strcmp(mnt + 1, "/") != 0)
			continue;

		/* This is '/'. Is it the ramfs? */
		dash = strchr(mnt_end + 1, '-');
		if (dash && strncmp(dash, "- rootfs rootfs ", 16) == 0) {
			found = true;
			break;
		}
	}

	free(buf);
	fclose(mounts);
	return found;
}
1343
/*
 * Search the directories listed in $PATH for an executable named @cmd.
 * When @rootfs is non-NULL each candidate is looked up as
 * "<rootfs>/<entry>/<cmd>", otherwise as "<entry>/<cmd>".
 *
 * Returns a newly allocated copy of the first candidate for which
 * access(X_OK) succeeds (the caller frees it), or NULL if $PATH is unset,
 * memory runs out, or nothing matches.
 */
char *on_path(const char *cmd, const char *rootfs)
{
	char candidate[MAXPATHLEN];
	char *dirs, *dir;
	char *state = NULL;
	int len;

	dirs = getenv("PATH");
	if (!dirs)
		return NULL;

	/* strtok_r() modifies its input, so work on a private copy. */
	dirs = strdup(dirs);
	if (!dirs)
		return NULL;

	for (dir = strtok_r(dirs, ":", &state); dir;
	     dir = strtok_r(NULL, ":", &state)) {
		if (rootfs)
			len = snprintf(candidate, MAXPATHLEN, "%s/%s/%s", rootfs, dir, cmd);
		else
			len = snprintf(candidate, MAXPATHLEN, "%s/%s", dir, cmd);

		/* Candidates that do not fit are skipped. */
		if (len < 0 || len >= MAXPATHLEN)
			continue;

		if (access(candidate, X_OK) == 0) {
			free(dirs);
			return strdup(candidate);
		}
	}

	free(dirs);
	return NULL;
}
76a26f55
SH
1381
/* Return true if stat() succeeds on @f, whatever kind of file it is. */
bool file_exists(const char *f)
{
	struct stat st;
	int rc;

	rc = stat(f, &st);
	return rc == 0;
}
9d9c111c 1388
12983ba4
SH
/* Return true if /proc/self/ns/cgroup exists. */
bool cgns_supported(void)
{
	static const char cgroup_ns_path[] = "/proc/self/ns/cgroup";

	return file_exists(cgroup_ns_path);
}
1393
9d9c111c
SH
1394/* historically lxc-init has been under /usr/lib/lxc and under
1395 * /usr/lib/$ARCH/lxc. It now lives as $prefix/sbin/init.lxc.
1396 */
1397char *choose_init(const char *rootfs)
1398{
1399 char *retv = NULL;
370ec268
SF
1400 const char *empty = "",
1401 *tmp;
9d9c111c 1402 int ret, env_set = 0;
9d9c111c
SH
1403
1404 if (!getenv("PATH")) {
1405 if (setenv("PATH", "/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin", 0))
1406 SYSERROR("Failed to setenv");
b14fc100 1407
9d9c111c
SH
1408 env_set = 1;
1409 }
1410
1411 retv = on_path("init.lxc", rootfs);
1412
1413 if (env_set) {
1414 if (unsetenv("PATH"))
1415 SYSERROR("Failed to unsetenv");
1416 }
1417
1418 if (retv)
1419 return retv;
1420
1421 retv = malloc(PATH_MAX);
1422 if (!retv)
1423 return NULL;
1424
1425 if (rootfs)
370ec268 1426 tmp = rootfs;
9d9c111c 1427 else
370ec268
SF
1428 tmp = empty;
1429
1430 ret = snprintf(retv, PATH_MAX, "%s/%s/%s", tmp, SBINDIR, "/init.lxc");
9d9c111c
SH
1431 if (ret < 0 || ret >= PATH_MAX) {
1432 ERROR("pathname too long");
1433 goto out1;
1434 }
b14fc100 1435
e57cd7e9 1436 if (access(retv, X_OK) == 0)
9d9c111c
SH
1437 return retv;
1438
370ec268 1439 ret = snprintf(retv, PATH_MAX, "%s/%s/%s", tmp, LXCINITDIR, "/lxc/lxc-init");
9d9c111c
SH
1440 if (ret < 0 || ret >= PATH_MAX) {
1441 ERROR("pathname too long");
1442 goto out1;
1443 }
b14fc100 1444
e57cd7e9 1445 if (access(retv, X_OK) == 0)
9d9c111c
SH
1446 return retv;
1447
370ec268 1448 ret = snprintf(retv, PATH_MAX, "%s/usr/lib/lxc/lxc-init", tmp);
9d9c111c
SH
1449 if (ret < 0 || ret >= PATH_MAX) {
1450 ERROR("pathname too long");
1451 goto out1;
1452 }
b14fc100 1453
e57cd7e9 1454 if (access(retv, X_OK) == 0)
9d9c111c
SH
1455 return retv;
1456
370ec268 1457 ret = snprintf(retv, PATH_MAX, "%s/sbin/lxc-init", tmp);
9d9c111c
SH
1458 if (ret < 0 || ret >= PATH_MAX) {
1459 ERROR("pathname too long");
1460 goto out1;
1461 }
b14fc100 1462
e57cd7e9 1463 if (access(retv, X_OK) == 0)
9d9c111c
SH
1464 return retv;
1465
1466 /*
1467 * Last resort, look for the statically compiled init.lxc which we
1468 * hopefully bind-mounted in.
1469 * If we are called during container setup, and we get to this point,
1470 * then the init.lxc.static from the host will need to be bind-mounted
1471 * in. So we return NULL here to indicate that.
1472 */
1473 if (rootfs)
1474 goto out1;
1475
1476 ret = snprintf(retv, PATH_MAX, "/init.lxc.static");
1477 if (ret < 0 || ret >= PATH_MAX) {
1478 WARN("Nonsense - name /lxc.init.static too long");
1479 goto out1;
1480 }
b14fc100 1481
e57cd7e9 1482 if (access(retv, X_OK) == 0)
9d9c111c
SH
1483 return retv;
1484
1485out1:
1486 free(retv);
1487 return NULL;
1488}
735f2c6e
TA
1489
/*
 * Replace the contents of @file with the string @content.
 *
 * Returns 0 if everything was written, -1 if the file could not be opened
 * or the data could not be written completely. Because stdio buffers the
 * output, a write error may only become visible when the stream is
 * flushed, so the result of fclose() is checked as well.
 */
int print_to_file(const char *file, const char *content)
{
	FILE *f;
	int ret = 0;
	int written;

	f = fopen(file, "w");
	if (!f)
		return -1;

	written = fprintf(f, "%s", content);
	if (written < 0 || (size_t)written != strlen(content))
		ret = -1;

	/* fclose() flushes; a failure here means data was lost. */
	if (fclose(f) != 0)
		ret = -1;

	return ret;
}
e1daebd9
SH
1505
/*
 * Return 1 if @path can be stat()ed and is a directory, 0 otherwise
 * (including when stat() fails).
 */
int is_dir(const char *path)
{
	struct stat st;

	if (stat(path, &st) != 0)
		return 0;

	return S_ISDIR(st.st_mode) ? 1 : 0;
}
6010a416
SG
1517
1518/*
1519 * Given the '-t' template option to lxc-create, figure out what to
1520 * do. If the template is a full executable path, use that. If it
1521 * is something like 'sshd', then return $templatepath/lxc-sshd.
1522 * On success return the template, on error return NULL.
1523 */
1524char *get_template_path(const char *t)
1525{
1526 int ret, len;
1527 char *tpath;
1528
1529 if (t[0] == '/' && access(t, X_OK) == 0) {
1530 tpath = strdup(t);
1531 return tpath;
1532 }
1533
1534 len = strlen(LXCTEMPLATEDIR) + strlen(t) + strlen("/lxc-") + 1;
b14fc100 1535
6010a416
SG
1536 tpath = malloc(len);
1537 if (!tpath)
1538 return NULL;
b14fc100 1539
6010a416
SG
1540 ret = snprintf(tpath, len, "%s/lxc-%s", LXCTEMPLATEDIR, t);
1541 if (ret < 0 || ret >= len) {
1542 free(tpath);
1543 return NULL;
1544 }
b14fc100 1545
6010a416
SG
1546 if (access(tpath, X_OK) < 0) {
1547 SYSERROR("bad template: %s", t);
1548 free(tpath);
1549 return NULL;
1550 }
1551
1552 return tpath;
1553}
0a4be28d 1554
592fd47a
SH
/*
 * Step to the next segment of a path whose '/' characters were replaced
 * by '\0'.
 *
 * @path:    the tokenized pathname.
 * @offsetp: in: offset inside (or just before) the segment seen last;
 *           out: offset of the segment returned, or @fulllen if none.
 * @fulllen: length of the original, untokenized path.
 *
 * Returns a pointer to the next path segment, or NULL if done.
 */
static char *get_nextpath(char *path, int *offsetp, int fulllen)
{
	int pos = *offsetp;

	if (pos >= fulllen)
		return NULL;

	/* Run to the end of the segment @pos currently sits in ... */
	for (; path[pos] != '\0' && pos < fulllen; pos++)
		;

	/* ... then over the separator(s) that follow it. */
	for (; path[pos] == '\0' && pos < fulllen; pos++)
		;

	*offsetp = pos;
	if (pos >= fulllen)
		return NULL;

	return &path[pos];
}
1578
/*
 * Check that @subdir equals @dir or lies below it. @len is the length of
 * @dir (passed in to avoid recalculating it) and must be at least 1,
 * since dir[len - 1] is inspected.
 */
static bool is_subdir(const char *subdir, const char *dir, size_t len)
{
	if (strlen(subdir) < len)
		return false;

	if (strncmp(subdir, dir, len) != 0)
		return false;

	/* @dir ends in '/', so the common prefix already ends a component. */
	if (dir[len - 1] == '/')
		return true;

	/* Otherwise the prefix must be followed by '/' or by the end of
	 * @subdir, so that "/ab" is not taken for a child of "/a".
	 */
	return subdir[len] == '/' || subdir[len] == '\0';
}
1601
/*
 * Check whether the open @fd refers to a symlink.
 * Returns -ELOOP if it does, -ENOENT if fstat() failed, 0 if the fd is ok.
 */
static int check_symlink(int fd)
{
	struct stat st;

	if (fstat(fd, &st) < 0)
		return -ENOENT;

	return S_ISLNK(st.st_mode) ? -ELOOP : 0;
}
1620
/*
 * Open @nextpath relative to @dirfd, refusing to follow a symlink.
 *
 * Returns the new fd on success. On failure the result is negative: -1
 * from openat() (errno is ELOOP if the entry is a symlink), or the
 * negative value reported by check_symlink() for the O_PATH fallback.
 *
 * CAVEAT: This function must not be used for other purposes than container
 * setup before executing the container's init
 */
static int open_if_safe(int dirfd, const char *nextpath)
{
	int fd, rc;

	fd = openat(dirfd, nextpath, O_RDONLY | O_NOFOLLOW);

	/* Either it opened (not a symlink, all good) or it is a symlink. */
	if (fd >= 0 || errno == ELOOP)
		return fd;

	if (errno != EPERM && errno != EACCES)
		return fd;

	/* We're not root (cause we got EPERM) so try opening with
	 * O_PATH.
	 */
	fd = openat(dirfd, nextpath, O_PATH | O_NOFOLLOW);
	if (fd < 0)
		return fd;

	/* O_PATH will return an fd for symlinks. We know nextpath wasn't a
	 * symlink at last openat, so if fd is now a link, then something
	 * fishy is going on.
	 */
	rc = check_symlink(fd);
	if (rc < 0) {
		close(fd);
		return rc;
	}

	return fd;
}
1656
/*
 * Open a path intended for mounting, walking it one component at a time
 * so that no symbolic link below @prefix_skip is followed.
 *
 * CAVEAT: This function must not be used for other purposes than container
 * setup before executing the container's init
 *
 * @target: path to be opened
 * @prefix_skip: a part of @target in which to ignore symbolic links. This
 *               would be the container's rootfs. NULL or "" means "/".
 *
 * Return an open fd for the path, or <0 on error.
 */
static int open_without_symlink(const char *target, const char *prefix_skip)
{
	int offset = 0, curfd, target_len, idx;
	char *segments = NULL;

	target_len = strlen(target);

	/* make sure prefix-skip makes sense */
	if (prefix_skip && strlen(prefix_skip) > 0) {
		offset = strlen(prefix_skip);
		if (!is_subdir(target, prefix_skip, offset)) {
			ERROR("WHOA there - target '%s' didn't start with prefix '%s'",
			      target, prefix_skip);
			return -EINVAL;
		}

		/*
		 * get_nextpath() expects its offset argument to be on a
		 * (turned into \0) / or before it, so step back by one to
		 * make sure that happens.
		 */
		if (offset)
			offset--;
	} else {
		prefix_skip = "/";
		offset = 0;
	}

	/* Make a copy of target which we can hack up, and tokenize it */
	segments = strdup(target);
	if (!segments) {
		SYSERROR("Out of memory checking for symbolic link");
		return -ENOMEM;
	}

	for (idx = 0; idx < target_len; idx++)
		if (segments[idx] == '/')
			segments[idx] = '\0';

	curfd = open(prefix_skip, O_RDONLY);

	/* Descend while there is both a valid directory fd and a further
	 * component; each step swaps the parent fd for the child's.
	 */
	while (curfd >= 0) {
		int nextfd, open_errno;
		char *component;

		component = get_nextpath(segments, &offset, target_len);
		if (!component)
			break;

		nextfd = open_if_safe(curfd, component);
		open_errno = errno;
		close(curfd);

		curfd = nextfd;
		if (nextfd < 0) {
			/* close() may have clobbered errno. */
			errno = open_errno;
			if (errno == ELOOP)
				SYSERROR("%s in %s was a symbolic link!", component, target);
		}
	}

	free(segments);
	return curfd;
}
1738
/*
 * Safely mount a path into a container, ensuring that the mount target
 * is under the container's @rootfs. (If @rootfs is NULL, then the container
 * uses the host's /)
 *
 * The destination (and, for relative bind mounts, the source) is opened
 * with open_without_symlink() and the mount is then performed through
 * /proc/self/fd/<fd>.
 *
 * Returns 0 on success and a negative value on failure.
 *
 * CAVEAT: This function must not be used for other purposes than container
 * setup before executing the container's init
 */
int safe_mount(const char *src, const char *dest, const char *fstype,
	       unsigned long flags, const void *data, const char *rootfs)
{
	int destfd, ret, saved_errno;
	/* Only needs enough for /proc/self/fd/<fd>. */
	char srcbuf[50], destbuf[50];
	int srcfd = -1;
	const char *mntsrc = src;

	if (!rootfs)
		rootfs = "";

	/* todo - allow symlinks for relative paths if 'allowsymlinks' option is passed */
	if (flags & MS_BIND && src && src[0] != '/') {
		INFO("this is a relative bind mount");

		srcfd = open_without_symlink(src, NULL);
		if (srcfd < 0)
			return srcfd;

		/* A return value equal to the buffer size already means the
		 * output was truncated, hence ">=".
		 */
		ret = snprintf(srcbuf, sizeof(srcbuf), "/proc/self/fd/%d", srcfd);
		if (ret < 0 || (size_t)ret >= sizeof(srcbuf)) {
			close(srcfd);
			ERROR("Out of memory");
			return -EINVAL;
		}
		mntsrc = srcbuf;
	}

	destfd = open_without_symlink(dest, rootfs);
	if (destfd < 0) {
		if (srcfd != -1) {
			/* Keep the errno of the failed open for the caller. */
			saved_errno = errno;
			close(srcfd);
			errno = saved_errno;
		}

		return destfd;
	}

	ret = snprintf(destbuf, sizeof(destbuf), "/proc/self/fd/%d", destfd);
	if (ret < 0 || (size_t)ret >= sizeof(destbuf)) {
		if (srcfd != -1)
			close(srcfd);

		close(destfd);
		ERROR("Out of memory");
		return -EINVAL;
	}

	ret = mount(mntsrc, destbuf, fstype, flags, data);
	saved_errno = errno;
	if (srcfd != -1)
		close(srcfd);

	close(destfd);
	if (ret < 0) {
		errno = saved_errno;
		SYSERROR("Failed to mount %s onto %s", src ? src : "(null)", dest);
		return ret;
	}

	return 0;
}
1811
ced03a01
SH
1812/*
1813 * Mount a proc under @rootfs if proc self points to a pid other than
1814 * my own. This is needed to have a known-good proc mount for setting
1815 * up LSMs both at container startup and attach.
1816 *
1817 * @rootfs : the rootfs where proc should be mounted
1818 *
1819 * Returns < 0 on failure, 0 if the correct proc was already mounted
1820 * and 1 if a new proc was mounted.
f267d666
BP
1821 *
1822 * NOTE: not to be called from inside the container namespace!
ced03a01 1823 */
943144d9 1824int lxc_mount_proc_if_needed(const char *rootfs)
ced03a01
SH
1825{
1826 char path[MAXPATHLEN];
6b1ba5d6
CB
1827 int link_to_pid, linklen, mypid, ret;
1828 char link[LXC_NUMSTRLEN64] = {0};
ced03a01
SH
1829
1830 ret = snprintf(path, MAXPATHLEN, "%s/proc/self", rootfs);
1831 if (ret < 0 || ret >= MAXPATHLEN) {
1832 SYSERROR("proc path name too long");
1833 return -1;
1834 }
fc2ad9dc 1835
6b1ba5d6 1836 linklen = readlink(path, link, LXC_NUMSTRLEN64);
fc2ad9dc 1837
ced03a01 1838 ret = snprintf(path, MAXPATHLEN, "%s/proc", rootfs);
d539a2b2
CB
1839 if (ret < 0 || ret >= MAXPATHLEN) {
1840 SYSERROR("proc path name too long");
1841 return -1;
1842 }
fc2ad9dc
CB
1843
1844 /* /proc not mounted */
1845 if (linklen < 0) {
1846 if (mkdir(path, 0755) && errno != EEXIST)
1847 return -1;
b14fc100 1848
ced03a01 1849 goto domount;
6b1ba5d6
CB
1850 } else if (linklen >= LXC_NUMSTRLEN64) {
1851 link[linklen - 1] = '\0';
1852 ERROR("readlink returned truncated content: \"%s\"", link);
1853 return -1;
fc2ad9dc
CB
1854 }
1855
0059379f 1856 mypid = lxc_raw_getpid();
6b1ba5d6
CB
1857 INFO("I am %d, /proc/self points to \"%s\"", mypid, link);
1858
2d036cca
CB
1859 if (lxc_safe_int(link, &link_to_pid) < 0)
1860 return -1;
fc2ad9dc 1861
6b1ba5d6
CB
1862 /* correct procfs is already mounted */
1863 if (link_to_pid == mypid)
1864 return 0;
fc2ad9dc 1865
6b1ba5d6
CB
1866 ret = umount2(path, MNT_DETACH);
1867 if (ret < 0)
1868 WARN("failed to umount \"%s\" with MNT_DETACH", path);
ced03a01
SH
1869
1870domount:
fc2ad9dc 1871 /* rootfs is NULL */
6b1ba5d6 1872 if (!strcmp(rootfs, ""))
f267d666
BP
1873 ret = mount("proc", path, "proc", 0, NULL);
1874 else
1875 ret = safe_mount("proc", path, "proc", 0, NULL, rootfs);
f267d666 1876 if (ret < 0)
ced03a01 1877 return -1;
f267d666 1878
fc2ad9dc 1879 INFO("mounted /proc in container for security transition");
ced03a01
SH
1880 return 1;
1881}
69aeabac 1882
/*
 * Open /dev/null for reading and writing.
 * Returns the descriptor, or the negative open() result after logging.
 */
int open_devnull(void)
{
	int nullfd;

	nullfd = open("/dev/null", O_RDWR);
	if (nullfd >= 0)
		return nullfd;

	SYSERROR("Can't open /dev/null");
	return nullfd;
}
69aeabac 1892
f8dd0275
AM
/*
 * Duplicate @fd onto stdin, stdout and stderr, in that order.
 * Returns 0 on success, -1 if @fd is negative or a dup2() call fails (in
 * which case the remaining descriptors are left untouched).
 */
int set_stdfds(int fd)
{
	static const int std_fds[] = { STDIN_FILENO, STDOUT_FILENO, STDERR_FILENO };
	size_t i;

	if (fd < 0)
		return -1;

	for (i = 0; i < sizeof(std_fds) / sizeof(std_fds[0]); i++) {
		if (dup2(fd, std_fds[i]) < 0)
			return -1;
	}

	return 0;
}
1914
/*
 * Point stdin, stdout and stderr at /dev/null.
 * Returns the result of set_stdfds(), or -1 if /dev/null cannot be opened.
 */
int null_stdfds(void)
{
	int nullfd, rc;

	nullfd = open_devnull();
	if (nullfd < 0)
		return -1;

	rc = set_stdfds(nullfd);

	/* The standard descriptors are duplicates; the original can go. */
	close(nullfd);
	return rc;
}
ccb4cabe
SH
1928
/*
 * Return the number of lines in file @fn (counted as the number of
 * successful getline() calls), or -1 if the file cannot be opened.
 */
int lxc_count_file_lines(const char *fn)
{
	FILE *in;
	char *buf = NULL;
	size_t cap = 0;
	int lines;

	in = fopen_cloexec(fn, "r");
	if (!in)
		return -1;

	for (lines = 0; getline(&buf, &cap, in) != -1; lines++)
		;

	free(buf);
	fclose(in);
	return lines;
}
1adbd020 1951
330ae3d3 1952/* Check whether a signal is blocked by a process. */
de3c491b 1953/* /proc/pid-to-str/status\0 = (5 + 21 + 7 + 1) */
eabf1ea9 1954#define __PROC_STATUS_LEN (6 + (LXC_NUMSTRLEN64) + 7 + 1)
573ad77f 1955bool task_blocks_signal(pid_t pid, int signal)
330ae3d3 1956{
330ae3d3 1957 int ret;
de3c491b 1958 char status[__PROC_STATUS_LEN];
eabf1ea9 1959 FILE *f;
573ad77f 1960 uint64_t sigblk = 0, one = 1;
eabf1ea9
CB
1961 size_t n = 0;
1962 bool bret = false;
1963 char *line = NULL;
330ae3d3 1964
de3c491b
CB
1965 ret = snprintf(status, __PROC_STATUS_LEN, "/proc/%d/status", pid);
1966 if (ret < 0 || ret >= __PROC_STATUS_LEN)
330ae3d3
CB
1967 return bret;
1968
1969 f = fopen(status, "r");
1970 if (!f)
1971 return bret;
1972
1973 while (getline(&line, &n, f) != -1) {
573ad77f
CB
1974 char *numstr;
1975
eabf1ea9 1976 if (strncmp(line, "SigBlk:", 7))
6fbcbe3b
CB
1977 continue;
1978
573ad77f
CB
1979 numstr = lxc_trim_whitespace_in_place(line + 7);
1980 ret = lxc_safe_uint64(numstr, &sigblk, 16);
1981 if (ret < 0)
6fbcbe3b 1982 goto out;
573ad77f
CB
1983
1984 break;
330ae3d3
CB
1985 }
1986
573ad77f 1987 if (sigblk & (one << (signal - 1)))
330ae3d3
CB
1988 bret = true;
1989
1990out:
1991 free(line);
1992 fclose(f);
1993 return bret;
1994}
000dfda7
CB
1995
/*
 * Grow the NULL-terminated pointer array *@list by one slot.
 *
 * The array is reallocated to hold one more entry plus the terminator and
 * the new terminator is written. The new slot itself is NOT initialized;
 * the caller is expected to fill it.
 *
 * Returns the index of the new slot, or -1 if realloc() fails (*@list is
 * left unchanged in that case).
 */
static int lxc_append_null_to_list(void ***list)
{
	void **grown;
	int count = 0;

	/* Count the existing entries; a NULL list counts as empty. */
	if (*list)
		while ((*list)[count])
			count++;

	grown = realloc(*list, (count + 2) * sizeof(void **));
	if (!grown)
		return -1;

	grown[count + 1] = NULL;
	*list = grown;

	return count;
}
2015
/*
 * Append a copy of @entry to the NULL-terminated string array *@list.
 *
 * The string is duplicated before the list is grown so that a failed
 * strdup() cannot leave an uninitialized slot in front of the terminator.
 *
 * Returns 0 on success, -1 if memory could not be allocated; on failure
 * the list contents are unchanged.
 */
int lxc_append_string(char ***list, char *entry)
{
	char *copy;
	int newentry;

	copy = strdup(entry);
	if (!copy)
		return -1;

	newentry = lxc_append_null_to_list((void ***)list);
	if (newentry < 0) {
		free(copy);
		return -1;
	}

	(*list)[newentry] = copy;

	return 0;
}
a687256f
CB
2033
/*
 * Open /proc/<pid>/ns/<ns> read-only with O_CLOEXEC and return the fd.
 *
 * Passing NULL or the empty string for @ns opens /proc/<pid>/ns itself;
 * this way the function can also be used to check whether namespaces are
 * supported by the kernel.
 *
 * Returns the open() result, or -1 with errno set to EFBIG when the path
 * does not fit into the internal buffer.
 */
int lxc_preserve_ns(const int pid, const char *ns)
{
/* 5 /proc + 21 /int_as_str + 3 /ns + 20 /NS_NAME + 1 \0 */
#define __NS_PATH_LEN 50
	char path[__NS_PATH_LEN];
	const char *sep = "/";
	int len;

	/* No namespace name: drop both the separator and the name. */
	if (!ns || strcmp(ns, "") == 0) {
		sep = "";
		ns = "";
	}

	len = snprintf(path, __NS_PATH_LEN, "/proc/%d/ns%s%s", pid, sep, ns);
	if (len < 0 || (size_t)len >= __NS_PATH_LEN) {
		errno = EFBIG;
		return -1;
	}

	return open(path, O_RDONLY | O_CLOEXEC);
}
6bc2eafe
CB
2055
/*
 * Convert @numstr to an unsigned int.
 *
 * Leading whitespace is skipped, a leading '-' is rejected, and the base
 * is auto-detected by strtoul() (base 0). The whole remaining string must
 * be consumed.
 *
 * Returns 0 and stores the value in *@converted on success, -EINVAL for
 * malformed or negative input, -ERANGE if the value does not fit.
 */
int lxc_safe_uint(const char *numstr, unsigned int *converted)
{
	char *err = NULL;
	unsigned long int uli;

	/* <ctype.h> functions require a value representable as unsigned
	 * char; a plain char may be negative.
	 */
	while (isspace((unsigned char)*numstr))
		numstr++;

	if (*numstr == '-')
		return -EINVAL;

	errno = 0;
	uli = strtoul(numstr, &err, 0);
	if (errno == ERANGE && uli == ULONG_MAX)
		return -ERANGE;

	if (err == numstr || *err != '\0')
		return -EINVAL;

	if (uli > UINT_MAX)
		return -ERANGE;

	*converted = (unsigned int)uli;
	return 0;
}
b5f845e7 2081
681188c1
CB
/*
 * Convert @numstr to an unsigned long.
 *
 * Leading whitespace is skipped, a leading '-' is rejected, and the base
 * is auto-detected by strtoul() (base 0). The whole remaining string must
 * be consumed.
 *
 * Returns 0 and stores the value in *@converted on success, -EINVAL for
 * malformed or negative input, -ERANGE on overflow.
 */
int lxc_safe_ulong(const char *numstr, unsigned long *converted)
{
	char *err = NULL;
	unsigned long int uli;

	/* <ctype.h> functions require a value representable as unsigned
	 * char; a plain char may be negative.
	 */
	while (isspace((unsigned char)*numstr))
		numstr++;

	if (*numstr == '-')
		return -EINVAL;

	errno = 0;
	uli = strtoul(numstr, &err, 0);
	if (errno == ERANGE && uli == ULONG_MAX)
		return -ERANGE;

	if (err == numstr || *err != '\0')
		return -EINVAL;

	*converted = uli;
	return 0;
}
2104
/*
 * Convert @numstr to a uint64_t using the given @base (as understood by
 * strtoull()).
 *
 * Leading whitespace is skipped, a leading '-' is rejected, and the whole
 * remaining string must be consumed.
 *
 * Returns 0 and stores the value in *@converted on success, -EINVAL for
 * malformed or negative input, -ERANGE on overflow.
 */
int lxc_safe_uint64(const char *numstr, uint64_t *converted, int base)
{
	char *err = NULL;
	uint64_t u;

	/* <ctype.h> functions require a value representable as unsigned
	 * char; a plain char may be negative.
	 */
	while (isspace((unsigned char)*numstr))
		numstr++;

	if (*numstr == '-')
		return -EINVAL;

	errno = 0;
	u = strtoull(numstr, &err, base);
	if (errno == ERANGE && u == ULLONG_MAX)
		return -ERANGE;

	if (err == numstr || *err != '\0')
		return -EINVAL;

	*converted = u;
	return 0;
}
2127
b5f845e7
CB
/*
 * Convert @numstr to an int with strtol() (base 0, so "0x" and "0"
 * prefixes are honoured). The whole string must be consumed.
 *
 * Returns 0 and stores the value in *@converted on success, -EINVAL for
 * malformed input, -ERANGE if the value does not fit into an int.
 */
int lxc_safe_int(const char *numstr, int *converted)
{
	char *end = NULL;
	long val;

	errno = 0;
	val = strtol(numstr, &end, 0);

	/* Out of range for long. */
	if (errno == ERANGE && (val == LONG_MAX || val == LONG_MIN))
		return -ERANGE;

	/* Conversion error, no digits at all, or trailing garbage. */
	if ((errno != 0 && val == 0) || end == numstr || *end != '\0')
		return -EINVAL;

	/* Fits a long but not an int. */
	if (val < INT_MIN || val > INT_MAX)
		return -ERANGE;

	*converted = (int)val;
	return 0;
}
8c57d930
CB
2150
/*
 * Convert @numstr to a long with strtol() (base 0). The whole string must
 * be consumed.
 *
 * Returns 0 and stores the value in *@converted on success, -EINVAL for
 * malformed input, -ERANGE on overflow or underflow.
 */
int lxc_safe_long(const char *numstr, long int *converted)
{
	char *end = NULL;
	long val;

	errno = 0;
	val = strtol(numstr, &end, 0);

	/* Out of range for long. */
	if (errno == ERANGE && (val == LONG_MAX || val == LONG_MIN))
		return -ERANGE;

	/* Conversion error, no digits at all, or trailing garbage. */
	if ((errno != 0 && val == 0) || end == numstr || *end != '\0')
		return -EINVAL;

	*converted = val;
	return 0;
}
dbaf55a3 2170
b037bc67
CB
/*
 * Convert @numstr to a long long with strtoll() (base 0). The whole string
 * must be consumed.
 *
 * Returns 0 and stores the value in *@converted on success, -EINVAL for
 * malformed input, -ERANGE on overflow or underflow.
 */
int lxc_safe_long_long(const char *numstr, long long int *converted)
{
	char *end = NULL;
	long long val;

	errno = 0;
	val = strtoll(numstr, &end, 0);

	/* Out of range for long long. */
	if (errno == ERANGE && (val == LLONG_MAX || val == LLONG_MIN))
		return -ERANGE;

	/* Conversion error, no digits at all, or trailing garbage. */
	if ((errno != 0 && val == 0) || end == numstr || *end != '\0')
		return -EINVAL;

	*converted = val;
	return 0;
}
2190
dbaf55a3
CB
/*
 * Switch the calling process to @gid and then to @uid, logging each step.
 * The group is changed first, before the uid change.
 *
 * Returns 0 on success, or -errno as observed after the failure has been
 * logged.
 */
int lxc_switch_uid_gid(uid_t uid, gid_t gid)
{
	int rc;

	rc = setgid(gid);
	if (rc < 0) {
		SYSERROR("Failed to switch to gid %d.", gid);
		return -errno;
	}
	NOTICE("Switched to gid %d.", gid);

	rc = setuid(uid);
	if (rc < 0) {
		SYSERROR("Failed to switch to uid %d.", uid);
		return -errno;
	}
	NOTICE("Switched to uid %d.", uid);

	return 0;
}
2207
/* Simple convenience wrapper around setgroups() which enables uniform
 * logging. Returns 0 on success, or -errno as observed after the failure
 * has been logged.
 */
int lxc_setgroups(int size, gid_t list[])
{
	int rc;

	rc = setgroups(size, list);
	if (rc < 0) {
		SYSERROR("Failed to setgroups().");
		return -errno;
	}
	NOTICE("Dropped additional groups.");

	return 0;
}
c6868a1f
CB
2219
/*
 * Find an unused loop device by scanning /dev for entries named "loop*".
 *
 * A device counts as unused only when LOOP_GET_STATUS64 fails with ENXIO,
 * which is how the loop driver reports a device with no backing file. A
 * successful status query means the device is already in use, and any
 * other error means the entry cannot be used, so both are skipped.
 *
 * @loop_name: buffer of at least LO_NAME_SIZE bytes that receives the
 *             "/dev/<name>" path of the device found.
 *
 * Returns an fd (opened O_RDWR | O_CLOEXEC) for the device, or -1 if none
 * was found.
 */
static int lxc_get_unused_loop_dev_legacy(char *loop_name)
{
	struct dirent *dp;
	struct loop_info64 lo64;
	DIR *dir;
	int dfd, fd = -1, ret;

	dir = opendir("/dev");
	if (!dir)
		return -1;

	dfd = dirfd(dir);
	if (dfd < 0) {
		closedir(dir);
		return -1;
	}

	while ((dp = readdir(dir))) {
		if (strncmp(dp->d_name, "loop", 4) != 0)
			continue;

		fd = openat(dfd, dp->d_name, O_RDWR | O_CLOEXEC);
		if (fd < 0)
			continue;

		ret = ioctl(fd, LOOP_GET_STATUS64, &lo64);
		if (ret == 0 || errno != ENXIO) {
			/* In use, or not a usable loop device at all. */
			close(fd);
			fd = -1;
			continue;
		}

		ret = snprintf(loop_name, LO_NAME_SIZE, "/dev/%s", dp->d_name);
		if (ret < 0 || ret >= LO_NAME_SIZE) {
			close(fd);
			fd = -1;
			continue;
		}

		break;
	}

	closedir(dir);

	if (fd < 0)
		return -1;

	return fd;
}
2270
/*
 * Ask /dev/loop-control for a free loop device and open it.
 *
 * @name_loop: buffer of at least LO_NAME_SIZE bytes that receives the
 *             "/dev/loop<N>" path.
 *
 * Returns an fd for the loop device, -ENODEV if /dev/loop-control cannot
 * be opened, or -1 on any later failure.
 */
static int lxc_get_unused_loop_dev(char *name_loop)
{
	int ctl_fd, free_nr, len;
	int dev_fd = -1;

	ctl_fd = open("/dev/loop-control", O_RDWR | O_CLOEXEC);
	if (ctl_fd < 0)
		return -ENODEV;

	free_nr = ioctl(ctl_fd, LOOP_CTL_GET_FREE);
	if (free_nr >= 0) {
		len = snprintf(name_loop, LO_NAME_SIZE, "/dev/loop%d", free_nr);
		if (len >= 0 && len < LO_NAME_SIZE)
			dev_fd = open(name_loop, O_RDWR | O_CLOEXEC);
	}

	close(ctl_fd);
	return dev_fd;
}
2296
/*
 * Attach the image file @source to a free loop device.
 *
 * A free device is obtained via /dev/loop-control; if that control node
 * is unavailable (-ENODEV) the legacy scan of /dev is used instead.
 *
 * @source:   path of the backing file, opened O_RDWR.
 * @loop_dev: buffer of at least LO_NAME_SIZE bytes receiving the device path.
 * @flags:    stored in lo_flags of the LOOP_SET_STATUS64 request.
 *
 * Returns an open fd for the configured loop device, or -1 on failure. If
 * configuring the device fails after the backing file was attached, the
 * file is detached again so that the device is not left bound.
 */
int lxc_prepare_loop_dev(const char *source, char *loop_dev, int flags)
{
	int ret, saved_errno;
	struct loop_info64 lo64;
	int fd_img = -1, fret = -1, fd_loop = -1;
	bool bound = false;

	fd_loop = lxc_get_unused_loop_dev(loop_dev);
	if (fd_loop == -ENODEV)
		fd_loop = lxc_get_unused_loop_dev_legacy(loop_dev);

	/* Without a loop device there is nothing to set up. */
	if (fd_loop < 0)
		return -1;

	fd_img = open(source, O_RDWR | O_CLOEXEC);
	if (fd_img < 0)
		goto on_error;

	ret = ioctl(fd_loop, LOOP_SET_FD, fd_img);
	if (ret < 0)
		goto on_error;
	bound = true;

	memset(&lo64, 0, sizeof(lo64));
	lo64.lo_flags = flags;

	ret = ioctl(fd_loop, LOOP_SET_STATUS64, &lo64);
	if (ret < 0)
		goto on_error;

	fret = 0;

on_error:
	/* Preserve the errno of the failing call across the cleanup. */
	saved_errno = errno;

	if (fd_img >= 0)
		close(fd_img);

	if (fret < 0) {
		/* Best effort: release the backing file again. */
		if (bound)
			(void)ioctl(fd_loop, LOOP_CLR_FD, 0);

		close(fd_loop);
		fd_loop = -1;
		errno = saved_errno;
	}

	return fd_loop;
}
74251e49
CB
2339
/*
 * Unmount everything stacked on @path by calling umount2() until it fails.
 *
 * @lazy selects MNT_DETACH. A failure with EINVAL ends the loop normally.
 * Anything else than EINVAL is considered deadly to prevent going into an
 * infinite loop. (The other alternative is constantly parsing
 * /proc/self/mountinfo which is yucky and probably racy.)
 *
 * Returns the number of successful unmounts (saturating at INT_MAX), or
 * -errno for a failure other than EINVAL.
 */
int lxc_unstack_mountpoint(const char *path, bool lazy)
{
	const int flags = lazy ? MNT_DETACH : 0;
	int umounts = 0;

	/* Each success may have uncovered another mount underneath, so keep
	 * going until umount2() reports an error.
	 */
	while (umount2(path, flags) >= 0) {
		/* Just stop counting when this happens. That'd just be so
		 * stupid that we won't even bother trying to report back the
		 * correct value anymore.
		 */
		if (umounts != INT_MAX)
			umounts++;
	}

	if (errno != EINVAL)
		return -errno;

	return umounts;
}
ea3a694f
CB
2371
/*
 * Run @child_fn(@args) in a child process and capture its output.
 *
 * The child's stdout and stderr are redirected into a pipe. If @buf is
 * non-NULL and @buf_size > 0, the parent performs a single read() of at
 * most @buf_size - 1 bytes into @buf and overwrites the last byte read
 * with '\0' (NOTE(review): presumably to drop a trailing newline -
 * confirm). @buf always starts out as the empty string so callers never
 * see uninitialized memory.
 *
 * Returns the result of wait_for_pid() for the child, or -1 if the pipe or
 * the child could not be created.
 */
int run_command(char *buf, size_t buf_size, int (*child_fn)(void *), void *args)
{
	const bool want_output = buf && buf_size > 0;
	int fds[2];
	int status;
	pid_t pid;

	/* Make sure our callers do not receive uninitialized memory. */
	if (want_output)
		buf[0] = '\0';

	if (pipe(fds) < 0) {
		SYSERROR("failed to create pipe");
		return -1;
	}

	pid = lxc_raw_clone(0);
	if (pid < 0) {
		close(fds[0]);
		close(fds[1]);
		SYSERROR("failed to create new process");
		return -1;
	}

	if (pid == 0) {
		int rc;

		/* Close the read-end of the pipe. */
		close(fds[0]);

		/* Redirect std{err,out} to write-end of the pipe. */
		rc = dup2(fds[1], STDOUT_FILENO);
		if (rc >= 0)
			rc = dup2(fds[1], STDERR_FILENO);

		/* Close the write-end of the pipe. */
		close(fds[1]);

		if (rc < 0) {
			SYSERROR("failed to duplicate std{err,out} file descriptor");
			_exit(EXIT_FAILURE);
		}

		/* Does not return. */
		child_fn(args);
		ERROR("failed to exec command");
		_exit(EXIT_FAILURE);
	}

	/* close the write-end of the pipe */
	close(fds[1]);

	if (want_output) {
		ssize_t nread;

		nread = read(fds[0], buf, buf_size - 1);
		if (nread > 0)
			buf[nread - 1] = '\0';
	}

	status = wait_for_pid(pid);
	/* close the read-end of the pipe */
	close(fds[0]);

	return status;
}
04ad7ffe
CB
2435
/*
 * Build a newly allocated path from @first and a NULL-terminated list of
 * further components. A '/' is inserted in front of every component that
 * does not already start with one.
 *
 * Allocation goes through must_copy_string()/must_realloc(); the caller
 * frees the result.
 */
char *must_make_path(const char *first, ...)
{
	va_list ap;
	char *part, *path;
	size_t path_len = strlen(first);
	size_t alloc_len;

	path = must_copy_string(first);

	va_start(ap, first);
	for (part = va_arg(ap, char *); part != NULL; part = va_arg(ap, char *)) {
		bool need_sep = part[0] != '/';

		path_len += strlen(part);
		if (need_sep)
			path_len++;

		/* Room for the joined string plus the terminating NUL. */
		alloc_len = path_len + 1;
		path = must_realloc(path, alloc_len);

		if (need_sep)
			(void)strlcat(path, "/", alloc_len);
		(void)strlcat(path, part, alloc_len);
	}
	va_end(ap);

	return path;
}
2462
0c3deb94
CB
/*
 * Append a NULL-terminated list of path components to the heap string
 * @first.
 *
 * @first is grown with must_realloc(), so the caller must use the returned
 * pointer afterwards instead of @first. A "/" is inserted in front of every
 * component that does not already start with "/".
 */
char *must_append_path(char *first, ...)
{
	va_list ap;
	char *part;
	char *path = first;
	size_t path_len;

	path_len = strlen(first);

	va_start(ap, first);
	for (part = va_arg(ap, char *); part != NULL; part = va_arg(ap, char *)) {
		bool need_sep = (part[0] != '/');
		size_t capacity;

		/* Account for the component and, if needed, its separator. */
		path_len += strlen(part);
		if (need_sep)
			path_len++;

		/* One extra byte for the terminating '\0'. */
		capacity = path_len + 1;
		path = must_realloc(path, capacity);

		if (need_sep)
			(void)strlcat(path, "/", capacity);
		(void)strlcat(path, part, capacity);
	}
	va_end(ap);

	return path;
}
2489
04ad7ffe
CB
/*
 * Duplicate @entry on the heap.
 *
 * Returns NULL only when @entry itself is NULL. Otherwise strdup() is
 * retried until it succeeds, so the result is never NULL for a non-NULL
 * input. The caller frees the returned string.
 */
char *must_copy_string(const char *entry)
{
	char *copy = NULL;

	if (entry == NULL)
		return NULL;

	/* Keep retrying: this helper is not allowed to fail. */
	while (copy == NULL)
		copy = strdup(entry);

	return copy;
}
2503
/*
 * Resize @orig to @sz bytes, retrying realloc() until it succeeds.
 *
 * Never returns NULL. A request for zero bytes is rounded up to one byte:
 * realloc(ptr, 0) is allowed to free @orig and return NULL, which would make
 * the retry loop call realloc() again on an already freed pointer.
 *
 * The caller owns the returned memory and must no longer use @orig.
 */
void *must_realloc(void *orig, size_t sz)
{
	void *ret;

	if (sz == 0)
		sz = 1;

	do {
		ret = realloc(orig, sz);
	} while (!ret);

	return ret;
}
a035c53a
CB
2514
2515bool is_fs_type(const struct statfs *fs, fs_type_magic magic_val)
2516{
2517 return (fs->f_type == (fs_type_magic)magic_val);
2518}
2519
2520bool has_fs_type(const char *path, fs_type_magic magic_val)
2521{
2522 bool has_type;
2523 int ret;
2524 struct statfs sb;
2525
2526 ret = statfs(path, &sb);
2527 if (ret < 0)
2528 return false;
2529
2530 has_type = is_fs_type(&sb, magic_val);
2531 if (!has_type && magic_val == RAMFS_MAGIC)
2532 WARN("When the ramfs it a tmpfs statfs() might report tmpfs");
2533
2534 return has_type;
2535}
d75c14e2
CB
2536
/*
 * Check whether the network interface @nic exists by looking for
 * /sys/class/net/<nic>.
 *
 * The special name "none" is always reported as existing. A NULL @nic, a
 * name that does not fit into the path buffer, or a failing stat() all
 * yield false.
 */
bool lxc_nic_exists(char *nic)
{
/* 15 == strlen("/sys/class/net/"), plus the name and the trailing '\0'. */
#define __LXC_SYS_CLASS_NET_LEN (15 + IFNAMSIZ + 1)
	char path[__LXC_SYS_CLASS_NET_LEN];
	int ret;
	struct stat sb;

	if (!nic)
		return false;

	if (!strcmp(nic, "none"))
		return true;

	ret = snprintf(path, sizeof(path), "/sys/class/net/%s", nic);
	if (ret < 0 || (size_t)ret >= sizeof(path))
		return false;

	ret = stat(path, &sb);
	if (ret < 0)
		return false;

	return true;
}
127c6e70
CB
2557
/*
 * Create a temporary file from the mkstemp() pattern @template.
 *
 * The process umask is set to 0022 for the duration of the mkstemp() call
 * and restored afterwards. When @rm is true the file is unlinked right away
 * and only the open descriptor remains.
 *
 * Returns the open file descriptor, or -1 if mkstemp() or unlink() failed.
 * On an unlink() failure the descriptor is closed first.
 */
int lxc_make_tmpfile(char *template, bool rm)
{
	mode_t saved_mask;
	int fd;

	saved_mask = umask(0022);
	fd = mkstemp(template);
	umask(saved_mask);
	if (fd < 0)
		return -1;

	if (rm && unlink(template) < 0) {
		close(fd);
		return -1;
	}

	return fd;
}
e4636123 2580
e3db0162
CB
2581int parse_byte_size_string(const char *s, int64_t *converted)
2582{
2583 int ret, suffix_len;
2584 long long int conv;
2585 int64_t mltpl, overflow;
2586 char *end;
2587 char dup[LXC_NUMSTRLEN64 + 2];
a13560af 2588 char suffix[3] = {0};
e3db0162
CB
2589
2590 if (!s || !strcmp(s, ""))
2591 return -EINVAL;
2592
ccd42a31 2593 end = stpncpy(dup, s, sizeof(dup) - 1);
e3db0162
CB
2594 if (*end != '\0')
2595 return -EINVAL;
2596
2597 if (isdigit(*(end - 1)))
2598 suffix_len = 0;
2599 else if (isalpha(*(end - 1)))
2600 suffix_len = 1;
2601 else
2602 return -EINVAL;
2603
c2229b24 2604 if (suffix_len > 0 && (end - 2) == dup && !isdigit(*(end - 2)))
e3db0162
CB
2605 return -EINVAL;
2606
358b8c81
CB
2607 if (suffix_len > 0 && isalpha(*(end - 2)))
2608 suffix_len++;
e3db0162
CB
2609
2610 if (suffix_len > 0) {
2611 memcpy(suffix, end - suffix_len, suffix_len);
2612 *(suffix + suffix_len) = '\0';
2613 *(end - suffix_len) = '\0';
2614 }
2615 dup[lxc_char_right_gc(dup, strlen(dup))] = '\0';
2616
2617 ret = lxc_safe_long_long(dup, &conv);
2618 if (ret < 0)
2619 return -ret;
2620
2621 if (suffix_len != 2) {
2622 *converted = conv;
2623 return 0;
2624 }
2625
6d276edc 2626 if (strcasecmp(suffix, "KB") == 0)
e3db0162 2627 mltpl = 1024;
6d276edc 2628 else if (strcasecmp(suffix, "MB") == 0)
e3db0162 2629 mltpl = 1024 * 1024;
6d276edc 2630 else if (strcasecmp(suffix, "GB") == 0)
e3db0162
CB
2631 mltpl = 1024 * 1024 * 1024;
2632 else
2633 return -EINVAL;
2634
2635 overflow = conv * mltpl;
2636 if (conv != 0 && (overflow / conv) != mltpl)
2637 return -ERANGE;
2638
2639 *converted = overflow;
2640 return 0;
2641}
6222c3f4
CB
2642
/*
 * Round @n up to the nearest power of two.
 *
 * Returns @n itself when it already is a power of two, and 0 for an input
 * of 0, since 0 is not a valid power of two. The left shift is done in
 * uint64_t, so inputs above 2^63 wrap around to 0.
 */
uint64_t lxc_find_next_power2(uint64_t n)
{
	uint64_t top_bit = n;

	if (n == 0)
		return 0;

	/* Clear the lowest set bit until only the highest one is left. */
	while ((top_bit & (top_bit - 1)) != 0)
		top_bit &= top_bit - 1;

	/* Only one bit was set to begin with: already a power of two. */
	if (top_bit == n)
		return n;

	return top_bit << 1;
}
1fd0f41e
CB
2660
/*
 * Ask the kernel to deliver @signal to this process when its parent dies
 * (PR_SET_PDEATHSIG).
 *
 * After the prctl() call the parent pid is read with a raw getppid syscall.
 * If it is 1 the process treats itself as orphaned and sends itself SIGKILL.
 *
 * Returns 0 on success and -1 if prctl() or kill() failed.
 */
int lxc_set_death_signal(int signal)
{
	int ret;

	ret = prctl(PR_SET_PDEATHSIG, signal, 0, 0, 0);

	/* Check whether we have been orphaned. */
	if ((pid_t)syscall(SYS_getppid) == 1) {
		ret = kill(lxc_raw_getpid(), SIGKILL);
		if (ret < 0)
			return -1;
	}

	if (ret >= 0)
		return 0;

	SYSERROR("Failed to set PR_SET_PDEATHSIG to %d", signal);
	return -1;
}
7ad37670
CB
2686
/*
 * Strip every trailing '\n' from the string @l in place.
 *
 * Newlines that are followed by other characters are left alone. A NULL
 * pointer is ignored. The scan works on an index rather than a decrementing
 * pointer, so no pointer before the start of @l is ever formed, even for
 * empty or all-newline strings.
 */
void remove_trailing_newlines(char *l)
{
	size_t len;

	if (!l)
		return;

	len = strlen(l);
	while (len > 0 && l[len - 1] == '\n')
		l[--len] = '\0';
}
a9d4ebc1
CB
2697
/*
 * Set (@cloexec == true) or clear (@cloexec == false) the FD_CLOEXEC flag
 * on @fd.
 *
 * The descriptor flags are only written back when they actually change.
 * Returns 0 on success and -errno if either fcntl() call fails.
 */
int fd_cloexec(int fd, bool cloexec)
{
	int current, wanted;

	current = fcntl(fd, F_GETFD, 0);
	if (current < 0)
		return -errno;

	wanted = cloexec ? (current | FD_CLOEXEC) : (current & ~FD_CLOEXEC);

	/* Only touch the descriptor if the flag really has to change. */
	if (wanted != current && fcntl(fd, F_SETFD, wanted) < 0)
		return -errno;

	return 0;
}
d7ab0375 2719
/*
 * Remove the directory @dirname together with all directories below it.
 *
 * Only directories are descended into and removed with rmdir(). Entries
 * that are not directories are skipped, so rmdir() fails on a tree that
 * still contains such entries.
 *
 * The walk continues after an error. Only the first failure is logged, and
 * the function returns -1 if anything went wrong, 0 otherwise.
 */
int recursive_destroy(char *dirname)
{
	int ret;
	struct dirent *direntp;
	DIR *dir;
	int r = 0;

	dir = opendir(dirname);
	if (!dir)
		return -1;

	while ((direntp = readdir(dir))) {
		char *pathname;
		struct stat mystat;

		if (!strcmp(direntp->d_name, ".") ||
		    !strcmp(direntp->d_name, ".."))
			continue;

		pathname = must_make_path(dirname, direntp->d_name, NULL);

		/* lstat() so that symlinks are never followed. */
		ret = lstat(pathname, &mystat);
		if (ret < 0) {
			if (!r)
				SYSWARN("Failed to stat \"%s\"", pathname);

			r = -1;
			goto next;
		}

		if (!S_ISDIR(mystat.st_mode))
			goto next;

		ret = recursive_destroy(pathname);
		if (ret < 0)
			r = -1;

	next:
		free(pathname);
	}

	ret = rmdir(dirname);
	if (ret < 0) {
		if (!r)
			SYSWARN("Failed to delete \"%s\"", dirname);

		r = -1;
	}

	ret = closedir(dir);
	if (ret < 0) {
		if (!r)
			SYSWARN("Failed to close directory \"%s\"", dirname);

		r = -1;
	}

	return r;
}