]> git.proxmox.com Git - mirror_lxc.git/blob - src/lxc/lxccontainer.c
seccomp: SECCOMP_RET_USER_NOTIF support
[mirror_lxc.git] / src / lxc / lxccontainer.c
1 /* liblxcapi
2 *
3 * Copyright © 2012 Serge Hallyn <serge.hallyn@ubuntu.com>.
4 * Copyright © 2012 Canonical Ltd.
5 *
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
10
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 */
20
21 #ifndef _GNU_SOURCE
22 #define _GNU_SOURCE 1
23 #endif
24 #include <arpa/inet.h>
25 #include <dirent.h>
26 #include <errno.h>
27 #include <fcntl.h>
28 #include <grp.h>
29 #include <libgen.h>
30 #include <pthread.h>
31 #include <sched.h>
32 #include <stdarg.h>
33 #include <stdint.h>
34 #include <stdio.h>
35 #include <stdlib.h>
36 #include <sys/file.h>
37 #include <sys/mman.h>
38 #include <sys/mount.h>
39 #include <sys/stat.h>
40 #include <sys/syscall.h>
41 #include <sys/sysmacros.h>
42 #include <sys/types.h>
43 #include <sys/wait.h>
44 #include <unistd.h>
45
46 #include "../include/netns_ifaddrs.h"
47 #include "af_unix.h"
48 #include "api_extensions.h"
49 #include "attach.h"
50 #include "cgroup.h"
51 #include "commands.h"
52 #include "commands_utils.h"
53 #include "conf.h"
54 #include "config.h"
55 #include "confile.h"
56 #include "confile_utils.h"
57 #include "criu.h"
58 #include "error.h"
59 #include "initutils.h"
60 #include "log.h"
61 #include "lxc.h"
62 #include "lxccontainer.h"
63 #include "lxclock.h"
64 #include "memory_utils.h"
65 #include "monitor.h"
66 #include "namespace.h"
67 #include "network.h"
68 #include "parse.h"
69 #include "raw_syscalls.h"
70 #include "start.h"
71 #include "state.h"
72 #include "storage.h"
73 #include "storage/btrfs.h"
74 #include "storage/overlay.h"
75 #include "storage_utils.h"
76 #include "sync.h"
77 #include "syscall_wrappers.h"
78 #include "terminal.h"
79 #include "utils.h"
80 #include "version.h"
81
82 /* major()/minor() */
83 #ifdef MAJOR_IN_MKDEV
84 #include <sys/mkdev.h>
85 #endif
86
87 #if IS_BIONIC
88 #include <../include/lxcmntent.h>
89 #else
90 #include <mntent.h>
91 #endif
92
93 #ifndef HAVE_STRLCPY
94 #include "include/strlcpy.h"
95 #endif
96
97 /* Define faccessat() if missing from the C library */
98 #ifndef HAVE_FACCESSAT
/*
 * Fallback faccessat() compiled only when HAVE_FACCESSAT is not defined.
 *
 * Forwards the four arguments to the raw faccessat syscall when the syscall
 * number __NR_faccessat is known at build time. Otherwise the call always
 * fails: errno is set to ENOSYS and -1 is returned.
 */
static int faccessat(int dirfd, const char *pathname, int mode, int flags)
{
#ifndef __NR_faccessat
	errno = ENOSYS;
	return -1;
#else
	return syscall(__NR_faccessat, dirfd, pathname, mode, flags);
#endif
}
108 #endif
109
110 lxc_log_define(lxccontainer, lxc);
111
112 static bool do_lxcapi_destroy(struct lxc_container *c);
113 static const char *lxcapi_get_config_path(struct lxc_container *c);
114 #define do_lxcapi_get_config_path(c) lxcapi_get_config_path(c)
115 static bool do_lxcapi_set_config_item(struct lxc_container *c, const char *key, const char *v);
116 static bool container_destroy(struct lxc_container *c,
117 struct lxc_storage *storage);
118 static bool get_snappath_dir(struct lxc_container *c, char *snappath);
119 static bool lxcapi_snapshot_destroy_all(struct lxc_container *c);
120 static bool do_lxcapi_save_config(struct lxc_container *c, const char *alt_file);
121
122 static bool config_file_exists(const char *lxcpath, const char *cname)
123 {
124 __do_free char *fname = NULL;
125 int ret;
126 size_t len;
127
128 /* $lxcpath + '/' + $cname + '/config' + \0 */
129 len = strlen(lxcpath) + strlen(cname) + 9;
130 fname = must_realloc(NULL, len);
131 ret = snprintf(fname, len, "%s/%s/config", lxcpath, cname);
132 if (ret < 0 || (size_t)ret >= len)
133 return false;
134
135 return file_exists(fname);
136 }
137
138 /* A few functions to help detect when a container creation failed. If a
139 * container creation was killed partway through, then trying to actually start
140 * that container could harm the host. We detect this by creating a 'partial'
141 * file under the container directory, and keeping an advisory lock. When
142 * container creation completes, we remove that file. When we load or try to
143 * start a container, if we find that file, without a flock, we remove the
144 * container.
145 */
146 static int ongoing_create(struct lxc_container *c)
147 {
148 __do_free char *path = NULL;
149 int fd, ret;
150 size_t len;
151 struct flock lk = {0};
152
153 len = strlen(c->config_path) + strlen(c->name) + 10;
154 path = must_realloc(NULL, len);
155 ret = snprintf(path, len, "%s/%s/partial", c->config_path, c->name);
156 if (ret < 0 || (size_t)ret >= len)
157 return -1;
158
159 fd = open(path, O_RDWR | O_CLOEXEC);
160 if (fd < 0) {
161 if (errno != ENOENT)
162 return -1;
163
164 return 0;
165 }
166
167 lk.l_type = F_WRLCK;
168 lk.l_whence = SEEK_SET;
169 /* F_OFD_GETLK requires that l_pid be set to 0 otherwise the kernel
170 * will EINVAL us.
171 */
172 lk.l_pid = 0;
173
174 ret = fcntl(fd, F_OFD_GETLK, &lk);
175 if (ret < 0 && errno == EINVAL) {
176 ret = flock(fd, LOCK_EX | LOCK_NB);
177 if (ret < 0 && errno == EWOULDBLOCK)
178 ret = 0;
179 }
180
181 close(fd);
182
183 /* F_OFD_GETLK will not send us back a pid so don't check it. */
184 if (ret == 0)
185 /* Create is still ongoing. */
186 return 1;
187
188 /* Create completed but partial is still there. */
189 return 2;
190 }
191
192 static int create_partial(struct lxc_container *c)
193 {
194 __do_free char *path = NULL;
195 int fd, ret;
196 size_t len;
197 struct flock lk = {0};
198
199 /* $lxcpath + '/' + $name + '/partial' + \0 */
200 len = strlen(c->config_path) + strlen(c->name) + 10;
201 path = must_realloc(NULL, len);
202 ret = snprintf(path, len, "%s/%s/partial", c->config_path, c->name);
203 if (ret < 0 || (size_t)ret >= len)
204 return -1;
205
206 fd = open(path, O_RDWR | O_CREAT | O_EXCL | O_CLOEXEC, 0000);
207 if (fd < 0)
208 return -1;
209
210 lk.l_type = F_WRLCK;
211 lk.l_whence = SEEK_SET;
212
213 ret = fcntl(fd, F_OFD_SETLKW, &lk);
214 if (ret < 0) {
215 if (errno == EINVAL) {
216 ret = flock(fd, LOCK_EX);
217 if (ret == 0)
218 return fd;
219 }
220
221 SYSERROR("Failed to lock partial file %s", path);
222 close(fd);
223 return -1;
224 }
225
226 return fd;
227 }
228
229 static void remove_partial(struct lxc_container *c, int fd)
230 {
231 __do_free char *path = NULL;
232 int ret;
233 size_t len;
234
235 close(fd);
236
237 /* $lxcpath + '/' + $name + '/partial' + \0 */
238 len = strlen(c->config_path) + strlen(c->name) + 10;
239 path = must_realloc(NULL, len);
240 ret = snprintf(path, len, "%s/%s/partial", c->config_path, c->name);
241 if (ret < 0 || (size_t)ret >= len)
242 return;
243
244 ret = unlink(path);
245 if (ret < 0)
246 SYSERROR("Failed to remove partial file %s", path);
247 }
248
249 /* LOCKING
250 * 1. container_mem_lock(c) protects the struct lxc_container from multiple threads.
251 * 2. container_disk_lock(c) protects the on-disk container data - in particular the
252 * container configuration file.
253 * The container_disk_lock also takes the container_mem_lock.
254 * 3. thread_mutex protects process data (ex: fd table) from multiple threads.
255 * NOTHING mutexes two independent programs with their own struct
256 * lxc_container for the same c->name, between API calls. For instance,
257 * c->config_read(); c->start(); Between those calls, data on disk
258 * could change (which shouldn't bother the caller unless for instance
259 * the rootfs get moved). c->config_read(); update; c->config_write();
260 * Two such updaters could race. The callers should therefore check their
261 * results. Trying to prevent that would necessarily expose us to deadlocks
262 * due to hung callers. So I prefer to keep the locks only within our own
263 * functions, not across functions.
264 *
265 * If you're going to clone while holding a lxccontainer, increment
266 * c->numthreads (under privlock) before forking. When deleting,
267 * decrement numthreads under privlock, then if it hits 0 you can delete.
268 * Do not ever use a lxccontainer whose numthreads you did not bump.
269 */
270 static void lxc_container_free(struct lxc_container *c)
271 {
272 if (!c)
273 return;
274
275 free(c->configfile);
276 c->configfile = NULL;
277
278 free(c->error_string);
279 c->error_string = NULL;
280
281 if (c->slock) {
282 lxc_putlock(c->slock);
283 c->slock = NULL;
284 }
285
286 if (c->privlock) {
287 lxc_putlock(c->privlock);
288 c->privlock = NULL;
289 }
290
291 free(c->name);
292 c->name = NULL;
293
294 if (c->lxc_conf) {
295 lxc_conf_free(c->lxc_conf);
296 c->lxc_conf = NULL;
297 }
298
299 free(c->config_path);
300 c->config_path = NULL;
301
302 free(c);
303 }
304
305 /* Consider the following case:
306 *
307 * |====================================================================|
308 * | freer | racing get()er |
309 * |====================================================================|
310 * | lxc_container_put() | lxc_container_get() |
311 * | \ lxclock(c->privlock) | c->numthreads < 1? (no) |
312 * | \ c->numthreads = 0 | \ lxclock(c->privlock) -> waits |
313 * | \ lxcunlock() | \ |
314 * | \ lxc_container_free() | \ lxclock() returns |
315 * | | \ c->numthreads < 1 -> return 0 |
316 * | \ \ (free stuff) | |
317 * | \ \ sem_destroy(privlock) | |
318 * |_______________________________|____________________________________|
319 *
320 * When the get()er checks numthreads the first time, one of the following
321 * is true:
322 * 1. freer has set numthreads = 0. get() returns 0
323 * 2. freer is between lxclock and setting numthreads to 0. get()er will
324 * sem_wait on privlock, get lxclock after freer() drops it, then see
325 * numthreads is 0 and exit without touching lxclock again..
326 * 3. freer has not yet locked privlock. If get()er runs first, then put()er
327 * will see --numthreads = 1 and not call lxc_container_free().
328 */
329
330 int lxc_container_get(struct lxc_container *c)
331 {
332 if (!c)
333 return 0;
334
335 /* If someone else has already started freeing the container, don't try
336 * to take the lock, which may be invalid.
337 */
338 if (c->numthreads < 1)
339 return 0;
340
341 if (container_mem_lock(c))
342 return 0;
343
344 /* Bail without trying to unlock, bc the privlock is now probably in
345 * freed memory.
346 */
347 if (c->numthreads < 1)
348 return 0;
349
350 c->numthreads++;
351 container_mem_unlock(c);
352
353 return 1;
354 }
355
356 int lxc_container_put(struct lxc_container *c)
357 {
358 if (!c)
359 return -1;
360
361 if (container_mem_lock(c))
362 return -1;
363
364 c->numthreads--;
365
366 if (c->numthreads < 1) {
367 container_mem_unlock(c);
368 lxc_container_free(c);
369 return 1;
370 }
371
372 container_mem_unlock(c);
373 return 0;
374 }
375
376 static bool do_lxcapi_is_defined(struct lxc_container *c)
377 {
378 int statret;
379 struct stat statbuf;
380 bool ret = false;
381
382 if (!c)
383 return false;
384
385 if (container_mem_lock(c))
386 return false;
387
388 if (!c->configfile)
389 goto on_error;
390
391 statret = stat(c->configfile, &statbuf);
392 if (statret != 0)
393 goto on_error;
394
395 ret = true;
396
397 on_error:
398 container_mem_unlock(c);
399 return ret;
400 }
401
/*
 * WRAP_API(rettype, fnname) - define `static rettype fnname(c)` as a wrapper
 * around `do_##fnname(c)`.
 *
 * If current_config is unset and the container has an lxc_conf, the wrapper
 * installs c->lxc_conf as current_config for the duration of the call and
 * resets it to NULL afterwards. An already set current_config is left alone.
 */
#define WRAP_API(rettype, fnname) \
static rettype fnname(struct lxc_container *c) \
{ \
	rettype ret; \
	bool reset_config = !current_config && c && c->lxc_conf; \
 \
	if (reset_config) \
		current_config = c->lxc_conf; \
 \
	ret = do_##fnname(c); \
 \
	if (reset_config) \
		current_config = NULL; \
 \
	return ret; \
}
419
/*
 * WRAP_API_1(rettype, fnname, t1) - one-argument variant of the API wrapper:
 * defines `static rettype fnname(c, a1)` forwarding to `do_##fnname(c, a1)`.
 *
 * current_config is set to c->lxc_conf around the call only if it was unset
 * and the container has an lxc_conf; in that case it is reset to NULL after
 * the call.
 */
#define WRAP_API_1(rettype, fnname, t1) \
static rettype fnname(struct lxc_container *c, t1 a1) \
{ \
	rettype ret; \
	bool reset_config = !current_config && c && c->lxc_conf; \
 \
	if (reset_config) \
		current_config = c->lxc_conf; \
 \
	ret = do_##fnname(c, a1); \
 \
	if (reset_config) \
		current_config = NULL; \
 \
	return ret; \
}
437
/*
 * WRAP_API_2(rettype, fnname, t1, t2) - two-argument variant of the API
 * wrapper: defines `static rettype fnname(c, a1, a2)` forwarding to
 * `do_##fnname(c, a1, a2)`.
 *
 * current_config is set to c->lxc_conf around the call only if it was unset
 * and the container has an lxc_conf; in that case it is reset to NULL after
 * the call.
 */
#define WRAP_API_2(rettype, fnname, t1, t2) \
static rettype fnname(struct lxc_container *c, t1 a1, t2 a2) \
{ \
	rettype ret; \
	bool reset_config = !current_config && c && c->lxc_conf; \
 \
	if (reset_config) \
		current_config = c->lxc_conf; \
 \
	ret = do_##fnname(c, a1, a2); \
 \
	if (reset_config) \
		current_config = NULL; \
 \
	return ret; \
}
455
/*
 * WRAP_API_3(rettype, fnname, t1, t2, t3) - three-argument variant of the
 * API wrapper: defines `static rettype fnname(c, a1, a2, a3)` forwarding to
 * `do_##fnname(c, a1, a2, a3)`.
 *
 * current_config is set to c->lxc_conf around the call only if it was unset
 * and the container has an lxc_conf; in that case it is reset to NULL after
 * the call.
 */
#define WRAP_API_3(rettype, fnname, t1, t2, t3) \
static rettype fnname(struct lxc_container *c, t1 a1, t2 a2, t3 a3) \
{ \
	rettype ret; \
	bool reset_config = !current_config && c && c->lxc_conf; \
 \
	if (reset_config) \
		current_config = c->lxc_conf; \
 \
	ret = do_##fnname(c, a1, a2, a3); \
 \
	if (reset_config) \
		current_config = NULL; \
 \
	return ret; \
}
473
/*
 * WRAP_API_6(rettype, fnname, t1..t6) - six-argument variant of the API
 * wrapper: defines `static rettype fnname(c, a1, ..., a6)` forwarding to
 * `do_##fnname(c, a1, ..., a6)`.
 *
 * current_config is set to c->lxc_conf around the call only if it was unset
 * and the container has an lxc_conf; in that case it is reset to NULL after
 * the call.
 */
#define WRAP_API_6(rettype, fnname, t1, t2, t3, t4, t5, t6) \
static rettype fnname(struct lxc_container *c, t1 a1, t2 a2, t3 a3, \
		      t4 a4, t5 a5, t6 a6) \
{ \
	rettype ret; \
	bool reset_config = !current_config && c && c->lxc_conf; \
 \
	if (reset_config) \
		current_config = c->lxc_conf; \
 \
	ret = do_##fnname(c, a1, a2, a3, a4, a5, a6); \
 \
	if (reset_config) \
		current_config = NULL; \
 \
	return ret; \
}
492
493 WRAP_API(bool, lxcapi_is_defined)
494
495 static const char *do_lxcapi_state(struct lxc_container *c)
496 {
497 lxc_state_t s;
498
499 if (!c)
500 return NULL;
501
502 s = lxc_getstate(c->name, c->config_path);
503 return lxc_state2str(s);
504 }
505
506 WRAP_API(const char *, lxcapi_state)
507
508 static bool is_stopped(struct lxc_container *c)
509 {
510 lxc_state_t s;
511
512 s = lxc_getstate(c->name, c->config_path);
513 return (s == STOPPED);
514 }
515
/*
 * A container counts as running whenever it is in any state other than
 * STOPPED. Returns false for a NULL container.
 */
static bool do_lxcapi_is_running(struct lxc_container *c)
{
	if (c)
		return !is_stopped(c);

	return false;
}
523
524 WRAP_API(bool, lxcapi_is_running)
525
526 static bool do_lxcapi_freeze(struct lxc_container *c)
527 {
528 lxc_state_t s;
529
530 if (!c || !c->lxc_conf)
531 return false;
532
533 s = lxc_getstate(c->name, c->config_path);
534 if (s != FROZEN)
535 return lxc_freeze(c->lxc_conf, c->name, c->config_path) == 0;
536
537 return true;
538 }
539
540 WRAP_API(bool, lxcapi_freeze)
541
542 static bool do_lxcapi_unfreeze(struct lxc_container *c)
543 {
544 lxc_state_t s;
545
546 if (!c || !c->lxc_conf)
547 return false;
548
549 s = lxc_getstate(c->name, c->config_path);
550 if (s == FROZEN)
551 return lxc_unfreeze(c->lxc_conf, c->name, c->config_path) == 0;
552
553 return true;
554 }
555
556 WRAP_API(bool, lxcapi_unfreeze)
557
/*
 * Forward to lxc_terminal_getfd() with the caller's @ttynum and @masterfd
 * pointers. Returns -1 when @c is NULL, otherwise whatever
 * lxc_terminal_getfd() returns.
 */
static int do_lxcapi_console_getfd(struct lxc_container *c, int *ttynum, int *masterfd)
{
	return c ? lxc_terminal_getfd(c, ttynum, masterfd) : -1;
}
565
566 WRAP_API_2(int, lxcapi_console_getfd, int *, int *)
567
568 static int lxcapi_console(struct lxc_container *c, int ttynum, int stdinfd,
569 int stdoutfd, int stderrfd, int escape)
570 {
571 int ret;
572
573 if (!c)
574 return -1;
575
576 current_config = c->lxc_conf;
577 ret = lxc_console(c, ttynum, stdinfd, stdoutfd, stderrfd, escape);
578 current_config = NULL;
579
580 return ret;
581 }
582
583 static int do_lxcapi_console_log(struct lxc_container *c, struct lxc_console_log *log)
584 {
585 int ret;
586
587 if (!c)
588 return -EINVAL;
589
590 ret = lxc_cmd_console_log(c->name, do_lxcapi_get_config_path(c), log);
591 if (ret < 0) {
592 if (ret == -ENODATA)
593 NOTICE("The console log is empty");
594 else if (ret == -EFAULT)
595 NOTICE("The container does not keep a console log");
596 else if (ret == -ENOENT)
597 NOTICE("The container does not keep a console log file");
598 else if (ret == -EIO)
599 NOTICE("Failed to write console log to log file");
600 else
601 ERROR("Failed to retrieve console log");
602 }
603
604 return ret;
605 }
606
607 WRAP_API_1(int, lxcapi_console_log, struct lxc_console_log *)
608
609 static pid_t do_lxcapi_init_pid(struct lxc_container *c)
610 {
611 if (!c)
612 return -1;
613
614 return lxc_cmd_get_init_pid(c->name, c->config_path);
615 }
616
617 WRAP_API(pid_t, lxcapi_init_pid)
618
619 static bool load_config_locked(struct lxc_container *c, const char *fname)
620 {
621 if (!c->lxc_conf)
622 c->lxc_conf = lxc_conf_init();
623
624 if (!c->lxc_conf)
625 return false;
626
627 if (lxc_config_read(fname, c->lxc_conf, false) != 0)
628 return false;
629
630 c->lxc_conf->name = c->name;
631 return true;
632 }
633
634 static bool do_lxcapi_load_config(struct lxc_container *c, const char *alt_file)
635 {
636 int lret;
637 const char *fname;
638 bool need_disklock = false, ret = false;
639
640 if (!c)
641 return false;
642
643 fname = c->configfile;
644
645 if (alt_file)
646 fname = alt_file;
647
648 if (!fname)
649 return false;
650
651 /* If we're reading something other than the container's config, we only
652 * need to lock the in-memory container. If loading the container's
653 * config file, take the disk lock.
654 */
655 if (strcmp(fname, c->configfile) == 0)
656 need_disklock = true;
657
658 if (need_disklock)
659 lret = container_disk_lock(c);
660 else
661 lret = container_mem_lock(c);
662 if (lret)
663 return false;
664
665 ret = load_config_locked(c, fname);
666
667 if (need_disklock)
668 container_disk_unlock(c);
669 else
670 container_mem_unlock(c);
671
672 return ret;
673 }
674
675 WRAP_API_1(bool, lxcapi_load_config, const char *)
676
677 static bool do_lxcapi_want_daemonize(struct lxc_container *c, bool state)
678 {
679 if (!c || !c->lxc_conf)
680 return false;
681
682 if (container_mem_lock(c))
683 return false;
684
685 c->daemonize = state;
686
687 container_mem_unlock(c);
688
689 return true;
690 }
691
692 WRAP_API_1(bool, lxcapi_want_daemonize, bool)
693
694 static bool do_lxcapi_want_close_all_fds(struct lxc_container *c, bool state)
695 {
696 if (!c || !c->lxc_conf)
697 return false;
698
699 if (container_mem_lock(c))
700 return false;
701
702 c->lxc_conf->close_all_fds = state;
703
704 container_mem_unlock(c);
705
706 return true;
707 }
708
709 WRAP_API_1(bool, lxcapi_want_close_all_fds, bool)
710
711 static bool do_lxcapi_wait(struct lxc_container *c, const char *state,
712 int timeout)
713 {
714 int ret;
715
716 if (!c)
717 return false;
718
719 ret = lxc_wait(c->name, state, timeout, c->config_path);
720 return ret == 0;
721 }
722
723 WRAP_API_2(bool, lxcapi_wait, const char *, int)
724
/*
 * Determine whether the calling process has exactly one task by counting
 * the entries of /proc/self/task (ignoring "." and "..").
 *
 * Counting stops as soon as a second entry is seen. Returns false if the
 * directory cannot be opened.
 */
static bool am_single_threaded(void)
{
	DIR *tasks;
	struct dirent *entry;
	int ntasks = 0;

	tasks = opendir("/proc/self/task");
	if (!tasks)
		return false;

	while (ntasks < 2 && (entry = readdir(tasks)) != NULL) {
		if (strcmp(entry->d_name, ".") != 0 &&
		    strcmp(entry->d_name, "..") != 0)
			ntasks++;
	}

	closedir(tasks);

	return ntasks == 1;
}
750
/*
 * Append a copy of @arg to the NULL-terminated vector *@argp.
 *
 * @argp:  address of the vector; updated to the reallocated vector.
 * @arg:   string to duplicate with must_copy_string().
 * @nargs: address of the current element count; incremented by one.
 *
 * realloc() is retried until it succeeds, so this function does not report
 * allocation failure.
 */
static void push_arg(char ***argp, char *arg, int *nargs)
{
	char *dup = must_copy_string(arg);
	char **grown = NULL;
	int idx = *nargs;

	/* Room for the new element plus the terminating NULL. */
	while (!grown)
		grown = realloc(*argp, (idx + 2) * sizeof(char *));

	grown[idx] = dup;
	grown[idx + 1] = NULL;

	*argp = grown;
	*nargs = idx + 1;
}
767
768 static char **split_init_cmd(const char *incmd)
769 {
770 __do_free char *copy = NULL;
771 char *p;
772 char **argv;
773 int nargs = 0;
774
775 if (!incmd)
776 return NULL;
777
778 copy = must_copy_string(incmd);
779
780 do {
781 argv = malloc(sizeof(char *));
782 } while (!argv);
783
784 argv[0] = NULL;
785 lxc_iterate_parts (p, copy, " ")
786 push_arg(&argv, p, &nargs);
787
788 if (nargs == 0) {
789 free(argv);
790 return NULL;
791 }
792
793 return argv;
794 }
795
/*
 * Free a NULL-terminated argument vector: every element up to the
 * terminating NULL, then the vector itself. A NULL vector is ignored.
 */
static void free_init_cmd(char **argv)
{
	char **cur;

	if (!argv)
		return;

	for (cur = argv; *cur; cur++)
		free(*cur);

	free(argv);
}
808
/*
 * Receive the container state (an int) from @state_socket.
 *
 * The receive is retried only when it reports failure with errno == EINTR.
 *
 * Returns the received state if the receive call returned a positive value,
 * and -1 otherwise.
 */
static int lxc_rcv_status(int state_socket)
{
	int ret;
	int state = -1;

	for (;;) {
		/* Receive container state. */
		ret = lxc_abstract_unix_rcv_credential(state_socket, &state, sizeof(int));
		if (ret > 0)
			return state;

		/* errno is only meaningful when the call reported an error. A
		 * return of 0 is presumably end-of-stream and leaves errno
		 * untouched, so a stale EINTR must not trigger an endless
		 * retry loop.
		 */
		if (ret < 0 && errno == EINTR) {
			TRACE("Caught EINTR; retrying");
			continue;
		}

		return -1;
	}
}
827
828 static bool wait_on_daemonized_start(struct lxc_handler *handler, int pid)
829 {
830 int ret, state;
831
832 /* Close write end of the socket pair. */
833 close(handler->state_socket_pair[1]);
834 handler->state_socket_pair[1] = -1;
835
836 state = lxc_rcv_status(handler->state_socket_pair[0]);
837
838 /* Close read end of the socket pair. */
839 close(handler->state_socket_pair[0]);
840 handler->state_socket_pair[0] = -1;
841
842 /* The first child is going to fork() again and then exits. So we reap
843 * the first child here.
844 */
845 ret = wait_for_pid(pid);
846 if (ret < 0)
847 DEBUG("Failed waiting on first child %d", pid);
848 else
849 DEBUG("First child %d exited", pid);
850
851 if (state < 0) {
852 SYSERROR("Failed to receive the container state");
853 return false;
854 }
855
856 /* If we receive anything else then running we know that the container
857 * failed to start.
858 */
859 if (state != RUNNING) {
860 ERROR("Received container state \"%s\" instead of \"RUNNING\"",
861 lxc_state2str(state));
862 return false;
863 }
864
865 TRACE("Container is in \"RUNNING\" state");
866 return true;
867 }
868
869 static bool do_lxcapi_start(struct lxc_container *c, int useinit, char * const argv[])
870 {
871 int ret;
872 struct lxc_handler *handler;
873 struct lxc_conf *conf;
874 char *default_args[] = {
875 "/sbin/init",
876 NULL,
877 };
878 char **init_cmd = NULL;
879 int keepfds[3] = {-1, -1, -1};
880
881 /* container does exist */
882 if (!c)
883 return false;
884
885 /* If anything fails before we set error_num, we want an error in there.
886 */
887 c->error_num = 1;
888
889 /* Container has not been setup. */
890 if (!c->lxc_conf)
891 return false;
892
893 ret = ongoing_create(c);
894 if (ret < 0) {
895 ERROR("Failed checking for incomplete container creation");
896 return false;
897 } else if (ret == 1) {
898 ERROR("Ongoing container creation detected");
899 return false;
900 } else if (ret == 2) {
901 ERROR("Failed to create container");
902 do_lxcapi_destroy(c);
903 return false;
904 }
905
906 if (container_mem_lock(c))
907 return false;
908
909 conf = c->lxc_conf;
910
911 /* initialize handler */
912 handler = lxc_init_handler(c->name, conf, c->config_path, c->daemonize);
913
914 container_mem_unlock(c);
915 if (!handler)
916 return false;
917
918 if (!argv) {
919 if (useinit && conf->execute_cmd)
920 argv = init_cmd = split_init_cmd(conf->execute_cmd);
921 else
922 argv = init_cmd = split_init_cmd(conf->init_cmd);
923 }
924
925 /* ... otherwise use default_args. */
926 if (!argv) {
927 if (useinit) {
928 ERROR("No valid init detected");
929 lxc_free_handler(handler);
930 return false;
931 }
932 argv = default_args;
933 }
934
935 /* I'm not sure what locks we want here.Any? Is liblxc's locking enough
936 * here to protect the on disk container? We don't want to exclude
937 * things like lxc_info while the container is running.
938 */
939 if (c->daemonize) {
940 bool started;
941 char title[2048];
942 pid_t pid;
943
944 pid = fork();
945 if (pid < 0) {
946 free_init_cmd(init_cmd);
947 lxc_free_handler(handler);
948 return false;
949 }
950
951 /* first parent */
952 if (pid != 0) {
953 /* Set to NULL because we don't want father unlink
954 * the PID file, child will do the free and unlink.
955 */
956 c->pidfile = NULL;
957
958 /* Wait for container to tell us whether it started
959 * successfully.
960 */
961 started = wait_on_daemonized_start(handler, pid);
962
963 free_init_cmd(init_cmd);
964 lxc_free_handler(handler);
965 return started;
966 }
967
968 /* first child */
969
970 /* We don't really care if this doesn't print all the
971 * characters. All that it means is that the proctitle will be
972 * ugly. Similarly, we also don't care if setproctitle() fails.
973 */
974 ret = snprintf(title, sizeof(title), "[lxc monitor] %s %s", c->config_path, c->name);
975 if (ret > 0) {
976 ret = setproctitle(title);
977 if (ret < 0)
978 INFO("Failed to set process title to %s", title);
979 else
980 INFO("Set process title to %s", title);
981 }
982
983 /* We fork() a second time to be reparented to init. Like
984 * POSIX's daemon() function we change to "/" and redirect
985 * std{in,out,err} to /dev/null.
986 */
987 pid = fork();
988 if (pid < 0) {
989 SYSERROR("Failed to fork first child process");
990 _exit(EXIT_FAILURE);
991 }
992
993 /* second parent */
994 if (pid != 0) {
995 free_init_cmd(init_cmd);
996 lxc_free_handler(handler);
997 _exit(EXIT_SUCCESS);
998 }
999
1000 /* second child */
1001
1002 /* change to / directory */
1003 ret = chdir("/");
1004 if (ret < 0) {
1005 SYSERROR("Failed to change to \"/\" directory");
1006 _exit(EXIT_FAILURE);
1007 }
1008
1009 keepfds[0] = handler->conf->maincmd_fd;
1010 keepfds[1] = handler->state_socket_pair[0];
1011 keepfds[2] = handler->state_socket_pair[1];
1012 ret = lxc_check_inherited(conf, true, keepfds,
1013 sizeof(keepfds) / sizeof(keepfds[0]));
1014 if (ret < 0)
1015 _exit(EXIT_FAILURE);
1016
1017 /* redirect std{in,out,err} to /dev/null */
1018 ret = null_stdfds();
1019 if (ret < 0) {
1020 ERROR("Failed to redirect std{in,out,err} to /dev/null");
1021 _exit(EXIT_FAILURE);
1022 }
1023
1024 /* become session leader */
1025 ret = setsid();
1026 if (ret < 0)
1027 TRACE("Process %d is already process group leader", lxc_raw_getpid());
1028 } else if (!am_single_threaded()) {
1029 ERROR("Cannot start non-daemonized container when threaded");
1030 free_init_cmd(init_cmd);
1031 lxc_free_handler(handler);
1032 return false;
1033 }
1034
1035 /* We need to write PID file after daemonize, so we always write the
1036 * right PID.
1037 */
1038 if (c->pidfile) {
1039 int w;
1040 char pidstr[INTTYPE_TO_STRLEN(pid_t)];
1041
1042 w = snprintf(pidstr, sizeof(pidstr), "%d", lxc_raw_getpid());
1043 if (w < 0 || (size_t)w >= sizeof(pidstr)) {
1044 free_init_cmd(init_cmd);
1045 lxc_free_handler(handler);
1046
1047 SYSERROR("Failed to write monitor pid to \"%s\"", c->pidfile);
1048
1049 if (c->daemonize)
1050 _exit(EXIT_FAILURE);
1051
1052 return false;
1053 }
1054
1055 ret = lxc_write_to_file(c->pidfile, pidstr, w, false, 0600);
1056 if (ret < 0) {
1057 free_init_cmd(init_cmd);
1058 lxc_free_handler(handler);
1059
1060 SYSERROR("Failed to write monitor pid to \"%s\"", c->pidfile);
1061
1062 if (c->daemonize)
1063 _exit(EXIT_FAILURE);
1064
1065 return false;
1066 }
1067 }
1068
1069 conf->reboot = REBOOT_NONE;
1070
1071 /* Unshare the mount namespace if requested */
1072 if (conf->monitor_unshare) {
1073 ret = unshare(CLONE_NEWNS);
1074 if (ret < 0) {
1075 SYSERROR("Failed to unshare mount namespace");
1076 lxc_free_handler(handler);
1077 ret = 1;
1078 goto on_error;
1079 }
1080
1081 ret = mount(NULL, "/", NULL, MS_SLAVE|MS_REC, NULL);
1082 if (ret < 0) {
1083 SYSERROR("Failed to make / rslave at startup");
1084 lxc_free_handler(handler);
1085 ret = 1;
1086 goto on_error;
1087 }
1088 }
1089
1090 reboot:
1091 if (conf->reboot == REBOOT_INIT) {
1092 /* initialize handler */
1093 handler = lxc_init_handler(c->name, conf, c->config_path, c->daemonize);
1094 if (!handler) {
1095 ret = 1;
1096 goto on_error;
1097 }
1098 }
1099
1100 keepfds[0] = handler->conf->maincmd_fd;
1101 keepfds[1] = handler->state_socket_pair[0];
1102 keepfds[2] = handler->state_socket_pair[1];
1103 ret = lxc_check_inherited(conf, c->daemonize, keepfds,
1104 sizeof(keepfds) / sizeof(keepfds[0]));
1105 if (ret < 0) {
1106 lxc_free_handler(handler);
1107 ret = 1;
1108 goto on_error;
1109 }
1110
1111 if (useinit)
1112 ret = lxc_execute(c->name, argv, 1, handler, c->config_path,
1113 c->daemonize, &c->error_num);
1114 else
1115 ret = lxc_start(c->name, argv, handler, c->config_path,
1116 c->daemonize, &c->error_num);
1117
1118 if (conf->reboot == REBOOT_REQ) {
1119 INFO("Container requested reboot");
1120 conf->reboot = REBOOT_INIT;
1121 goto reboot;
1122 }
1123
1124 on_error:
1125 if (c->pidfile) {
1126 unlink(c->pidfile);
1127 free(c->pidfile);
1128 c->pidfile = NULL;
1129 }
1130 free_init_cmd(init_cmd);
1131
1132 if (c->daemonize && ret != 0)
1133 _exit(EXIT_FAILURE);
1134 else if (c->daemonize)
1135 _exit(EXIT_SUCCESS);
1136
1137 if (ret != 0)
1138 return false;
1139
1140 return true;
1141 }
1142
1143 static bool lxcapi_start(struct lxc_container *c, int useinit,
1144 char *const argv[])
1145 {
1146 bool ret;
1147
1148 current_config = c ? c->lxc_conf : NULL;
1149 ret = do_lxcapi_start(c, useinit, argv);
1150 current_config = NULL;
1151
1152 return ret;
1153 }
1154
1155 /* Note, there MUST be an ending NULL. */
1156 static bool lxcapi_startl(struct lxc_container *c, int useinit, ...)
1157 {
1158 va_list ap;
1159 char **inargs = NULL;
1160 bool bret = false;
1161
1162 /* container exists */
1163 if (!c)
1164 return false;
1165
1166 current_config = c->lxc_conf;
1167
1168 va_start(ap, useinit);
1169 inargs = lxc_va_arg_list_to_argv(ap, 0, 1);
1170 va_end(ap);
1171 if (!inargs)
1172 goto on_error;
1173
1174 /* pass NULL if no arguments were supplied */
1175 bret = do_lxcapi_start(c, useinit, *inargs ? inargs : NULL);
1176
1177 on_error:
1178 if (inargs) {
1179 char **arg;
1180
1181 for (arg = inargs; *arg; arg++)
1182 free(*arg);
1183 free(inargs);
1184 }
1185
1186 current_config = NULL;
1187
1188 return bret;
1189 }
1190
1191 static bool do_lxcapi_stop(struct lxc_container *c)
1192 {
1193 int ret;
1194
1195 if (!c)
1196 return false;
1197
1198 ret = lxc_cmd_stop(c->name, c->config_path);
1199
1200 return ret == 0;
1201 }
1202
1203 WRAP_API(bool, lxcapi_stop)
1204
1205 static int do_create_container_dir(const char *path, struct lxc_conf *conf)
1206 {
1207 __do_free char *p = NULL;
1208 int lasterr;
1209 int ret = -1;
1210
1211 mode_t mask = umask(0002);
1212 ret = mkdir(path, 0770);
1213 lasterr = errno;
1214 umask(mask);
1215 errno = lasterr;
1216 if (ret) {
1217 if (errno != EEXIST)
1218 return -1;
1219
1220 ret = 0;
1221 }
1222
1223 p = must_copy_string(path);
1224
1225 if (!lxc_list_empty(&conf->id_map)) {
1226 ret = chown_mapped_root(p, conf);
1227 if (ret < 0)
1228 ret = -1;
1229 }
1230
1231 return ret;
1232 }
1233
1234 /* Create the standard expected container dir. */
1235 static bool create_container_dir(struct lxc_container *c)
1236 {
1237 int ret;
1238 size_t len;
1239 char *s;
1240
1241 len = strlen(c->config_path) + strlen(c->name) + 2;
1242 s = malloc(len);
1243 if (!s)
1244 return false;
1245
1246 ret = snprintf(s, len, "%s/%s", c->config_path, c->name);
1247 if (ret < 0 || (size_t)ret >= len) {
1248 free(s);
1249 return false;
1250 }
1251
1252 ret = do_create_container_dir(s, c->lxc_conf);
1253 free(s);
1254
1255 return ret == 0;
1256 }
1257
1258 /* do_storage_create: thin wrapper around storage_create(). Like
1259 * storage_create(), it returns a mounted bdev on success, NULL on error.
1260 */
1261 static struct lxc_storage *do_storage_create(struct lxc_container *c,
1262 const char *type,
1263 struct bdev_specs *specs)
1264 {
1265 __do_free char *dest = NULL;
1266 int ret;
1267 size_t len;
1268 struct lxc_storage *bdev;
1269
1270 /* rootfs.path or lxcpath/lxcname/rootfs */
1271 if (c->lxc_conf->rootfs.path &&
1272 (access(c->lxc_conf->rootfs.path, F_OK) == 0)) {
1273 const char *rpath = c->lxc_conf->rootfs.path;
1274 len = strlen(rpath) + 1;
1275 dest = must_realloc(NULL, len);
1276 ret = snprintf(dest, len, "%s", rpath);
1277 } else {
1278 const char *lxcpath = do_lxcapi_get_config_path(c);
1279 len = strlen(c->name) + strlen(lxcpath) + 9;
1280 dest = must_realloc(NULL, len);
1281 ret = snprintf(dest, len, "%s/%s/rootfs", lxcpath, c->name);
1282 }
1283 if (ret < 0 || (size_t)ret >= len)
1284 return NULL;
1285
1286 bdev = storage_create(dest, type, c->name, specs);
1287 if (!bdev) {
1288 ERROR("Failed to create \"%s\" storage", type);
1289 return NULL;
1290 }
1291
1292 if (!c->set_config_item(c, "lxc.rootfs.path", bdev->src)) {
1293 ERROR("Failed to set \"lxc.rootfs.path = %s\"", bdev->src);
1294 return NULL;
1295 }
1296
1297 /* If we are not root, chown the rootfs dir to root in the target user
1298 * namespace.
1299 */
1300 ret = geteuid();
1301 if (ret != 0 || (c->lxc_conf && !lxc_list_empty(&c->lxc_conf->id_map))) {
1302 ret = chown_mapped_root(bdev->dest, c->lxc_conf);
1303 if (ret < 0) {
1304 ERROR("Error chowning \"%s\" to container root", bdev->dest);
1305 suggest_default_idmap();
1306 storage_put(bdev);
1307 return NULL;
1308 }
1309 }
1310
1311 return bdev;
1312 }
1313
/* Return a pointer into @path at its last '/' character. The returned string
 * therefore still starts with that '/'. When no '/' is found after the first
 * character, or when @path is empty, @path itself is returned.
 *
 * @path must be a valid NUL-terminated string; nothing is allocated.
 */
static char *lxcbasename(char *path)
{
	size_t len = strlen(path);
	char *p;

	/* An empty string has no last character to start scanning from. */
	if (len == 0)
		return path;

	p = path + len - 1;
	while (p > path && *p != '/')
		p--;

	return p;
}
1324
1325 static bool create_run_template(struct lxc_container *c, char *tpath,
1326 bool need_null_stdfds, char *const argv[])
1327 {
1328 int ret;
1329 pid_t pid;
1330
1331 if (!tpath)
1332 return true;
1333
1334 pid = fork();
1335 if (pid < 0) {
1336 SYSERROR("Failed to fork task for container creation template");
1337 return false;
1338 }
1339
1340 if (pid == 0) { /* child */
1341 int i, len;
1342 char *namearg, *patharg, *rootfsarg;
1343 char **newargv;
1344 int nargs = 0;
1345 struct lxc_storage *bdev = NULL;
1346 struct lxc_conf *conf = c->lxc_conf;
1347 uid_t euid;
1348
1349 if (need_null_stdfds) {
1350 ret = null_stdfds();
1351 if (ret < 0)
1352 _exit(EXIT_FAILURE);
1353 }
1354
1355 bdev = storage_init(c->lxc_conf);
1356 if (!bdev) {
1357 ERROR("Failed to initialize storage");
1358 _exit(EXIT_FAILURE);
1359 }
1360
1361 euid = geteuid();
1362 if (euid == 0) {
1363 ret = unshare(CLONE_NEWNS);
1364 if (ret < 0) {
1365 ERROR("Failed to unshare CLONE_NEWNS");
1366 _exit(EXIT_FAILURE);
1367 }
1368
1369 ret = detect_shared_rootfs();
1370 if (ret == 1) {
1371 ret = mount(NULL, "/", NULL, MS_SLAVE | MS_REC, NULL);
1372 if (ret < 0) {
1373 SYSERROR("Failed to make \"/\" rslave");
1374 ERROR("Continuing...");
1375 }
1376 }
1377 }
1378
1379 if (strcmp(bdev->type, "dir") != 0 && strcmp(bdev->type, "btrfs") != 0) {
1380 if (euid != 0) {
1381 ERROR("Unprivileged users can only create "
1382 "btrfs and directory-backed containers");
1383 _exit(EXIT_FAILURE);
1384 }
1385
1386 if (strcmp(bdev->type, "overlay") == 0 ||
1387 strcmp(bdev->type, "overlayfs") == 0) {
1388 /* If we create an overlay container we need to
1389 * rsync the contents into
1390 * <container-path>/<container-name>/rootfs.
1391 * However, the overlay mount function will
1392 * mount will mount
1393 * <container-path>/<container-name>/delta0
1394 * over
1395 * <container-path>/<container-name>/rootfs
1396 * which means we would rsync the rootfs into
1397 * the delta directory. That doesn't make sense
1398 * since the delta directory only exists to
1399 * record the differences to
1400 * <container-path>/<container-name>/rootfs. So
1401 * let's simply bind-mount here and then rsync
1402 * directly into
1403 * <container-path>/<container-name>/rootfs.
1404 */
1405 char *src;
1406
1407 src = ovl_get_rootfs(bdev->src, &(size_t){0});
1408 if (!src) {
1409 ERROR("Failed to get rootfs");
1410 _exit(EXIT_FAILURE);
1411 }
1412
1413 ret = mount(src, bdev->dest, "bind", MS_BIND | MS_REC, NULL);
1414 if (ret < 0) {
1415 ERROR("Failed to mount rootfs");
1416 _exit(EXIT_FAILURE);
1417 }
1418 } else {
1419 ret = bdev->ops->mount(bdev);
1420 if (ret < 0) {
1421 ERROR("Failed to mount rootfs");
1422 _exit(EXIT_FAILURE);
1423 }
1424 }
1425 } else { /* TODO come up with a better way here! */
1426 const char *src;
1427 free(bdev->dest);
1428 src = lxc_storage_get_path(bdev->src, bdev->type);
1429 bdev->dest = strdup(src);
1430 }
1431
1432 /* Create our new array, pre-pend the template name and base
1433 * args.
1434 */
1435 if (argv)
1436 for (nargs = 0; argv[nargs]; nargs++)
1437 ;
1438
1439 /* template, path, rootfs and name args */
1440 nargs += 4;
1441
1442 newargv = malloc(nargs * sizeof(*newargv));
1443 if (!newargv)
1444 _exit(EXIT_FAILURE);
1445 newargv[0] = lxcbasename(tpath);
1446
1447 /* --path */
1448 len = strlen(c->config_path) + strlen(c->name) + strlen("--path=") + 2;
1449 patharg = malloc(len);
1450 if (!patharg)
1451 _exit(EXIT_FAILURE);
1452
1453 ret = snprintf(patharg, len, "--path=%s/%s", c->config_path, c->name);
1454 if (ret < 0 || ret >= len)
1455 _exit(EXIT_FAILURE);
1456 newargv[1] = patharg;
1457
1458 /* --name */
1459 len = strlen("--name=") + strlen(c->name) + 1;
1460 namearg = malloc(len);
1461 if (!namearg)
1462 _exit(EXIT_FAILURE);
1463
1464 ret = snprintf(namearg, len, "--name=%s", c->name);
1465 if (ret < 0 || ret >= len)
1466 _exit(EXIT_FAILURE);
1467 newargv[2] = namearg;
1468
1469 /* --rootfs */
1470 len = strlen("--rootfs=") + 1 + strlen(bdev->dest);
1471 rootfsarg = malloc(len);
1472 if (!rootfsarg)
1473 _exit(EXIT_FAILURE);
1474
1475 ret = snprintf(rootfsarg, len, "--rootfs=%s", bdev->dest);
1476 if (ret < 0 || ret >= len)
1477 _exit(EXIT_FAILURE);
1478 newargv[3] = rootfsarg;
1479
1480 /* add passed-in args */
1481 if (argv)
1482 for (i = 4; i < nargs; i++)
1483 newargv[i] = argv[i - 4];
1484
1485 /* add trailing NULL */
1486 nargs++;
1487 newargv = realloc(newargv, nargs * sizeof(*newargv));
1488 if (!newargv)
1489 _exit(EXIT_FAILURE);
1490 newargv[nargs - 1] = NULL;
1491
1492 /* If we're running the template in a mapped userns, then we
1493 * prepend the template command with: lxc-usernsexec <-m map1>
1494 * ... <-m mapn> -- and we append "--mapped-uid x", where x is
1495 * the mapped uid for our geteuid()
1496 */
1497 if (!lxc_list_empty(&conf->id_map)) {
1498 int extraargs, hostuid_mapped, hostgid_mapped;
1499 char **n2;
1500 char txtuid[20], txtgid[20];
1501 struct lxc_list *it;
1502 struct id_map *map;
1503 int n2args = 1;
1504
1505 n2 = malloc(n2args * sizeof(*n2));
1506 if (!n2)
1507 _exit(EXIT_FAILURE);
1508
1509 newargv[0] = tpath;
1510 tpath = "lxc-usernsexec";
1511 n2[0] = "lxc-usernsexec";
1512
1513 lxc_list_for_each(it, &conf->id_map) {
1514 map = it->elem;
1515 n2args += 2;
1516 n2 = realloc(n2, n2args * sizeof(char *));
1517 if (!n2)
1518 _exit(EXIT_FAILURE);
1519
1520 n2[n2args - 2] = "-m";
1521 n2[n2args - 1] = malloc(200);
1522 if (!n2[n2args - 1])
1523 _exit(EXIT_FAILURE);
1524
1525 ret = snprintf(n2[n2args - 1], 200, "%c:%lu:%lu:%lu",
1526 map->idtype == ID_TYPE_UID ? 'u' : 'g',
1527 map->nsid, map->hostid, map->range);
1528 if (ret < 0 || ret >= 200)
1529 _exit(EXIT_FAILURE);
1530 }
1531
1532 hostuid_mapped = mapped_hostid(geteuid(), conf, ID_TYPE_UID);
1533 extraargs = hostuid_mapped >= 0 ? 1 : 3;
1534
1535 n2 = realloc(n2, (nargs + n2args + extraargs) * sizeof(char *));
1536 if (!n2)
1537 _exit(EXIT_FAILURE);
1538
1539 if (hostuid_mapped < 0) {
1540 hostuid_mapped = find_unmapped_nsid(conf, ID_TYPE_UID);
1541 n2[n2args++] = "-m";
1542 if (hostuid_mapped < 0) {
1543 ERROR("Failed to find free uid to map");
1544 _exit(EXIT_FAILURE);
1545 }
1546
1547 n2[n2args++] = malloc(200);
1548 if (!n2[n2args - 1]) {
1549 SYSERROR("out of memory");
1550 _exit(EXIT_FAILURE);
1551 }
1552
1553 ret = snprintf(n2[n2args - 1], 200, "u:%d:%d:1",
1554 hostuid_mapped, geteuid());
1555 if (ret < 0 || ret >= 200)
1556 _exit(EXIT_FAILURE);
1557 }
1558
1559 hostgid_mapped = mapped_hostid(getegid(), conf, ID_TYPE_GID);
1560 extraargs = hostgid_mapped >= 0 ? 1 : 3;
1561
1562 n2 = realloc(n2, (nargs + n2args + extraargs) * sizeof(char *));
1563 if (!n2)
1564 _exit(EXIT_FAILURE);
1565
1566 if (hostgid_mapped < 0) {
1567 hostgid_mapped = find_unmapped_nsid(conf, ID_TYPE_GID);
1568 n2[n2args++] = "-m";
1569 if (hostgid_mapped < 0) {
1570 ERROR("Failed to find free gid to map");
1571 _exit(EXIT_FAILURE);
1572 }
1573
1574 n2[n2args++] = malloc(200);
1575 if (!n2[n2args - 1]) {
1576 SYSERROR("out of memory");
1577 _exit(EXIT_FAILURE);
1578 }
1579
1580 ret = snprintf(n2[n2args - 1], 200, "g:%d:%d:1",
1581 hostgid_mapped, getegid());
1582 if (ret < 0 || ret >= 200)
1583 _exit(EXIT_FAILURE);
1584 }
1585
1586 n2[n2args++] = "--";
1587
1588 for (i = 0; i < nargs; i++)
1589 n2[i + n2args] = newargv[i];
1590 n2args += nargs;
1591
1592 /* Finally add "--mapped-uid $uid" to tell template what
1593 * to chown cached images to.
1594 */
1595 n2args += 4;
1596 n2 = realloc(n2, n2args * sizeof(char *));
1597 if (!n2)
1598 _exit(EXIT_FAILURE);
1599
1600 /* note n2[n2args-1] is NULL */
1601 n2[n2args - 5] = "--mapped-uid";
1602
1603 ret = snprintf(txtuid, 20, "%d", hostuid_mapped);
1604 if (ret < 0 || ret >= 20) {
1605 free(newargv);
1606 free(n2);
1607 _exit(EXIT_FAILURE);
1608 }
1609
1610 n2[n2args - 4] = txtuid;
1611 n2[n2args - 3] = "--mapped-gid";
1612
1613 ret = snprintf(txtgid, 20, "%d", hostgid_mapped);
1614 if (ret < 0 || ret >= 20) {
1615 free(newargv);
1616 free(n2);
1617 _exit(EXIT_FAILURE);
1618 }
1619
1620 n2[n2args - 2] = txtgid;
1621 n2[n2args - 1] = NULL;
1622 free(newargv);
1623 newargv = n2;
1624 }
1625
1626 execvp(tpath, newargv);
1627 SYSERROR("Failed to execute template %s", tpath);
1628 _exit(EXIT_FAILURE);
1629 }
1630
1631 ret = wait_for_pid(pid);
1632 if (ret != 0) {
1633 ERROR("Failed to create container from template");
1634 return false;
1635 }
1636
1637 return true;
1638 }
1639
1640 static bool prepend_lxc_header(char *path, const char *t, char *const argv[])
1641 {
1642 long flen;
1643 size_t len;
1644 char *contents;
1645 FILE *f;
1646 int ret = -1;
1647 #if HAVE_LIBGNUTLS
1648 int i;
1649 unsigned char md_value[SHA_DIGEST_LENGTH];
1650 char *tpath;
1651 #endif
1652
1653 f = fopen(path, "r");
1654 if (f == NULL)
1655 return false;
1656
1657 ret = fseek(f, 0, SEEK_END);
1658 if (ret < 0)
1659 goto out_error;
1660
1661 ret = -1;
1662 flen = ftell(f);
1663 if (flen < 0)
1664 goto out_error;
1665
1666 ret = fseek(f, 0, SEEK_SET);
1667 if (ret < 0)
1668 goto out_error;
1669
1670 ret = fseek(f, 0, SEEK_SET);
1671 if (ret < 0)
1672 goto out_error;
1673
1674 ret = -1;
1675 contents = malloc(flen + 1);
1676 if (!contents)
1677 goto out_error;
1678
1679 len = fread(contents, 1, flen, f);
1680 if (len != flen)
1681 goto out_free_contents;
1682
1683 contents[flen] = '\0';
1684
1685 ret = fclose(f);
1686 f = NULL;
1687 if (ret < 0)
1688 goto out_free_contents;
1689
1690 #if HAVE_LIBGNUTLS
1691 tpath = get_template_path(t);
1692 if (!tpath) {
1693 ERROR("Invalid template \"%s\" specified", t);
1694 goto out_free_contents;
1695 }
1696
1697 ret = sha1sum_file(tpath, md_value);
1698 if (ret < 0) {
1699 ERROR("Failed to get sha1sum of %s", tpath);
1700 free(tpath);
1701 goto out_free_contents;
1702 }
1703 free(tpath);
1704 #endif
1705
1706 f = fopen(path, "w");
1707 if (f == NULL) {
1708 SYSERROR("Reopening config for writing");
1709 free(contents);
1710 return false;
1711 }
1712
1713 fprintf(f, "# Template used to create this container: %s\n", t);
1714 if (argv) {
1715 fprintf(f, "# Parameters passed to the template:");
1716 while (*argv) {
1717 fprintf(f, " %s", *argv);
1718 argv++;
1719 }
1720 fprintf(f, "\n");
1721 }
1722
1723 #if HAVE_LIBGNUTLS
1724 fprintf(f, "# Template script checksum (SHA-1): ");
1725 for (i=0; i<SHA_DIGEST_LENGTH; i++)
1726 fprintf(f, "%02x", md_value[i]);
1727 fprintf(f, "\n");
1728 #endif
1729 fprintf(f, "# For additional config options, please look at lxc.container.conf(5)\n");
1730 fprintf(f, "\n# Uncomment the following line to support nesting containers:\n");
1731 fprintf(f, "#lxc.include = " LXCTEMPLATECONFIG "/nesting.conf\n");
1732 fprintf(f, "# (Be aware this has security implications)\n\n");
1733 if (fwrite(contents, 1, flen, f) != flen) {
1734 SYSERROR("Writing original contents");
1735 free(contents);
1736 fclose(f);
1737 return false;
1738 }
1739
1740 ret = 0;
1741
1742 out_free_contents:
1743 free(contents);
1744
1745 out_error:
1746 if (f) {
1747 int newret;
1748 newret = fclose(f);
1749 if (ret == 0)
1750 ret = newret;
1751 }
1752
1753 if (ret < 0) {
1754 SYSERROR("Error prepending header");
1755 return false;
1756 }
1757
1758 return true;
1759 }
1760
1761 static void lxcapi_clear_config(struct lxc_container *c)
1762 {
1763 if (!c || !c->lxc_conf)
1764 return;
1765
1766 lxc_conf_free(c->lxc_conf);
1767 c->lxc_conf = NULL;
1768 }
1769
1770 #define do_lxcapi_clear_config(c) lxcapi_clear_config(c)
1771
1772 /*
1773 * lxcapi_create:
1774 * create a container with the given parameters.
1775 * @c: container to be created. It has the lxcpath, name, and a starting
1776 * configuration already set
1777 * @t: the template to execute to instantiate the root filesystem and
1778 * adjust the configuration.
1779 * @bdevtype: backing store type to use. If NULL, dir will be used.
1780 * @specs: additional parameters for the backing store, i.e. LVM vg to
1781 * use.
1782 *
1783 * @argv: the arguments to pass to the template, terminated by NULL. If no
1784 * arguments, you can just pass NULL.
1785 */
1786 static bool do_lxcapi_create(struct lxc_container *c, const char *t,
1787 const char *bdevtype, struct bdev_specs *specs,
1788 int flags, char *const argv[])
1789 {
1790 int partial_fd;
1791 mode_t mask;
1792 pid_t pid;
1793 bool ret = false, rootfs_managed = true;
1794 char *tpath = NULL;
1795
1796 if (!c)
1797 return false;
1798
1799 if (t) {
1800 tpath = get_template_path(t);
1801 if (!tpath) {
1802 ERROR("Unknown template \"%s\"", t);
1803 goto out;
1804 }
1805 }
1806
1807 /* If a template is passed in, and the rootfs already is defined in the
1808 * container config and exists, then the caller is trying to create an
1809 * existing container. Return an error, but do NOT delete the container.
1810 */
1811 if (do_lxcapi_is_defined(c) && c->lxc_conf && c->lxc_conf->rootfs.path &&
1812 access(c->lxc_conf->rootfs.path, F_OK) == 0 && tpath) {
1813 ERROR("Container \"%s\" already exists in \"%s\"", c->name,
1814 c->config_path);
1815 goto free_tpath;
1816 }
1817
1818 if (!c->lxc_conf) {
1819 if (!do_lxcapi_load_config(c, lxc_global_config_value("lxc.default_config"))) {
1820 ERROR("Error loading default configuration file %s",
1821 lxc_global_config_value("lxc.default_config"));
1822 goto free_tpath;
1823 }
1824 }
1825
1826 if (!create_container_dir(c))
1827 goto free_tpath;
1828
1829 if (c->lxc_conf->rootfs.path)
1830 rootfs_managed = false;
1831
1832 /* If both template and rootfs.path are set, template is setup as
1833 * rootfs.path. The container is already created if we have a config and
1834 * rootfs.path is accessible
1835 */
1836 if (!c->lxc_conf->rootfs.path && !tpath) {
1837 /* No template passed in and rootfs does not exist. */
1838 if (!c->save_config(c, NULL)) {
1839 ERROR("Failed to save initial config for \"%s\"", c->name);
1840 goto out;
1841 }
1842 ret = true;
1843 goto out;
1844 }
1845
1846 /* Rootfs passed into configuration, but does not exist. */
1847 if (c->lxc_conf->rootfs.path && access(c->lxc_conf->rootfs.path, F_OK) != 0)
1848 goto out;
1849
1850 if (do_lxcapi_is_defined(c) && c->lxc_conf->rootfs.path && !tpath) {
1851 /* Rootfs already existed, user just wanted to save the loaded
1852 * configuration.
1853 */
1854 if (!c->save_config(c, NULL))
1855 ERROR("Failed to save initial config for \"%s\"", c->name);
1856
1857 ret = true;
1858 goto out;
1859 }
1860
1861 /* Mark that this container is being created */
1862 partial_fd = create_partial(c);
1863 if (partial_fd < 0)
1864 goto out;
1865
1866 /* No need to get disk lock bc we have the partial lock. */
1867
1868 mask = umask(0022);
1869
1870 /* Create the storage.
1871 * Note we can't do this in the same task as we use to execute the
1872 * template because of the way zfs works.
1873 * After you 'zfs create', zfs mounts the fs only in the initial
1874 * namespace.
1875 */
1876 pid = fork();
1877 if (pid < 0) {
1878 SYSERROR("Failed to fork task for container creation template");
1879 goto out_unlock;
1880 }
1881
1882 if (pid == 0) { /* child */
1883 struct lxc_storage *bdev = NULL;
1884
1885 bdev = do_storage_create(c, bdevtype, specs);
1886 if (!bdev) {
1887 ERROR("Failed to create %s storage for %s",
1888 bdevtype ? bdevtype : "(none)", c->name);
1889 _exit(EXIT_FAILURE);
1890 }
1891
1892 /* Save config file again to store the new rootfs location. */
1893 if (!do_lxcapi_save_config(c, NULL)) {
1894 ERROR("Failed to save initial config for %s", c->name);
1895 /* Parent task won't see the storage driver in the
1896 * config so we delete it.
1897 */
1898 bdev->ops->umount(bdev);
1899 bdev->ops->destroy(bdev);
1900 _exit(EXIT_FAILURE);
1901 }
1902
1903 _exit(EXIT_SUCCESS);
1904 }
1905
1906 if (wait_for_pid(pid) != 0)
1907 goto out_unlock;
1908
1909 /* Reload config to get the rootfs. */
1910 lxc_conf_free(c->lxc_conf);
1911 c->lxc_conf = NULL;
1912
1913 if (!load_config_locked(c, c->configfile))
1914 goto out_unlock;
1915
1916 if (!create_run_template(c, tpath, !!(flags & LXC_CREATE_QUIET), argv))
1917 goto out_unlock;
1918
1919 /* Now clear out the lxc_conf we have, reload from the created
1920 * container.
1921 */
1922 do_lxcapi_clear_config(c);
1923
1924 if (t) {
1925 if (!prepend_lxc_header(c->configfile, tpath, argv)) {
1926 ERROR("Failed to prepend header to config file");
1927 goto out_unlock;
1928 }
1929 }
1930
1931 ret = load_config_locked(c, c->configfile);
1932
1933 out_unlock:
1934 umask(mask);
1935 remove_partial(c, partial_fd);
1936
1937 out:
1938 if (!ret) {
1939 bool reset_managed = c->lxc_conf->rootfs.managed;
1940
1941 /*
1942 * Ensure that we don't destroy storage we didn't create
1943 * ourselves.
1944 */
1945 if (!rootfs_managed)
1946 c->lxc_conf->rootfs.managed = false;
1947 container_destroy(c, NULL);
1948 c->lxc_conf->rootfs.managed = reset_managed;
1949 }
1950
1951 free_tpath:
1952 free(tpath);
1953 return ret;
1954 }
1955
1956 static bool lxcapi_create(struct lxc_container *c, const char *t,
1957 const char *bdevtype, struct bdev_specs *specs,
1958 int flags, char *const argv[])
1959 {
1960 bool ret;
1961
1962 current_config = c ? c->lxc_conf : NULL;
1963
1964 ret = do_lxcapi_create(c, t, bdevtype, specs, flags, argv);
1965 current_config = NULL;
1966 return ret;
1967 }
1968
1969 static bool do_lxcapi_reboot(struct lxc_container *c)
1970 {
1971 int ret;
1972 pid_t pid;
1973 int rebootsignal = SIGINT;
1974
1975 if (!c)
1976 return false;
1977
1978 if (!do_lxcapi_is_running(c))
1979 return false;
1980
1981 pid = do_lxcapi_init_pid(c);
1982 if (pid <= 0)
1983 return false;
1984
1985 if (c->lxc_conf && c->lxc_conf->rebootsignal)
1986 rebootsignal = c->lxc_conf->rebootsignal;
1987
1988 ret = kill(pid, rebootsignal);
1989 if (ret < 0) {
1990 WARN("Failed to send signal %d to pid %d", rebootsignal, pid);
1991 return false;
1992 }
1993
1994 return true;
1995 }
1996
1997 WRAP_API(bool, lxcapi_reboot)
1998
1999 static bool do_lxcapi_reboot2(struct lxc_container *c, int timeout)
2000 {
2001 int killret, ret;
2002 pid_t pid;
2003 int rebootsignal = SIGINT, state_client_fd = -1;
2004 lxc_state_t states[MAX_STATE] = {0};
2005
2006 if (!c)
2007 return false;
2008
2009 if (!do_lxcapi_is_running(c))
2010 return true;
2011
2012 pid = do_lxcapi_init_pid(c);
2013 if (pid <= 0)
2014 return true;
2015
2016 if (c->lxc_conf && c->lxc_conf->rebootsignal)
2017 rebootsignal = c->lxc_conf->rebootsignal;
2018
2019 /* Add a new state client before sending the shutdown signal so that we
2020 * don't miss a state.
2021 */
2022 if (timeout != 0) {
2023 states[RUNNING] = 2;
2024 ret = lxc_cmd_add_state_client(c->name, c->config_path, states,
2025 &state_client_fd);
2026 if (ret < 0)
2027 return false;
2028
2029 if (state_client_fd < 0)
2030 return false;
2031
2032 if (ret == RUNNING)
2033 return true;
2034
2035 if (ret < MAX_STATE)
2036 return false;
2037 }
2038
2039 /* Send reboot signal to container. */
2040 killret = kill(pid, rebootsignal);
2041 if (killret < 0) {
2042 if (state_client_fd >= 0)
2043 close(state_client_fd);
2044
2045 WARN("Failed to send signal %d to pid %d", rebootsignal, pid);
2046 return false;
2047 }
2048 TRACE("Sent signal %d to pid %d", rebootsignal, pid);
2049
2050 if (timeout == 0)
2051 return true;
2052
2053 ret = lxc_cmd_sock_rcv_state(state_client_fd, timeout);
2054 close(state_client_fd);
2055 if (ret < 0)
2056 return false;
2057
2058 TRACE("Received state \"%s\"", lxc_state2str(ret));
2059 if (ret != RUNNING)
2060 return false;
2061
2062 return true;
2063 }
2064
2065 WRAP_API_1(bool, lxcapi_reboot2, int)
2066
2067 static bool do_lxcapi_shutdown(struct lxc_container *c, int timeout)
2068 {
2069 int killret, ret;
2070 pid_t pid;
2071 int haltsignal = SIGPWR, state_client_fd = -EBADF;
2072 lxc_state_t states[MAX_STATE] = {0};
2073
2074 if (!c)
2075 return false;
2076
2077 if (!do_lxcapi_is_running(c))
2078 return true;
2079
2080 pid = do_lxcapi_init_pid(c);
2081 if (pid <= 0)
2082 return true;
2083
2084 /* Detect whether we should send SIGRTMIN + 3 (e.g. systemd). */
2085 if (c->lxc_conf && c->lxc_conf->haltsignal)
2086 haltsignal = c->lxc_conf->haltsignal;
2087 else if (task_blocks_signal(pid, (SIGRTMIN + 3)))
2088 haltsignal = (SIGRTMIN + 3);
2089
2090 /* Add a new state client before sending the shutdown signal so that we
2091 * don't miss a state.
2092 */
2093 if (timeout != 0) {
2094 states[STOPPED] = 1;
2095 ret = lxc_cmd_add_state_client(c->name, c->config_path, states,
2096 &state_client_fd);
2097 if (ret < 0)
2098 return false;
2099
2100 if (state_client_fd < 0)
2101 return false;
2102
2103 if (ret == STOPPED)
2104 return true;
2105
2106 if (ret < MAX_STATE)
2107 return false;
2108 }
2109
2110 /* Send shutdown signal to container. */
2111 killret = kill(pid, haltsignal);
2112 if (killret < 0) {
2113 if (state_client_fd >= 0)
2114 close(state_client_fd);
2115
2116 WARN("Failed to send signal %d to pid %d", haltsignal, pid);
2117 return false;
2118 }
2119 TRACE("Sent signal %d to pid %d", haltsignal, pid);
2120
2121 if (timeout == 0)
2122 return true;
2123
2124 ret = lxc_cmd_sock_rcv_state(state_client_fd, timeout);
2125 close(state_client_fd);
2126 if (ret < 0)
2127 return false;
2128
2129 TRACE("Received state \"%s\"", lxc_state2str(ret));
2130 if (ret != STOPPED)
2131 return false;
2132
2133 return true;
2134 }
2135
2136 WRAP_API_1(bool, lxcapi_shutdown, int)
2137
2138 static bool lxcapi_createl(struct lxc_container *c, const char *t,
2139 const char *bdevtype, struct bdev_specs *specs, int flags, ...)
2140 {
2141 bool bret = false;
2142 char **args = NULL;
2143 va_list ap;
2144
2145 if (!c)
2146 return false;
2147
2148 current_config = c->lxc_conf;
2149
2150 /*
2151 * since we're going to wait for create to finish, I don't think we
2152 * need to get a copy of the arguments.
2153 */
2154 va_start(ap, flags);
2155 args = lxc_va_arg_list_to_argv(ap, 0, 0);
2156 va_end(ap);
2157 if (!args) {
2158 ERROR("Failed to allocate memory");
2159 goto out;
2160 }
2161
2162 bret = do_lxcapi_create(c, t, bdevtype, specs, flags, args);
2163
2164 out:
2165 free(args);
2166 current_config = NULL;
2167 return bret;
2168 }
2169
/* Forward @key to clear_unexp_config_line(), asking it to remove subkeys as
 * well when @key is exactly "lxc.cgroup", "lxc.network", "lxc.net" or
 * "lxc.hook", or when it is "lxc.net." followed by something
 * lxc_safe_uint() accepts (a network with a specific index).
 */
static void do_clear_unexp_config_line(struct lxc_conf *conf, const char *key)
{
	bool rm_subkeys;

	if (!strcmp(key, "lxc.cgroup") || !strcmp(key, "lxc.network") ||
	    !strcmp(key, "lxc.net"))
		rm_subkeys = true;
	else if (!strncmp(key, "lxc.net.", 8))
		/* Clear a network with a specific index. */
		rm_subkeys = lxc_safe_uint(key + 8, &(unsigned int){0}) == 0;
	else
		rm_subkeys = !strcmp(key, "lxc.hook");

	clear_unexp_config_line(conf, key, rm_subkeys);
}
2197
2198 static bool do_lxcapi_clear_config_item(struct lxc_container *c,
2199 const char *key)
2200 {
2201 int ret = 1;
2202 struct lxc_config_t *config;
2203
2204 if (!c || !c->lxc_conf)
2205 return false;
2206
2207 if (container_mem_lock(c))
2208 return false;
2209
2210 config = lxc_get_config(key);
2211 /* Verify that the config key exists and that it has a callback
2212 * implemented.
2213 */
2214 if (config && config->clr)
2215 ret = config->clr(key, c->lxc_conf, NULL);
2216
2217 if (!ret)
2218 do_clear_unexp_config_line(c->lxc_conf, key);
2219
2220 container_mem_unlock(c);
2221 return ret == 0;
2222 }
2223
2224 WRAP_API_1(bool, lxcapi_clear_config_item, const char *)
2225
2226 static inline bool enter_net_ns(struct lxc_container *c)
2227 {
2228 pid_t pid = do_lxcapi_init_pid(c);
2229
2230 if (pid < 0)
2231 return false;
2232
2233 if ((geteuid() != 0 || (c->lxc_conf && !lxc_list_empty(&c->lxc_conf->id_map))) &&
2234 (access("/proc/self/ns/user", F_OK) == 0))
2235 if (!switch_to_ns(pid, "user"))
2236 return false;
2237
2238 return switch_to_ns(pid, "net");
2239 }
2240
/* Used by qsort and bsearch functions for comparing names: both arguments
 * point at array elements, i.e. at string pointers.
 */
static inline int string_cmp(char **first, char **second)
{
	const char *lhs = *first;
	const char *rhs = *second;

	return strcmp(lhs, rhs);
}
2246
2247 /* Used by qsort and bsearch functions for comparing container names. */
2248 static inline int container_cmp(struct lxc_container **first,
2249 struct lxc_container **second)
2250 {
2251 return strcmp((*first)->name, (*second)->name);
2252 }
2253
2254 static bool add_to_array(char ***names, char *cname, int pos)
2255 {
2256 char **newnames = realloc(*names, (pos+1) * sizeof(char *));
2257 if (!newnames) {
2258 ERROR("Out of memory");
2259 return false;
2260 }
2261
2262 *names = newnames;
2263 newnames[pos] = strdup(cname);
2264 if (!newnames[pos])
2265 return false;
2266
2267 /* Sort the array as we will use binary search on it. */
2268 qsort(newnames, pos + 1, sizeof(char *),
2269 (int (*)(const void *, const void *))string_cmp);
2270
2271 return true;
2272 }
2273
2274 static bool add_to_clist(struct lxc_container ***list, struct lxc_container *c,
2275 int pos, bool sort)
2276 {
2277 struct lxc_container **newlist = realloc(*list, (pos + 1) * sizeof(struct lxc_container *));
2278 if (!newlist) {
2279 ERROR("Out of memory");
2280 return false;
2281 }
2282
2283 *list = newlist;
2284 newlist[pos] = c;
2285
2286 /* Sort the array as we will use binary search on it. */
2287 if (sort)
2288 qsort(newlist, pos + 1, sizeof(struct lxc_container *),
2289 (int (*)(const void *, const void *))container_cmp);
2290
2291 return true;
2292 }
2293
2294 static char** get_from_array(char ***names, char *cname, int size)
2295 {
2296 return (char **)bsearch(&cname, *names, size, sizeof(char *), (int (*)(const void *, const void *))string_cmp);
2297 }
2298
/* Tell whether @cname is found by get_from_array() among the first @size
 * entries of *@names.
 */
static bool array_contains(char ***names, char *cname, int size)
{
	return get_from_array(names, cname, size) != NULL;
}
2306
/* Remove @cname from the first @size entries of *@names.
 *
 * The stored string is freed, the following entries are moved down by one so
 * that the remaining @size - 1 entries stay contiguous and in order, and the
 * array is shrunk. When the last entry is removed the array itself is freed
 * and *@names is set to NULL. If shrinking fails the old, larger buffer is
 * kept; it still holds the remaining entries.
 *
 * Returns true when an entry was removed, false when @cname was not found.
 */
static bool remove_from_array(char ***names, char *cname, int size)
{
	char **slot, **shrunk;
	size_t idx, remaining;

	slot = get_from_array(names, cname, size);
	if (!slot)
		return false;

	idx = slot - *names;
	remaining = (size_t)size - 1;

	/* slot points into the array: free the string it holds, not the
	 * slot itself.
	 */
	free(*slot);
	memmove(slot, slot + 1, (remaining - idx) * sizeof(char *));

	if (remaining == 0) {
		free(*names);
		*names = NULL;
		return true;
	}

	shrunk = realloc(*names, remaining * sizeof(char *));
	if (shrunk)
		*names = shrunk;

	return true;
}
2317
2318 static char **do_lxcapi_get_interfaces(struct lxc_container *c)
2319 {
2320 pid_t pid;
2321 int i, count = 0, pipefd[2];
2322 char **interfaces = NULL;
2323 char interface[IFNAMSIZ];
2324
2325 if (pipe2(pipefd, O_CLOEXEC) < 0)
2326 return NULL;
2327
2328 pid = fork();
2329 if (pid < 0) {
2330 SYSERROR("Failed to fork task to get interfaces information");
2331 close(pipefd[0]);
2332 close(pipefd[1]);
2333 return NULL;
2334 }
2335
2336 if (pid == 0) { /* child */
2337 int ret = 1, nbytes;
2338 struct netns_ifaddrs *interfaceArray = NULL, *tempIfAddr = NULL;
2339
2340 /* close the read-end of the pipe */
2341 close(pipefd[0]);
2342
2343 if (!enter_net_ns(c)) {
2344 SYSERROR("Failed to enter network namespace");
2345 goto out;
2346 }
2347
2348 /* Grab the list of interfaces */
2349 if (netns_getifaddrs(&interfaceArray, -1, &(bool){false})) {
2350 SYSERROR("Failed to get interfaces list");
2351 goto out;
2352 }
2353
2354 /* Iterate through the interfaces */
2355 for (tempIfAddr = interfaceArray; tempIfAddr != NULL;
2356 tempIfAddr = tempIfAddr->ifa_next) {
2357 nbytes = lxc_write_nointr(pipefd[1], tempIfAddr->ifa_name, IFNAMSIZ);
2358 if (nbytes < 0)
2359 goto out;
2360
2361 count++;
2362 }
2363
2364 ret = 0;
2365
2366 out:
2367 if (interfaceArray)
2368 netns_freeifaddrs(interfaceArray);
2369
2370 /* close the write-end of the pipe, thus sending EOF to the reader */
2371 close(pipefd[1]);
2372 _exit(ret);
2373 }
2374
2375 /* close the write-end of the pipe */
2376 close(pipefd[1]);
2377
2378 while (lxc_read_nointr(pipefd[0], &interface, IFNAMSIZ) == IFNAMSIZ) {
2379 interface[IFNAMSIZ - 1] = '\0';
2380
2381 if (array_contains(&interfaces, interface, count))
2382 continue;
2383
2384 if (!add_to_array(&interfaces, interface, count))
2385 ERROR("Failed to add \"%s\" to array", interface);
2386
2387 count++;
2388 }
2389
2390 if (wait_for_pid(pid) != 0) {
2391 for (i = 0; i < count; i++)
2392 free(interfaces[i]);
2393
2394 free(interfaces);
2395 interfaces = NULL;
2396 }
2397
2398 /* close the read-end of the pipe */
2399 close(pipefd[0]);
2400
2401 /* Append NULL to the array */
2402 if (interfaces)
2403 interfaces = (char **)lxc_append_null_to_array((void **)interfaces, count);
2404
2405 return interfaces;
2406 }
2407
2408 WRAP_API(char **, lxcapi_get_interfaces)
2409
2410 static char **do_lxcapi_get_ips(struct lxc_container *c, const char *interface,
2411 const char *family, int scope)
2412 {
2413 int i, ret;
2414 pid_t pid;
2415 int pipefd[2];
2416 char address[INET6_ADDRSTRLEN];
2417 int count = 0;
2418 char **addresses = NULL;
2419
2420 ret = pipe2(pipefd, O_CLOEXEC);
2421 if (ret < 0) {
2422 SYSERROR("Failed to create pipe");
2423 return NULL;
2424 }
2425
2426 pid = fork();
2427 if (pid < 0) {
2428 SYSERROR("Failed to create new process");
2429 close(pipefd[0]);
2430 close(pipefd[1]);
2431 return NULL;
2432 }
2433
2434 if (pid == 0) {
2435 ssize_t nbytes;
2436 char addressOutputBuffer[INET6_ADDRSTRLEN];
2437 char *address_ptr = NULL;
2438 void *tempAddrPtr = NULL;
2439 struct netns_ifaddrs *interfaceArray = NULL, *tempIfAddr = NULL;
2440
2441 /* close the read-end of the pipe */
2442 close(pipefd[0]);
2443
2444 if (!enter_net_ns(c)) {
2445 SYSERROR("Failed to attach to network namespace");
2446 goto out;
2447 }
2448
2449 /* Grab the list of interfaces */
2450 if (netns_getifaddrs(&interfaceArray, -1, &(bool){false})) {
2451 SYSERROR("Failed to get interfaces list");
2452 goto out;
2453 }
2454
2455 /* Iterate through the interfaces */
2456 for (tempIfAddr = interfaceArray; tempIfAddr;
2457 tempIfAddr = tempIfAddr->ifa_next) {
2458 if (tempIfAddr->ifa_addr == NULL)
2459 continue;
2460
2461 #pragma GCC diagnostic push
2462 #pragma GCC diagnostic ignored "-Wcast-align"
2463
2464 if (tempIfAddr->ifa_addr->sa_family == AF_INET) {
2465 if (family && strcmp(family, "inet"))
2466 continue;
2467
2468 tempAddrPtr = &((struct sockaddr_in *)tempIfAddr->ifa_addr)->sin_addr;
2469 } else {
2470 if (family && strcmp(family, "inet6"))
2471 continue;
2472
2473 if (((struct sockaddr_in6 *)tempIfAddr->ifa_addr)->sin6_scope_id != scope)
2474 continue;
2475
2476 tempAddrPtr = &((struct sockaddr_in6 *)tempIfAddr->ifa_addr)->sin6_addr;
2477 }
2478
2479 #pragma GCC diagnostic pop
2480
2481 if (interface && strcmp(interface, tempIfAddr->ifa_name))
2482 continue;
2483 else if (!interface && strcmp("lo", tempIfAddr->ifa_name) == 0)
2484 continue;
2485
2486 address_ptr = (char *)inet_ntop(tempIfAddr->ifa_addr->sa_family,
2487 tempAddrPtr, addressOutputBuffer,
2488 sizeof(addressOutputBuffer));
2489 if (!address_ptr)
2490 continue;
2491
2492 nbytes = lxc_write_nointr(pipefd[1], address_ptr, INET6_ADDRSTRLEN);
2493 if (nbytes != INET6_ADDRSTRLEN) {
2494 SYSERROR("Failed to send ipv6 address \"%s\"",
2495 address_ptr);
2496 goto out;
2497 }
2498
2499 count++;
2500 }
2501
2502 ret = 0;
2503
2504 out:
2505 if (interfaceArray)
2506 netns_freeifaddrs(interfaceArray);
2507
2508 /* close the write-end of the pipe, thus sending EOF to the reader */
2509 close(pipefd[1]);
2510 _exit(ret);
2511 }
2512
2513 /* close the write-end of the pipe */
2514 close(pipefd[1]);
2515
2516 while (lxc_read_nointr(pipefd[0], &address, INET6_ADDRSTRLEN) == INET6_ADDRSTRLEN) {
2517 address[INET6_ADDRSTRLEN - 1] = '\0';
2518
2519 if (!add_to_array(&addresses, address, count))
2520 ERROR("PARENT: add_to_array failed");
2521
2522 count++;
2523 }
2524
2525 if (wait_for_pid(pid) != 0) {
2526 for (i = 0; i < count; i++)
2527 free(addresses[i]);
2528
2529 free(addresses);
2530 addresses = NULL;
2531 }
2532
2533 /* close the read-end of the pipe */
2534 close(pipefd[0]);
2535
2536 /* Append NULL to the array */
2537 if (addresses)
2538 addresses = (char **)lxc_append_null_to_array((void **)addresses, count);
2539
2540 return addresses;
2541 }
2542
2543 WRAP_API_3(char **, lxcapi_get_ips, const char *, const char *, int)
2544
2545 static int do_lxcapi_get_config_item(struct lxc_container *c, const char *key, char *retv, int inlen)
2546 {
2547 int ret = -1;
2548 struct lxc_config_t *config;
2549
2550 if (!c || !c->lxc_conf)
2551 return -1;
2552
2553 if (container_mem_lock(c))
2554 return -1;
2555
2556 config = lxc_get_config(key);
2557 /* Verify that the config key exists and that it has a callback
2558 * implemented.
2559 */
2560 if (config && config->get)
2561 ret = config->get(key, retv, inlen, c->lxc_conf, NULL);
2562
2563 container_mem_unlock(c);
2564 return ret;
2565 }
2566
2567 WRAP_API_3(int, lxcapi_get_config_item, const char *, char *, int)
2568
2569 static char* do_lxcapi_get_running_config_item(struct lxc_container *c, const char *key)
2570 {
2571 char *ret;
2572
2573 if (!c || !c->lxc_conf)
2574 return NULL;
2575
2576 if (container_mem_lock(c))
2577 return NULL;
2578
2579 ret = lxc_cmd_get_config_item(c->name, key, do_lxcapi_get_config_path(c));
2580 container_mem_unlock(c);
2581 return ret;
2582 }
2583
2584 WRAP_API_1(char *, lxcapi_get_running_config_item, const char *)
2585
2586 static int do_lxcapi_get_keys(struct lxc_container *c, const char *key, char *retv, int inlen)
2587 {
2588 int ret = -1;
2589
2590 /* List all config items. */
2591 if (!key)
2592 return lxc_list_config_items(retv, inlen);
2593
2594 if (!c || !c->lxc_conf)
2595 return -1;
2596
2597 if (container_mem_lock(c))
2598 return -1;
2599
2600 /* Support 'lxc.net.<idx>', i.e. 'lxc.net.0'
2601 * This is an intelligent result to show which keys are valid given the
2602 * type of nic it is.
2603 */
2604 if (strncmp(key, "lxc.net.", 8) == 0)
2605 ret = lxc_list_net(c->lxc_conf, key, retv, inlen);
2606 else
2607 ret = lxc_list_subkeys(c->lxc_conf, key, retv, inlen);
2608
2609 container_mem_unlock(c);
2610 return ret;
2611 }
2612
2613 WRAP_API_3(int, lxcapi_get_keys, const char *, char *, int)
2614
2615 static bool do_lxcapi_save_config(struct lxc_container *c, const char *alt_file)
2616 {
2617 int fd, lret;
2618 bool ret = false, need_disklock = false;
2619
2620 if (!alt_file)
2621 alt_file = c->configfile;
2622
2623 if (!alt_file)
2624 return false;
2625
2626 /* If we haven't yet loaded a config, load the stock config. */
2627 if (!c->lxc_conf) {
2628 if (!do_lxcapi_load_config(c, lxc_global_config_value("lxc.default_config"))) {
2629 ERROR("Error loading default configuration file %s "
2630 "while saving %s",
2631 lxc_global_config_value("lxc.default_config"),
2632 c->name);
2633 return false;
2634 }
2635 }
2636
2637 if (!create_container_dir(c))
2638 return false;
2639
2640 /* If we're writing to the container's config file, take the disk lock.
2641 * Otherwise just take the memlock to protect the struct lxc_container
2642 * while we're traversing it.
2643 */
2644 if (strcmp(c->configfile, alt_file) == 0)
2645 need_disklock = true;
2646
2647 if (need_disklock)
2648 lret = container_disk_lock(c);
2649 else
2650 lret = container_mem_lock(c);
2651 if (lret)
2652 return false;
2653
2654 fd = open(alt_file, O_WRONLY | O_CREAT | O_TRUNC | O_CLOEXEC,
2655 S_IRUSR | S_IWUSR | S_IRGRP | S_IWGRP);
2656 if (fd < 0)
2657 goto on_error;
2658
2659 lret = write_config(fd, c->lxc_conf);
2660 close(fd);
2661 if (lret < 0)
2662 goto on_error;
2663
2664 ret = true;
2665
2666 on_error:
2667 if (need_disklock)
2668 container_disk_unlock(c);
2669 else
2670 container_mem_unlock(c);
2671
2672 return ret;
2673 }
2674
2675 WRAP_API_1(bool, lxcapi_save_config, const char *)
2676
2677
2678 static bool mod_rdep(struct lxc_container *c0, struct lxc_container *c, bool inc)
2679 {
2680 FILE *f1;
2681 struct stat fbuf;
2682 void *buf = NULL;
2683 char *del = NULL;
2684 char path[PATH_MAX];
2685 char newpath[PATH_MAX];
2686 int fd, ret, n = 0, v = 0;
2687 bool bret = false;
2688 size_t len = 0, bytes = 0;
2689
2690 if (container_disk_lock(c0))
2691 return false;
2692
2693 ret = snprintf(path, PATH_MAX, "%s/%s/lxc_snapshots", c0->config_path, c0->name);
2694 if (ret < 0 || ret > PATH_MAX)
2695 goto out;
2696
2697 ret = snprintf(newpath, PATH_MAX, "%s\n%s\n", c->config_path, c->name);
2698 if (ret < 0 || ret > PATH_MAX)
2699 goto out;
2700
2701 /* If we find an lxc-snapshot file using the old format only listing the
2702 * number of snapshots we will keep using it. */
2703 f1 = fopen(path, "r");
2704 if (f1) {
2705 n = fscanf(f1, "%d", &v);
2706 fclose(f1);
2707 if (n == 1 && v == 0) {
2708 ret = remove(path);
2709 if (ret < 0)
2710 SYSERROR("Failed to remove \"%s\"", path);
2711
2712 n = 0;
2713 }
2714 }
2715
2716 if (n == 1) {
2717 v += inc ? 1 : -1;
2718 f1 = fopen(path, "w");
2719 if (!f1)
2720 goto out;
2721
2722 if (fprintf(f1, "%d\n", v) < 0) {
2723 ERROR("Error writing new snapshots value");
2724 fclose(f1);
2725 goto out;
2726 }
2727
2728 ret = fclose(f1);
2729 if (ret != 0) {
2730 SYSERROR("Error writing to or closing snapshots file");
2731 goto out;
2732 }
2733 } else {
2734 /* Here we know that we have or can use an lxc-snapshot file
2735 * using the new format. */
2736 if (inc) {
2737 f1 = fopen(path, "a");
2738 if (!f1)
2739 goto out;
2740
2741 if (fprintf(f1, "%s", newpath) < 0) {
2742 ERROR("Error writing new snapshots entry");
2743 ret = fclose(f1);
2744 if (ret != 0)
2745 SYSERROR("Error writing to or closing snapshots file");
2746 goto out;
2747 }
2748
2749 ret = fclose(f1);
2750 if (ret != 0) {
2751 SYSERROR("Error writing to or closing snapshots file");
2752 goto out;
2753 }
2754 } else if (!inc) {
2755 if ((fd = open(path, O_RDWR | O_CLOEXEC)) < 0)
2756 goto out;
2757
2758 if (fstat(fd, &fbuf) < 0) {
2759 close(fd);
2760 goto out;
2761 }
2762
2763 if (fbuf.st_size != 0) {
2764 buf = lxc_strmmap(NULL, fbuf.st_size, PROT_READ | PROT_WRITE, MAP_SHARED, fd, 0);
2765 if (buf == MAP_FAILED) {
2766 SYSERROR("Failed to create mapping %s", path);
2767 close(fd);
2768 goto out;
2769 }
2770
2771 len = strlen(newpath);
2772 while ((del = strstr((char *)buf, newpath))) {
2773 memmove(del, del + len, strlen(del) - len + 1);
2774 bytes += len;
2775 }
2776
2777 lxc_strmunmap(buf, fbuf.st_size);
2778 if (ftruncate(fd, fbuf.st_size - bytes) < 0) {
2779 SYSERROR("Failed to truncate file %s", path);
2780 close(fd);
2781 goto out;
2782 }
2783 }
2784
2785 close(fd);
2786 }
2787
2788 /* If the lxc-snapshot file is empty, remove it. */
2789 if (stat(path, &fbuf) < 0)
2790 goto out;
2791
2792 if (!fbuf.st_size) {
2793 ret = remove(path);
2794 if (ret < 0)
2795 SYSERROR("Failed to remove \"%s\"", path);
2796 }
2797 }
2798
2799 bret = true;
2800
2801 out:
2802 container_disk_unlock(c0);
2803 return bret;
2804 }
2805
2806 void mod_all_rdeps(struct lxc_container *c, bool inc)
2807 {
2808 struct lxc_container *p;
2809 char *lxcpath = NULL, *lxcname = NULL, path[PATH_MAX];
2810 size_t pathlen = 0, namelen = 0;
2811 FILE *f;
2812 int ret;
2813
2814 ret = snprintf(path, PATH_MAX, "%s/%s/lxc_rdepends",
2815 c->config_path, c->name);
2816 if (ret < 0 || ret >= PATH_MAX) {
2817 ERROR("Path name too long");
2818 return;
2819 }
2820
2821 f = fopen(path, "r");
2822 if (f == NULL)
2823 return;
2824
2825 while (getline(&lxcpath, &pathlen, f) != -1) {
2826 if (getline(&lxcname, &namelen, f) == -1) {
2827 ERROR("badly formatted file %s", path);
2828 goto out;
2829 }
2830
2831 remove_trailing_newlines(lxcpath);
2832 remove_trailing_newlines(lxcname);
2833
2834 if ((p = lxc_container_new(lxcname, lxcpath)) == NULL) {
2835 ERROR("Unable to find dependent container %s:%s",
2836 lxcpath, lxcname);
2837 continue;
2838 }
2839
2840 if (!mod_rdep(p, c, inc))
2841 ERROR("Failed to update snapshots file for %s:%s",
2842 lxcpath, lxcname);
2843
2844 lxc_container_put(p);
2845 }
2846
2847 out:
2848 free(lxcpath);
2849 free(lxcname);
2850 fclose(f);
2851 }
2852
2853 static bool has_fs_snapshots(struct lxc_container *c)
2854 {
2855 FILE *f;
2856 char path[PATH_MAX];
2857 int ret, v;
2858 struct stat fbuf;
2859 bool bret = false;
2860
2861 ret = snprintf(path, PATH_MAX, "%s/%s/lxc_snapshots", c->config_path,
2862 c->name);
2863 if (ret < 0 || ret > PATH_MAX)
2864 goto out;
2865
2866 /* If the file doesn't exist there are no snapshots. */
2867 if (stat(path, &fbuf) < 0)
2868 goto out;
2869
2870 v = fbuf.st_size;
2871 if (v != 0) {
2872 f = fopen(path, "r");
2873 if (!f)
2874 goto out;
2875
2876 ret = fscanf(f, "%d", &v);
2877 fclose(f);
2878 /* TODO: Figure out what to do with the return value of fscanf. */
2879 if (ret != 1)
2880 INFO("Container uses new lxc-snapshots format %s", path);
2881 }
2882
2883 bret = v != 0;
2884
2885 out:
2886 return bret;
2887 }
2888
2889 static bool has_snapshots(struct lxc_container *c)
2890 {
2891 char path[PATH_MAX];
2892 struct dirent *direntp;
2893 int count=0;
2894 DIR *dir;
2895
2896 if (!get_snappath_dir(c, path))
2897 return false;
2898
2899 dir = opendir(path);
2900 if (!dir)
2901 return false;
2902
2903 while ((direntp = readdir(dir))) {
2904 if (!strcmp(direntp->d_name, "."))
2905 continue;
2906
2907 if (!strcmp(direntp->d_name, ".."))
2908 continue;
2909 count++;
2910 break;
2911 }
2912
2913 closedir(dir);
2914 return count > 0;
2915 }
2916
2917 static bool do_destroy_container(struct lxc_conf *conf) {
2918 int ret;
2919
2920 if (am_guest_unpriv()) {
2921 ret = userns_exec_full(conf, storage_destroy_wrapper, conf,
2922 "storage_destroy_wrapper");
2923 if (ret < 0)
2924 return false;
2925
2926 return true;
2927 }
2928
2929 return storage_destroy(conf);
2930 }
2931
/*
 * Callback adapter: @data is the path string to hand to lxc_rmdir_onedev(),
 * with "snaps" as its second argument.
 */
static int lxc_rmdir_onedev_wrapper(void *data)
{
	char *path = data;

	return lxc_rmdir_onedev(path, "snaps");
}
2937
/* Callback adapter: @data is the path string to pass to unlink(). */
static int lxc_unlink_exec_wrapper(void *data)
{
	char *path = (char *)data;

	return unlink(path);
}
2943
2944 static bool container_destroy(struct lxc_container *c,
2945 struct lxc_storage *storage)
2946 {
2947 const char *p1;
2948 size_t len;
2949 struct lxc_conf *conf;
2950 char *path = NULL;
2951 bool bret = false;
2952 int ret = 0;
2953
2954 if (!c || !do_lxcapi_is_defined(c))
2955 return false;
2956
2957 conf = c->lxc_conf;
2958 if (container_disk_lock(c))
2959 return false;
2960
2961 if (!is_stopped(c)) {
2962 /* We should queue some sort of error - in c->error_string? */
2963 ERROR("container %s is not stopped", c->name);
2964 goto out;
2965 }
2966
2967 if (conf && !lxc_list_empty(&conf->hooks[LXCHOOK_DESTROY])) {
2968 /* Start of environment variable setup for hooks */
2969 if (setenv("LXC_NAME", c->name, 1))
2970 SYSERROR("Failed to set environment variable for container name");
2971
2972 if (conf->rcfile && setenv("LXC_CONFIG_FILE", conf->rcfile, 1))
2973 SYSERROR("Failed to set environment variable for config path");
2974
2975 if (conf->rootfs.mount && setenv("LXC_ROOTFS_MOUNT", conf->rootfs.mount, 1))
2976 SYSERROR("Failed to set environment variable for rootfs mount");
2977
2978 if (conf->rootfs.path && setenv("LXC_ROOTFS_PATH", conf->rootfs.path, 1))
2979 SYSERROR("Failed to set environment variable for rootfs mount");
2980
2981 if (conf->console.path && setenv("LXC_CONSOLE", conf->console.path, 1))
2982 SYSERROR("Failed to set environment variable for console path");
2983
2984 if (conf->console.log_path && setenv("LXC_CONSOLE_LOGPATH", conf->console.log_path, 1))
2985 SYSERROR("Failed to set environment variable for console log");
2986 /* End of environment variable setup for hooks */
2987
2988 if (run_lxc_hooks(c->name, "destroy", conf, NULL)) {
2989 ERROR("Failed to execute clone hook for \"%s\"", c->name);
2990 goto out;
2991 }
2992 }
2993
2994 if (current_config && conf == current_config) {
2995 current_config = NULL;
2996
2997 if (conf->logfd != -1) {
2998 close(conf->logfd);
2999 conf->logfd = -1;
3000 }
3001 }
3002
3003 /* LXC is not managing the storage of the container. */
3004 if (conf && !conf->rootfs.managed)
3005 goto on_success;
3006
3007 if (conf && conf->rootfs.path && conf->rootfs.mount) {
3008 if (!do_destroy_container(conf)) {
3009 ERROR("Error destroying rootfs for %s", c->name);
3010 goto out;
3011 }
3012 INFO("Destroyed rootfs for %s", c->name);
3013 }
3014
3015 mod_all_rdeps(c, false);
3016
3017 p1 = do_lxcapi_get_config_path(c);
3018 /* strlen(p1)
3019 * +
3020 * /
3021 * +
3022 * strlen(c->name)
3023 * +
3024 * /
3025 * +
3026 * strlen("config") = 6
3027 * +
3028 * \0
3029 */
3030 len = strlen(p1) + 1 + strlen(c->name) + 1 + 6 + 1;
3031 path = malloc(len);
3032 if (!path) {
3033 ERROR("Failed to allocate memory");
3034 goto out;
3035 }
3036
3037 /* For an overlay container the rootfs is considered immutable and
3038 * cannot be removed when restoring from a snapshot.
3039 */
3040 if (storage && (!strcmp(storage->type, "overlay") ||
3041 !strcmp(storage->type, "overlayfs")) &&
3042 (storage->flags & LXC_STORAGE_INTERNAL_OVERLAY_RESTORE)) {
3043 ret = snprintf(path, len, "%s/%s/config", p1, c->name);
3044 if (ret < 0 || (size_t)ret >= len)
3045 goto out;
3046
3047 if (am_guest_unpriv())
3048 ret = userns_exec_1(conf, lxc_unlink_exec_wrapper, path,
3049 "lxc_unlink_exec_wrapper");
3050 else
3051 ret = unlink(path);
3052 if (ret < 0) {
3053 SYSERROR("Failed to destroy config file \"%s\" for \"%s\"",
3054 path, c->name);
3055 goto out;
3056 }
3057 INFO("Destroyed config file \"%s\" for \"%s\"", path, c->name);
3058
3059 bret = true;
3060 goto out;
3061 }
3062
3063 ret = snprintf(path, len, "%s/%s", p1, c->name);
3064 if (ret < 0 || (size_t)ret >= len)
3065 goto out;
3066
3067 if (am_guest_unpriv())
3068 ret = userns_exec_full(conf, lxc_rmdir_onedev_wrapper, path,
3069 "lxc_rmdir_onedev_wrapper");
3070 else
3071 ret = lxc_rmdir_onedev(path, "snaps");
3072 if (ret < 0) {
3073 ERROR("Failed to destroy directory \"%s\" for \"%s\"", path,
3074 c->name);
3075 goto out;
3076 }
3077 INFO("Destroyed directory \"%s\" for \"%s\"", path, c->name);
3078
3079 on_success:
3080 bret = true;
3081
3082 out:
3083 if (path)
3084 free(path);
3085
3086 container_disk_unlock(c);
3087 return bret;
3088 }
3089
3090 static bool do_lxcapi_destroy(struct lxc_container *c)
3091 {
3092 if (!c || !lxcapi_is_defined(c))
3093 return false;
3094
3095 if (c->lxc_conf && c->lxc_conf->rootfs.managed) {
3096 if (has_snapshots(c)) {
3097 ERROR("Container %s has snapshots; not removing", c->name);
3098 return false;
3099 }
3100
3101 if (has_fs_snapshots(c)) {
3102 ERROR("container %s has snapshots on its rootfs", c->name);
3103 return false;
3104 }
3105 }
3106
3107 return container_destroy(c, NULL);
3108 }
3109
3110 WRAP_API(bool, lxcapi_destroy)
3111
3112 static bool do_lxcapi_destroy_with_snapshots(struct lxc_container *c)
3113 {
3114 if (!c || !lxcapi_is_defined(c))
3115 return false;
3116
3117 if (!lxcapi_snapshot_destroy_all(c)) {
3118 ERROR("Error deleting all snapshots");
3119 return false;
3120 }
3121
3122 return lxcapi_destroy(c);
3123 }
3124
3125 WRAP_API(bool, lxcapi_destroy_with_snapshots)
3126
3127 int lxc_set_config_item_locked(struct lxc_conf *conf, const char *key,
3128 const char *v)
3129 {
3130 int ret;
3131 struct lxc_config_t *config;
3132 bool bret = true;
3133
3134 config = lxc_get_config(key);
3135 if (!config)
3136 return -EINVAL;
3137
3138 ret = config->set(key, v, conf, NULL);
3139 if (ret < 0)
3140 return -EINVAL;
3141
3142 if (lxc_config_value_empty(v))
3143 do_clear_unexp_config_line(conf, key);
3144 else
3145 bret = do_append_unexp_config_line(conf, key, v);
3146 if (!bret)
3147 return -ENOMEM;
3148
3149 return 0;
3150 }
3151
3152 static bool do_set_config_item_locked(struct lxc_container *c, const char *key,
3153 const char *v)
3154 {
3155 int ret;
3156
3157 if (!c->lxc_conf)
3158 c->lxc_conf = lxc_conf_init();
3159
3160 if (!c->lxc_conf)
3161 return false;
3162
3163 ret = lxc_set_config_item_locked(c->lxc_conf, key, v);
3164 if (ret < 0)
3165 return false;
3166
3167 return true;
3168 }
3169
3170 static bool do_lxcapi_set_config_item(struct lxc_container *c, const char *key, const char *v)
3171 {
3172 bool b = false;
3173
3174 if (!c)
3175 return false;
3176
3177 if (container_mem_lock(c))
3178 return false;
3179
3180 b = do_set_config_item_locked(c, key, v);
3181
3182 container_mem_unlock(c);
3183 return b;
3184 }
3185
3186 WRAP_API_2(bool, lxcapi_set_config_item, const char *, const char *)
3187
3188 static char *lxcapi_config_file_name(struct lxc_container *c)
3189 {
3190 if (!c || !c->configfile)
3191 return NULL;
3192
3193 return strdup(c->configfile);
3194 }
3195
3196 static const char *lxcapi_get_config_path(struct lxc_container *c)
3197 {
3198 if (!c || !c->config_path)
3199 return NULL;
3200
3201 return (const char *)(c->config_path);
3202 }
3203
3204 /*
3205 * not for export
3206 * Just recalculate the c->configfile based on the
3207 * c->config_path, which must be set.
3208 * The lxc_container must be locked or not yet public.
3209 */
3210 static bool set_config_filename(struct lxc_container *c)
3211 {
3212 char *newpath;
3213 int len, ret;
3214
3215 if (!c->config_path)
3216 return false;
3217
3218 /* $lxc_path + "/" + c->name + "/" + "config" + '\0' */
3219 len = strlen(c->config_path) + strlen(c->name) + strlen("config") + 3;
3220 newpath = malloc(len);
3221 if (!newpath)
3222 return false;
3223
3224 ret = snprintf(newpath, len, "%s/%s/config", c->config_path, c->name);
3225 if (ret < 0 || ret >= len) {
3226 fprintf(stderr, "Error printing out config file name\n");
3227 free(newpath);
3228 return false;
3229 }
3230
3231 free(c->configfile);
3232 c->configfile = newpath;
3233
3234 return true;
3235 }
3236
3237 static bool do_lxcapi_set_config_path(struct lxc_container *c, const char *path)
3238 {
3239 char *p;
3240 bool b = false;
3241 char *oldpath = NULL;
3242
3243 if (!c)
3244 return b;
3245
3246 if (container_mem_lock(c))
3247 return b;
3248
3249 p = strdup(path);
3250 if (!p) {
3251 ERROR("Out of memory setting new lxc path");
3252 goto err;
3253 }
3254
3255 b = true;
3256 if (c->config_path)
3257 oldpath = c->config_path;
3258 c->config_path = p;
3259
3260 /* Since we've changed the config path, we have to change the
3261 * config file name too */
3262 if (!set_config_filename(c)) {
3263 ERROR("Out of memory setting new config filename");
3264 b = false;
3265 free(c->config_path);
3266 c->config_path = oldpath;
3267 oldpath = NULL;
3268 }
3269
3270 err:
3271 free(oldpath);
3272 container_mem_unlock(c);
3273 return b;
3274 }
3275
3276 WRAP_API_1(bool, lxcapi_set_config_path, const char *)
3277
3278 static bool do_lxcapi_set_cgroup_item(struct lxc_container *c, const char *subsys, const char *value)
3279 {
3280 int ret;
3281 struct cgroup_ops *cgroup_ops;
3282
3283 if (!c)
3284 return false;
3285
3286 if (is_stopped(c))
3287 return false;
3288
3289 cgroup_ops = cgroup_init(c->lxc_conf);
3290 if (!cgroup_ops)
3291 return false;
3292
3293 ret = cgroup_ops->set(cgroup_ops, subsys, value, c->name, c->config_path);
3294
3295 cgroup_exit(cgroup_ops);
3296
3297 return ret == 0;
3298 }
3299
3300 WRAP_API_2(bool, lxcapi_set_cgroup_item, const char *, const char *)
3301
3302 static int do_lxcapi_get_cgroup_item(struct lxc_container *c, const char *subsys, char *retv, int inlen)
3303 {
3304 int ret;
3305 struct cgroup_ops *cgroup_ops;
3306
3307 if (!c)
3308 return -1;
3309
3310 if (is_stopped(c))
3311 return -1;
3312
3313 cgroup_ops = cgroup_init(c->lxc_conf);
3314 if (!cgroup_ops)
3315 return -1;
3316
3317 ret = cgroup_ops->get(cgroup_ops, subsys, retv, inlen, c->name,
3318 c->config_path);
3319
3320 cgroup_exit(cgroup_ops);
3321
3322 return ret;
3323 }
3324
3325 WRAP_API_3(int, lxcapi_get_cgroup_item, const char *, char *, int)
3326
/* Public accessor: forwards @key to lxc_global_config_value(). */
const char *lxc_get_global_config_item(const char *key)
{
	const char *value = lxc_global_config_value(key);

	return value;
}
3331
3332 const char *lxc_get_version(void)
3333 {
3334 return LXC_VERSION;
3335 }
3336
3337 static int copy_file(const char *old, const char *new)
3338 {
3339 int in, out;
3340 ssize_t len, ret;
3341 char buf[8096];
3342 struct stat sbuf;
3343
3344 if (file_exists(new)) {
3345 ERROR("copy destination %s exists", new);
3346 return -1;
3347 }
3348
3349 ret = stat(old, &sbuf);
3350 if (ret < 0) {
3351 INFO("Error stat'ing %s", old);
3352 return -1;
3353 }
3354
3355 in = open(old, O_RDONLY);
3356 if (in < 0) {
3357 SYSERROR("Error opening original file %s", old);
3358 return -1;
3359 }
3360
3361 out = open(new, O_CREAT | O_EXCL | O_WRONLY, 0644);
3362 if (out < 0) {
3363 SYSERROR("Error opening new file %s", new);
3364 close(in);
3365 return -1;
3366 }
3367
3368 for (;;) {
3369 len = lxc_read_nointr(in, buf, 8096);
3370 if (len < 0) {
3371 SYSERROR("Error reading old file %s", old);
3372 goto err;
3373 }
3374
3375 if (len == 0)
3376 break;
3377
3378 ret = lxc_write_nointr(out, buf, len);
3379 if (ret < len) { /* should we retry? */
3380 SYSERROR("Error: write to new file %s was interrupted", new);
3381 goto err;
3382 }
3383 }
3384
3385 close(in);
3386 close(out);
3387
3388 /* We set mode, but not owner/group. */
3389 ret = chmod(new, sbuf.st_mode);
3390 if (ret) {
3391 SYSERROR("Error setting mode on %s", new);
3392 return -1;
3393 }
3394
3395 return 0;
3396
3397 err:
3398 close(in);
3399 close(out);
3400 return -1;
3401 }
3402
3403 static int copyhooks(struct lxc_container *oldc, struct lxc_container *c)
3404 {
3405 __do_free char *cpath = NULL;
3406 int i, len, ret;
3407 struct lxc_list *it;
3408
3409 len = strlen(oldc->config_path) + strlen(oldc->name) + 3;
3410 cpath = must_realloc(NULL, len);
3411 ret = snprintf(cpath, len, "%s/%s/", oldc->config_path, oldc->name);
3412 if (ret < 0 || ret >= len)
3413 return -1;
3414
3415 for (i=0; i<NUM_LXC_HOOKS; i++) {
3416 lxc_list_for_each(it, &c->lxc_conf->hooks[i]) {
3417 char *hookname = it->elem;
3418 char *fname = strrchr(hookname, '/');
3419 char tmppath[PATH_MAX];
3420 if (!fname) /* relative path - we don't support, but maybe we should */
3421 return 0;
3422
3423 if (strncmp(hookname, cpath, len - 1) != 0) {
3424 /* this hook is public - ignore */
3425 continue;
3426 }
3427
3428 /* copy the script, and change the entry in confile */
3429 ret = snprintf(tmppath, PATH_MAX, "%s/%s/%s",
3430 c->config_path, c->name, fname+1);
3431 if (ret < 0 || ret >= PATH_MAX)
3432 return -1;
3433
3434 ret = copy_file(it->elem, tmppath);
3435 if (ret < 0)
3436 return -1;
3437
3438 free(it->elem);
3439
3440 it->elem = strdup(tmppath);
3441 if (!it->elem) {
3442 ERROR("out of memory copying hook path");
3443 return -1;
3444 }
3445 }
3446 }
3447
3448 if (!clone_update_unexp_hooks(c->lxc_conf, oldc->config_path,
3449 c->config_path, oldc->name, c->name)) {
3450 ERROR("Error saving new hooks in clone");
3451 return -1;
3452 }
3453
3454 do_lxcapi_save_config(c, NULL);
3455 return 0;
3456 }
3457
3458
3459 static int copy_fstab(struct lxc_container *oldc, struct lxc_container *c)
3460 {
3461 char newpath[PATH_MAX];
3462 char *oldpath = oldc->lxc_conf->fstab;
3463 int ret;
3464
3465 if (!oldpath)
3466 return 0;
3467
3468 clear_unexp_config_line(c->lxc_conf, "lxc.mount.fstab", false);
3469
3470 char *p = strrchr(oldpath, '/');
3471 if (!p)
3472 return -1;
3473
3474 ret = snprintf(newpath, PATH_MAX, "%s/%s%s",
3475 c->config_path, c->name, p);
3476 if (ret < 0 || ret >= PATH_MAX) {
3477 ERROR("error printing new path for %s", oldpath);
3478 return -1;
3479 }
3480
3481 if (file_exists(newpath)) {
3482 ERROR("error: fstab file %s exists", newpath);
3483 return -1;
3484 }
3485
3486 if (copy_file(oldpath, newpath) < 0) {
3487 ERROR("error: copying %s to %s", oldpath, newpath);
3488 return -1;
3489 }
3490
3491 free(c->lxc_conf->fstab);
3492
3493 c->lxc_conf->fstab = strdup(newpath);
3494 if (!c->lxc_conf->fstab) {
3495 ERROR("error: allocating pathname");
3496 return -1;
3497 }
3498
3499 if (!do_append_unexp_config_line(c->lxc_conf, "lxc.mount.fstab", newpath)) {
3500 ERROR("error saving new lxctab");
3501 return -1;
3502 }
3503
3504 return 0;
3505 }
3506
3507 static void copy_rdepends(struct lxc_container *c, struct lxc_container *c0)
3508 {
3509 char path0[PATH_MAX], path1[PATH_MAX];
3510 int ret;
3511
3512 ret = snprintf(path0, PATH_MAX, "%s/%s/lxc_rdepends", c0->config_path,
3513 c0->name);
3514 if (ret < 0 || ret >= PATH_MAX) {
3515 WARN("Error copying reverse dependencies");
3516 return;
3517 }
3518
3519 ret = snprintf(path1, PATH_MAX, "%s/%s/lxc_rdepends", c->config_path,
3520 c->name);
3521 if (ret < 0 || ret >= PATH_MAX) {
3522 WARN("Error copying reverse dependencies");
3523 return;
3524 }
3525
3526 if (copy_file(path0, path1) < 0) {
3527 INFO("Error copying reverse dependencies");
3528 return;
3529 }
3530 }
3531
3532 static bool add_rdepends(struct lxc_container *c, struct lxc_container *c0)
3533 {
3534 int ret;
3535 char path[PATH_MAX];
3536 FILE *f;
3537 bool bret;
3538
3539 ret = snprintf(path, PATH_MAX, "%s/%s/lxc_rdepends", c->config_path,
3540 c->name);
3541 if (ret < 0 || ret >= PATH_MAX)
3542 return false;
3543
3544 f = fopen(path, "a");
3545 if (!f)
3546 return false;
3547
3548 bret = true;
3549
3550 /* If anything goes wrong, just return an error. */
3551 if (fprintf(f, "%s\n%s\n", c0->config_path, c0->name) < 0)
3552 bret = false;
3553
3554 if (fclose(f) != 0)
3555 bret = false;
3556
3557 return bret;
3558 }
3559
3560 /*
3561 * If the fs natively supports snapshot clones with no penalty,
3562 * then default to those even if not requested.
3563 * Currently we only do this for btrfs.
3564 */
3565 bool should_default_to_snapshot(struct lxc_container *c0,
3566 struct lxc_container *c1)
3567 {
3568 __do_free char *p0 = NULL, *p1 = NULL;
3569 int ret;
3570 size_t l0 = strlen(c0->config_path) + strlen(c0->name) + 2;
3571 size_t l1 = strlen(c1->config_path) + strlen(c1->name) + 2;
3572 char *rootfs = c0->lxc_conf->rootfs.path;
3573
3574 p0 = must_realloc(NULL, l0 + 1);
3575 p1 = must_realloc(NULL, l1 + 1);
3576 ret = snprintf(p0, l0, "%s/%s", c0->config_path, c0->name);
3577 if (ret < 0 || ret >= l0)
3578 return false;
3579
3580 ret = snprintf(p1, l1, "%s/%s", c1->config_path, c1->name);
3581 if (ret < 0 || ret >= l1)
3582 return false;
3583
3584 if (!is_btrfs_fs(p0) || !is_btrfs_fs(p1))
3585 return false;
3586
3587 if (is_btrfs_subvol(rootfs) <= 0)
3588 return false;
3589
3590 return btrfs_same_fs(p0, p1) == 0;
3591 }
3592
3593 static int copy_storage(struct lxc_container *c0, struct lxc_container *c,
3594 const char *newtype, int flags, const char *bdevdata,
3595 uint64_t newsize)
3596 {
3597 struct lxc_storage *bdev;
3598 bool need_rdep;
3599
3600 if (should_default_to_snapshot(c0, c))
3601 flags |= LXC_CLONE_SNAPSHOT;
3602
3603 bdev = storage_copy(c0, c->name, c->config_path, newtype, flags,
3604 bdevdata, newsize, &need_rdep);
3605 if (!bdev) {
3606 ERROR("Error copying storage.");
3607 return -1;
3608 }
3609
3610 /* Set new rootfs. */
3611 free(c->lxc_conf->rootfs.path);
3612 c->lxc_conf->rootfs.path = strdup(bdev->src);
3613 storage_put(bdev);
3614
3615 if (!c->lxc_conf->rootfs.path) {
3616 ERROR("Out of memory while setting storage path.");
3617 return -1;
3618 }
3619
3620 /* Append a new lxc.rootfs.path entry to the unexpanded config. */
3621 clear_unexp_config_line(c->lxc_conf, "lxc.rootfs.path", false);
3622 if (!do_append_unexp_config_line(c->lxc_conf, "lxc.rootfs.path",
3623 c->lxc_conf->rootfs.path)) {
3624 ERROR("Error saving new rootfs to cloned config.");
3625 return -1;
3626 }
3627
3628 if (flags & LXC_CLONE_SNAPSHOT)
3629 copy_rdepends(c, c0);
3630
3631 if (need_rdep) {
3632 if (!add_rdepends(c, c0))
3633 WARN("Error adding reverse dependency from %s to %s",
3634 c->name, c0->name);
3635 }
3636
3637 mod_all_rdeps(c, true);
3638
3639 return 0;
3640 }
3641
/* Argument bundle handed to clone_update_rootfs() through a void pointer. */
struct clone_update_data {
	struct lxc_container *c0; /* container whose name is exported as LXC_SRC_NAME */
	struct lxc_container *c1; /* container whose rootfs is updated */
	int flags; /* clone flags; LXC_CLONE_KEEPNAME is checked */
	char **hookargs; /* passed on to run_lxc_hooks() for the clone hooks */
};
3648
3649 static int clone_update_rootfs(struct clone_update_data *data)
3650 {
3651 struct lxc_container *c0 = data->c0;
3652 struct lxc_container *c = data->c1;
3653 int flags = data->flags;
3654 char **hookargs = data->hookargs;
3655 int ret = -1;
3656 char path[PATH_MAX];
3657 struct lxc_storage *bdev;
3658 FILE *fout;
3659 struct lxc_conf *conf = c->lxc_conf;
3660
3661 /* update hostname in rootfs */
3662 /* we're going to mount, so run in a clean namespace to simplify cleanup */
3663
3664 if (setgid(0) < 0) {
3665 ERROR("Failed to setgid to 0");
3666 return -1;
3667 }
3668
3669 if (setuid(0) < 0) {
3670 ERROR("Failed to setuid to 0");
3671 return -1;
3672 }
3673
3674 if (setgroups(0, NULL) < 0)
3675 WARN("Failed to clear groups");
3676
3677 if (unshare(CLONE_NEWNS) < 0)
3678 return -1;
3679
3680 bdev = storage_init(c->lxc_conf);
3681 if (!bdev)
3682 return -1;
3683
3684 if (strcmp(bdev->type, "dir") != 0) {
3685 if (unshare(CLONE_NEWNS) < 0) {
3686 ERROR("error unsharing mounts");
3687 storage_put(bdev);
3688 return -1;
3689 }
3690
3691 if (detect_shared_rootfs()) {
3692 if (mount(NULL, "/", NULL, MS_SLAVE|MS_REC, NULL)) {
3693 SYSERROR("Failed to make / rslave");
3694 ERROR("Continuing...");
3695 }
3696 }
3697
3698 if (bdev->ops->mount(bdev) < 0) {
3699 storage_put(bdev);
3700 return -1;
3701 }
3702 } else { /* TODO come up with a better way */
3703 free(bdev->dest);
3704 bdev->dest = strdup(lxc_storage_get_path(bdev->src, bdev->type));
3705 }
3706
3707 if (!lxc_list_empty(&conf->hooks[LXCHOOK_CLONE])) {
3708 /* Start of environment variable setup for hooks */
3709 if (c0->name && setenv("LXC_SRC_NAME", c0->name, 1))
3710 SYSERROR("failed to set environment variable for source container name");
3711
3712 if (setenv("LXC_NAME", c->name, 1))
3713 SYSERROR("failed to set environment variable for container name");
3714
3715 if (conf->rcfile && setenv("LXC_CONFIG_FILE", conf->rcfile, 1))
3716 SYSERROR("failed to set environment variable for config path");
3717
3718 if (bdev->dest && setenv("LXC_ROOTFS_MOUNT", bdev->dest, 1))
3719 SYSERROR("failed to set environment variable for rootfs mount");
3720
3721 if (conf->rootfs.path && setenv("LXC_ROOTFS_PATH", conf->rootfs.path, 1))
3722 SYSERROR("failed to set environment variable for rootfs mount");
3723
3724 if (run_lxc_hooks(c->name, "clone", conf, hookargs)) {
3725 ERROR("Error executing clone hook for %s", c->name);
3726 storage_put(bdev);
3727 return -1;
3728 }
3729 }
3730
3731 if (!(flags & LXC_CLONE_KEEPNAME)) {
3732 ret = snprintf(path, PATH_MAX, "%s/etc/hostname", bdev->dest);
3733 storage_put(bdev);
3734
3735 if (ret < 0 || ret >= PATH_MAX)
3736 return -1;
3737
3738 if (!file_exists(path))
3739 return 0;
3740
3741 if (!(fout = fopen(path, "w"))) {
3742 SYSERROR("unable to open %s: ignoring", path);
3743 return 0;
3744 }
3745
3746 if (fprintf(fout, "%s", c->name) < 0) {
3747 fclose(fout);
3748 return -1;
3749 }
3750
3751 if (fclose(fout) < 0)
3752 return -1;
3753 } else {
3754 storage_put(bdev);
3755 }
3756
3757 return 0;
3758 }
3759
/*
 * Callback adapter: @data is a struct clone_update_data pointer that is
 * forwarded to clone_update_rootfs().
 */
static int clone_update_rootfs_wrapper(void *data)
{
	struct clone_update_data *update = data;

	return clone_update_rootfs(update);
}
3765
3766 /*
3767 * We want to support:
3768 sudo lxc-clone -o o1 -n n1 -s -L|-fssize fssize -v|--vgname vgname \
3769 -p|--lvprefix lvprefix -t|--fstype fstype -B backingstore
3770
3771 -s [ implies overlay]
3772 -s -B overlay
3773
3774 only rootfs gets converted (copied/snapshotted) on clone.
3775 */
3776
/* Create the directory that contains @path.
 *
 * The last '/' in @path is temporarily overwritten with a NUL byte so the
 * parent directory can be handed to do_create_container_dir(); the separator
 * is put back before returning.
 *
 * Returns -1 when @path contains no '/', otherwise the return value of
 * do_create_container_dir().
 */
static int create_file_dirname(char *path, struct lxc_conf *conf)
{
	int rc;
	char *slash;

	slash = strrchr(path, '/');
	if (slash == NULL)
		return -1;

	*slash = '\0';
	rc = do_create_container_dir(path, conf);
	*slash = '/';

	return rc;
}
3791
3792 static struct lxc_container *do_lxcapi_clone(struct lxc_container *c, const char *newname,
3793 const char *lxcpath, int flags,
3794 const char *bdevtype, const char *bdevdata, uint64_t newsize,
3795 char **hookargs)
3796 {
3797 char newpath[PATH_MAX];
3798 int fd, ret;
3799 struct clone_update_data data;
3800 size_t saved_unexp_len;
3801 pid_t pid;
3802 int storage_copied = 0;
3803 char *origroot = NULL, *saved_unexp_conf = NULL;
3804 struct lxc_container *c2 = NULL;
3805
3806 if (!c || !do_lxcapi_is_defined(c))
3807 return NULL;
3808
3809 if (container_mem_lock(c))
3810 return NULL;
3811 if (!is_stopped(c) && !(flags & LXC_CLONE_ALLOW_RUNNING)) {
3812 ERROR("error: Original container (%s) is running. Use --allowrunning if you want to force a snapshot of the running container.", c->name);
3813 goto out;
3814 }
3815
3816 /* Make sure the container doesn't yet exist. */
3817 if (!newname)
3818 newname = c->name;
3819
3820 if (!lxcpath)
3821 lxcpath = do_lxcapi_get_config_path(c);
3822
3823 ret = snprintf(newpath, PATH_MAX, "%s/%s/config", lxcpath, newname);
3824 if (ret < 0 || ret >= PATH_MAX) {
3825 SYSERROR("clone: failed making config pathname");
3826 goto out;
3827 }
3828
3829 if (file_exists(newpath)) {
3830 ERROR("error: clone: %s exists", newpath);
3831 goto out;
3832 }
3833
3834 ret = create_file_dirname(newpath, c->lxc_conf);
3835 if (ret < 0 && errno != EEXIST) {
3836 ERROR("Error creating container dir for %s", newpath);
3837 goto out;
3838 }
3839
3840 /* Copy the configuration. Tweak it as needed. */
3841 if (c->lxc_conf->rootfs.path) {
3842 origroot = c->lxc_conf->rootfs.path;
3843 c->lxc_conf->rootfs.path = NULL;
3844 }
3845
3846 fd = open(newpath, O_WRONLY | O_CREAT | O_CLOEXEC,
3847 S_IRUSR | S_IWUSR | S_IRGRP | S_IWGRP);
3848 if (fd < 0) {
3849 SYSERROR("Failed to open \"%s\"", newpath);
3850 goto out;
3851 }
3852
3853 saved_unexp_conf = c->lxc_conf->unexpanded_config;
3854 saved_unexp_len = c->lxc_conf->unexpanded_len;
3855 c->lxc_conf->unexpanded_config = strdup(saved_unexp_conf);
3856 if (!c->lxc_conf->unexpanded_config) {
3857 close(fd);
3858 goto out;
3859 }
3860
3861 clear_unexp_config_line(c->lxc_conf, "lxc.rootfs.path", false);
3862 write_config(fd, c->lxc_conf);
3863 close(fd);
3864
3865 c->lxc_conf->rootfs.path = origroot;
3866
3867 free(c->lxc_conf->unexpanded_config);
3868 c->lxc_conf->unexpanded_config = saved_unexp_conf;
3869 saved_unexp_conf = NULL;
3870 c->lxc_conf->unexpanded_len = saved_unexp_len;
3871
3872 ret = snprintf(newpath, PATH_MAX, "%s/%s/rootfs", lxcpath, newname);
3873 if (ret < 0 || ret >= PATH_MAX) {
3874 SYSERROR("clone: failed making rootfs pathname");
3875 goto out;
3876 }
3877
3878 ret = mkdir(newpath, 0755);
3879 if (ret < 0) {
3880 /* For an overlay container the rootfs is considered immutable
3881 * and will not have been removed when restoring from a
3882 * snapshot.
3883 */
3884 if (errno != ENOENT &&
3885 !(flags & LXC_STORAGE_INTERNAL_OVERLAY_RESTORE)) {
3886 SYSERROR("Failed to create directory \"%s\"", newpath);
3887 goto out;
3888 }
3889 }
3890
3891 if (am_guest_unpriv()) {
3892 if (chown_mapped_root(newpath, c->lxc_conf) < 0) {
3893 ERROR("Error chowning %s to container root", newpath);
3894 goto out;
3895 }
3896 }
3897
3898 c2 = lxc_container_new(newname, lxcpath);
3899 if (!c2) {
3900 ERROR("clone: failed to create new container (%s %s)", newname,
3901 lxcpath);
3902 goto out;
3903 }
3904
3905 /* copy/snapshot rootfs's */
3906 ret = copy_storage(c, c2, bdevtype, flags, bdevdata, newsize);
3907 if (ret < 0)
3908 goto out;
3909
3910 /* update utsname */
3911 if (!(flags & LXC_CLONE_KEEPNAME)) {
3912 clear_unexp_config_line(c2->lxc_conf, "lxc.utsname", false);
3913 clear_unexp_config_line(c2->lxc_conf, "lxc.uts.name", false);
3914
3915 if (!do_set_config_item_locked(c2, "lxc.uts.name", newname)) {
3916 ERROR("Error setting new hostname");
3917 goto out;
3918 }
3919 }
3920
3921 /* copy hooks */
3922 ret = copyhooks(c, c2);
3923 if (ret < 0) {
3924 ERROR("error copying hooks");
3925 goto out;
3926 }
3927
3928 if (copy_fstab(c, c2) < 0) {
3929 ERROR("error copying fstab");
3930 goto out;
3931 }
3932
3933 /* update macaddrs */
3934 if (!(flags & LXC_CLONE_KEEPMACADDR)) {
3935 if (!network_new_hwaddrs(c2->lxc_conf)) {
3936 ERROR("Error updating mac addresses");
3937 goto out;
3938 }
3939 }
3940
3941 /* Update absolute paths for overlay mount directories. */
3942 if (ovl_update_abs_paths(c2->lxc_conf, c->config_path, c->name, lxcpath, newname) < 0)
3943 goto out;
3944
3945 /* We've now successfully created c2's storage, so clear it out if we
3946 * fail after this.
3947 */
3948 storage_copied = 1;
3949
3950 if (!c2->save_config(c2, NULL))
3951 goto out;
3952
3953 if ((pid = fork()) < 0) {
3954 SYSERROR("fork");
3955 goto out;
3956 }
3957
3958 if (pid > 0) {
3959 ret = wait_for_pid(pid);
3960 if (ret)
3961 goto out;
3962
3963 container_mem_unlock(c);
3964 return c2;
3965 }
3966
3967 data.c0 = c;
3968 data.c1 = c2;
3969 data.flags = flags;
3970 data.hookargs = hookargs;
3971
3972 if (am_guest_unpriv())
3973 ret = userns_exec_full(c->lxc_conf, clone_update_rootfs_wrapper,
3974 &data, "clone_update_rootfs_wrapper");
3975 else
3976 ret = clone_update_rootfs(&data);
3977 if (ret < 0)
3978 _exit(EXIT_FAILURE);
3979
3980 container_mem_unlock(c);
3981 _exit(EXIT_SUCCESS);
3982
3983 out:
3984 container_mem_unlock(c);
3985 if (c2) {
3986 if (!storage_copied)
3987 c2->lxc_conf->rootfs.path = NULL;
3988
3989 c2->destroy(c2);
3990 lxc_container_put(c2);
3991 }
3992
3993 return NULL;
3994 }
3995
3996 static struct lxc_container *lxcapi_clone(struct lxc_container *c, const char *newname,
3997 const char *lxcpath, int flags,
3998 const char *bdevtype, const char *bdevdata, uint64_t newsize,
3999 char **hookargs)
4000 {
4001 struct lxc_container * ret;
4002
4003 current_config = c ? c->lxc_conf : NULL;
4004 ret = do_lxcapi_clone(c, newname, lxcpath, flags, bdevtype, bdevdata, newsize, hookargs);
4005 current_config = NULL;
4006
4007 return ret;
4008 }
4009
4010 static bool do_lxcapi_rename(struct lxc_container *c, const char *newname)
4011 {
4012 struct lxc_storage *bdev;
4013 struct lxc_container *newc;
4014
4015 if (!c || !c->name || !c->config_path || !c->lxc_conf)
4016 return false;
4017
4018 if (has_fs_snapshots(c) || has_snapshots(c)) {
4019 ERROR("Renaming a container with snapshots is not supported");
4020 return false;
4021 }
4022
4023 bdev = storage_init(c->lxc_conf);
4024 if (!bdev) {
4025 ERROR("Failed to find original backing store type");
4026 return false;
4027 }
4028
4029 newc = lxcapi_clone(c, newname, c->config_path, LXC_CLONE_KEEPMACADDR, NULL, bdev->type, 0, NULL);
4030 storage_put(bdev);
4031 if (!newc) {
4032 lxc_container_put(newc);
4033 return false;
4034 }
4035
4036 if (newc && lxcapi_is_defined(newc))
4037 lxc_container_put(newc);
4038
4039 if (!container_destroy(c, NULL)) {
4040 ERROR("Could not destroy existing container %s", c->name);
4041 return false;
4042 }
4043
4044 return true;
4045 }
4046
4047 WRAP_API_1(bool, lxcapi_rename, const char *)
4048
4049 static int lxcapi_attach(struct lxc_container *c, lxc_attach_exec_t exec_function, void *exec_payload, lxc_attach_options_t *options, pid_t *attached_process)
4050 {
4051 int ret;
4052
4053 if (!c)
4054 return -1;
4055
4056 current_config = c->lxc_conf;
4057
4058 ret = lxc_attach(c->name, c->config_path, exec_function, exec_payload, options, attached_process);
4059 current_config = NULL;
4060 return ret;
4061 }
4062
4063 static int do_lxcapi_attach_run_wait(struct lxc_container *c, lxc_attach_options_t *options, const char *program, const char * const argv[])
4064 {
4065 lxc_attach_command_t command;
4066 pid_t pid;
4067 int r;
4068
4069 if (!c)
4070 return -1;
4071
4072 command.program = (char*)program;
4073 command.argv = (char**)argv;
4074
4075 r = lxc_attach(c->name, c->config_path, lxc_attach_run_command, &command, options, &pid);
4076 if (r < 0) {
4077 ERROR("ups");
4078 return r;
4079 }
4080
4081 return lxc_wait_for_pid_status(pid);
4082 }
4083
4084 static int lxcapi_attach_run_wait(struct lxc_container *c, lxc_attach_options_t *options, const char *program, const char * const argv[])
4085 {
4086 int ret;
4087
4088 current_config = c ? c->lxc_conf : NULL;
4089 ret = do_lxcapi_attach_run_wait(c, options, program, argv);
4090 current_config = NULL;
4091
4092 return ret;
4093 }
4094
4095 static int get_next_index(const char *lxcpath, char *cname)
4096 {
4097 __do_free char *fname = NULL;
4098 struct stat sb;
4099 int i = 0, ret;
4100
4101 fname = must_realloc(NULL, strlen(lxcpath) + 20);
4102
4103 for (;;) {
4104 sprintf(fname, "%s/snap%d", lxcpath, i);
4105
4106 ret = stat(fname, &sb);
4107 if (ret != 0)
4108 return i;
4109
4110 i++;
4111 }
4112 }
4113
4114 static bool get_snappath_dir(struct lxc_container *c, char *snappath)
4115 {
4116 int ret;
4117
4118 /*
4119 * If the old style snapshot path exists, use it
4120 * /var/lib/lxc -> /var/lib/lxcsnaps
4121 */
4122 ret = snprintf(snappath, PATH_MAX, "%ssnaps", c->config_path);
4123 if (ret < 0 || ret >= PATH_MAX)
4124 return false;
4125
4126 if (dir_exists(snappath)) {
4127 ret = snprintf(snappath, PATH_MAX, "%ssnaps/%s", c->config_path, c->name);
4128 if (ret < 0 || ret >= PATH_MAX)
4129 return false;
4130
4131 return true;
4132 }
4133
4134 /*
4135 * Use the new style path
4136 * /var/lib/lxc -> /var/lib/lxc + c->name + /snaps + \0
4137 */
4138 ret = snprintf(snappath, PATH_MAX, "%s/%s/snaps", c->config_path, c->name);
4139 if (ret < 0 || ret >= PATH_MAX)
4140 return false;
4141
4142 return true;
4143 }
4144
4145 static int do_lxcapi_snapshot(struct lxc_container *c, const char *commentfile)
4146 {
4147 __do_free char *dfnam = NULL;
4148 int i, flags, ret;
4149 time_t timer;
4150 struct tm tm_info;
4151 struct lxc_container *c2;
4152 char snappath[PATH_MAX], newname[20];
4153 char buffer[25];
4154 FILE *f;
4155
4156 if (!c || !lxcapi_is_defined(c))
4157 return -1;
4158
4159 if (!storage_can_backup(c->lxc_conf)) {
4160 ERROR("%s's backing store cannot be backed up", c->name);
4161 ERROR("Your container must use another backing store type");
4162 return -1;
4163 }
4164
4165 if (!get_snappath_dir(c, snappath))
4166 return -1;
4167
4168 i = get_next_index(snappath, c->name);
4169
4170 if (mkdir_p(snappath, 0755) < 0) {
4171 ERROR("Failed to create snapshot directory %s", snappath);
4172 return -1;
4173 }
4174
4175 ret = snprintf(newname, 20, "snap%d", i);
4176 if (ret < 0 || ret >= 20)
4177 return -1;
4178
4179 /*
4180 * We pass LXC_CLONE_SNAPSHOT to make sure that a rdepends file entry is
4181 * created in the original container
4182 */
4183 flags = LXC_CLONE_SNAPSHOT | LXC_CLONE_KEEPMACADDR | LXC_CLONE_KEEPNAME |
4184 LXC_CLONE_KEEPBDEVTYPE | LXC_CLONE_MAYBE_SNAPSHOT;
4185 if (storage_is_dir(c->lxc_conf)) {
4186 ERROR("Snapshot of directory-backed container requested");
4187 ERROR("Making a copy-clone. If you do want snapshots, then");
4188 ERROR("please create overlay clone first, snapshot that");
4189 ERROR("and keep the original container pristine");
4190 flags &= ~LXC_CLONE_SNAPSHOT | LXC_CLONE_MAYBE_SNAPSHOT;
4191 }
4192
4193 c2 = do_lxcapi_clone(c, newname, snappath, flags, NULL, NULL, 0, NULL);
4194 if (!c2) {
4195 ERROR("Failed to clone of %s:%s", c->config_path, c->name);
4196 return -1;
4197 }
4198
4199 lxc_container_put(c2);
4200
4201 /* Now write down the creation time. */
4202 time(&timer);
4203
4204 if (!localtime_r(&timer, &tm_info)) {
4205 ERROR("Failed to get localtime");
4206 return -1;
4207 }
4208
4209 strftime(buffer, 25, "%Y:%m:%d %H:%M:%S", &tm_info);
4210
4211 dfnam = must_realloc(NULL, strlen(snappath) + strlen(newname) + 5);
4212 sprintf(dfnam, "%s/%s/ts", snappath, newname);
4213 f = fopen(dfnam, "w");
4214 if (!f) {
4215 ERROR("Failed to open %s", dfnam);
4216 return -1;
4217 }
4218
4219 if (fprintf(f, "%s", buffer) < 0) {
4220 SYSERROR("Writing timestamp");
4221 fclose(f);
4222 return -1;
4223 }
4224
4225 ret = fclose(f);
4226 if (ret != 0) {
4227 SYSERROR("Writing timestamp");
4228 return -1;
4229 }
4230
4231 if (commentfile) {
4232 __do_free char *path = NULL;
4233 /* $p / $name / comment \0 */
4234 int len = strlen(snappath) + strlen(newname) + 10;
4235
4236 path = must_realloc(NULL, len);
4237 sprintf(path, "%s/%s/comment", snappath, newname);
4238 return copy_file(commentfile, path) < 0 ? -1 : i;
4239 }
4240
4241 return i;
4242 }
4243
4244 WRAP_API_1(int, lxcapi_snapshot, const char *)
4245
4246 static void lxcsnap_free(struct lxc_snapshot *s)
4247 {
4248 free(s->name);
4249 free(s->comment_pathname);
4250 free(s->timestamp);
4251 free(s->lxcpath);
4252 }
4253
/* Build "<snappath>/<name>/comment" in a freshly allocated buffer.
 *
 * Returns the string, which the caller must free(), or NULL when the
 * allocation or the formatting fails.
 */
static char *get_snapcomment_path(char* snappath, char *name)
{
	char *result;
	int written;
	/* $snappath / $name /comment \0 */
	int size = strlen(snappath) + strlen(name) + 10;

	result = malloc(size);
	if (!result)
		return NULL;

	written = snprintf(result, size, "%s/%s/comment", snappath, name);
	if (written < 0 || written >= size) {
		free(result);
		return NULL;
	}

	return result;
}
4270
4271 static char *get_timestamp(char* snappath, char *name)
4272 {
4273 char path[PATH_MAX], *s = NULL;
4274 int ret, len;
4275 FILE *fin;
4276
4277 ret = snprintf(path, PATH_MAX, "%s/%s/ts", snappath, name);
4278 if (ret < 0 || ret >= PATH_MAX)
4279 return NULL;
4280
4281 fin = fopen(path, "r");
4282 if (!fin)
4283 return NULL;
4284
4285 (void) fseek(fin, 0, SEEK_END);
4286 len = ftell(fin);
4287 (void) fseek(fin, 0, SEEK_SET);
4288 if (len > 0) {
4289 s = malloc(len+1);
4290 if (s) {
4291 s[len] = '\0';
4292 if (fread(s, 1, len, fin) != len) {
4293 SYSERROR("reading timestamp");
4294 free(s);
4295 s = NULL;
4296 }
4297 }
4298 }
4299
4300 fclose(fin);
4301 return s;
4302 }
4303
4304 static int do_lxcapi_snapshot_list(struct lxc_container *c, struct lxc_snapshot **ret_snaps)
4305 {
4306 char snappath[PATH_MAX], path2[PATH_MAX];
4307 int count = 0, ret;
4308 struct dirent *direntp;
4309 struct lxc_snapshot *snaps =NULL, *nsnaps;
4310 DIR *dir;
4311
4312 if (!c || !lxcapi_is_defined(c))
4313 return -1;
4314
4315 if (!get_snappath_dir(c, snappath)) {
4316 ERROR("path name too long");
4317 return -1;
4318 }
4319
4320 dir = opendir(snappath);
4321 if (!dir) {
4322 INFO("Failed to open %s - assuming no snapshots", snappath);
4323 return 0;
4324 }
4325
4326 while ((direntp = readdir(dir))) {
4327 if (!strcmp(direntp->d_name, "."))
4328 continue;
4329
4330 if (!strcmp(direntp->d_name, ".."))
4331 continue;
4332
4333 ret = snprintf(path2, PATH_MAX, "%s/%s/config", snappath, direntp->d_name);
4334 if (ret < 0 || ret >= PATH_MAX) {
4335 ERROR("pathname too long");
4336 goto out_free;
4337 }
4338
4339 if (!file_exists(path2))
4340 continue;
4341
4342 nsnaps = realloc(snaps, (count + 1)*sizeof(*snaps));
4343 if (!nsnaps) {
4344 SYSERROR("Out of memory");
4345 goto out_free;
4346 }
4347
4348 snaps = nsnaps;
4349 snaps[count].free = lxcsnap_free;
4350 snaps[count].name = strdup(direntp->d_name);
4351 if (!snaps[count].name)
4352 goto out_free;
4353
4354 snaps[count].lxcpath = strdup(snappath);
4355 if (!snaps[count].lxcpath) {
4356 free(snaps[count].name);
4357 goto out_free;
4358 }
4359
4360 snaps[count].comment_pathname = get_snapcomment_path(snappath, direntp->d_name);
4361 snaps[count].timestamp = get_timestamp(snappath, direntp->d_name);
4362 count++;
4363 }
4364
4365 if (closedir(dir))
4366 WARN("Failed to close directory");
4367
4368 *ret_snaps = snaps;
4369 return count;
4370
4371 out_free:
4372 if (snaps) {
4373 int i;
4374
4375 for (i=0; i<count; i++)
4376 lxcsnap_free(&snaps[i]);
4377
4378 free(snaps);
4379 }
4380
4381 if (closedir(dir))
4382 WARN("Failed to close directory");
4383
4384 return -1;
4385 }
4386
4387 WRAP_API_1(int, lxcapi_snapshot_list, struct lxc_snapshot **)
4388
4389 static bool do_lxcapi_snapshot_restore(struct lxc_container *c, const char *snapname, const char *newname)
4390 {
4391 char clonelxcpath[PATH_MAX];
4392 int flags = 0;
4393 struct lxc_container *snap, *rest;
4394 struct lxc_storage *bdev;
4395 bool b = false;
4396
4397 if (!c || !c->name || !c->config_path)
4398 return false;
4399
4400 if (has_fs_snapshots(c)) {
4401 ERROR("container rootfs has dependent snapshots");
4402 return false;
4403 }
4404
4405 bdev = storage_init(c->lxc_conf);
4406 if (!bdev) {
4407 ERROR("Failed to find original backing store type");
4408 return false;
4409 }
4410
4411 /* For an overlay container the rootfs is considered immutable
4412 * and cannot be removed when restoring from a snapshot. We pass this
4413 * internal flag along to communicate this to various parts of the
4414 * codebase.
4415 */
4416 if (!strcmp(bdev->type, "overlay") || !strcmp(bdev->type, "overlayfs"))
4417 bdev->flags |= LXC_STORAGE_INTERNAL_OVERLAY_RESTORE;
4418
4419 if (!newname)
4420 newname = c->name;
4421
4422 if (!get_snappath_dir(c, clonelxcpath)) {
4423 storage_put(bdev);
4424 return false;
4425 }
4426 /* how should we lock this? */
4427
4428 snap = lxc_container_new(snapname, clonelxcpath);
4429 if (!snap || !lxcapi_is_defined(snap)) {
4430 ERROR("Could not open snapshot %s", snapname);
4431
4432 if (snap)
4433 lxc_container_put(snap);
4434
4435 storage_put(bdev);
4436 return false;
4437 }
4438
4439 if (!strcmp(c->name, newname)) {
4440 if (!container_destroy(c, bdev)) {
4441 ERROR("Could not destroy existing container %s", newname);
4442 lxc_container_put(snap);
4443 storage_put(bdev);
4444 return false;
4445 }
4446 }
4447
4448 if (strcmp(bdev->type, "dir") != 0 && strcmp(bdev->type, "loop") != 0)
4449 flags = LXC_CLONE_SNAPSHOT | LXC_CLONE_MAYBE_SNAPSHOT;
4450
4451 if (!strcmp(bdev->type, "overlay") || !strcmp(bdev->type, "overlayfs"))
4452 flags |= LXC_STORAGE_INTERNAL_OVERLAY_RESTORE;
4453
4454 rest = lxcapi_clone(snap, newname, c->config_path, flags, bdev->type,
4455 NULL, 0, NULL);
4456 storage_put(bdev);
4457 if (rest && lxcapi_is_defined(rest))
4458 b = true;
4459
4460 if (rest)
4461 lxc_container_put(rest);
4462
4463 lxc_container_put(snap);
4464 return b;
4465 }
4466
4467 WRAP_API_2(bool, lxcapi_snapshot_restore, const char *, const char *)
4468
/* Open the container @snapname below @clonelxcpath and destroy it.
 *
 * Returns true when the snapshot was destroyed, false when it could not be
 * opened or destroyed.
 */
static bool do_snapshot_destroy(const char *snapname, const char *clonelxcpath)
{
	struct lxc_container *snap;
	bool destroyed;

	snap = lxc_container_new(snapname, clonelxcpath);
	if (!snap) {
		ERROR("Could not find snapshot %s", snapname);
		return false;
	}

	destroyed = do_lxcapi_destroy(snap);
	if (!destroyed)
		ERROR("Could not destroy snapshot %s", snapname);

	lxc_container_put(snap);
	return destroyed;
}
4493
/* Destroy every snapshot found in directory @path and then try to remove
 * @path itself.
 *
 * A snapshot that cannot be destroyed does not stop the iteration; it only
 * makes the function return false. A failing rmdir() is logged but does not
 * affect the return value.
 */
static bool remove_all_snapshots(const char *path)
{
	struct dirent *entry;
	bool all_removed = true;
	DIR *dp;

	dp = opendir(path);
	if (!dp) {
		SYSERROR("opendir on snapshot path %s", path);
		return false;
	}

	while ((entry = readdir(dp)) != NULL) {
		const char *entry_name = entry->d_name;

		if (strcmp(entry_name, ".") == 0 || strcmp(entry_name, "..") == 0)
			continue;

		if (!do_snapshot_destroy(entry_name, path))
			all_removed = false;
	}

	closedir(dp);

	if (rmdir(path))
		SYSERROR("Error removing directory %s", path);

	return all_removed;
}
4526
4527 static bool do_lxcapi_snapshot_destroy(struct lxc_container *c, const char *snapname)
4528 {
4529 char clonelxcpath[PATH_MAX];
4530
4531 if (!c || !c->name || !c->config_path || !snapname)
4532 return false;
4533
4534 if (!get_snappath_dir(c, clonelxcpath))
4535 return false;
4536
4537 return do_snapshot_destroy(snapname, clonelxcpath);
4538 }
4539
4540 WRAP_API_1(bool, lxcapi_snapshot_destroy, const char *)
4541
4542 static bool do_lxcapi_snapshot_destroy_all(struct lxc_container *c)
4543 {
4544 char clonelxcpath[PATH_MAX];
4545
4546 if (!c || !c->name || !c->config_path)
4547 return false;
4548
4549 if (!get_snappath_dir(c, clonelxcpath))
4550 return false;
4551
4552 return remove_all_snapshots(clonelxcpath);
4553 }
4554
4555 WRAP_API(bool, lxcapi_snapshot_destroy_all)
4556
4557 static bool do_lxcapi_may_control(struct lxc_container *c)
4558 {
4559 if (!c)
4560 return false;
4561
4562 return lxc_try_cmd(c->name, c->config_path) == 0;
4563 }
4564
4565 WRAP_API(bool, lxcapi_may_control)
4566
4567 static bool do_add_remove_node(pid_t init_pid, const char *path, bool add,
4568 struct stat *st)
4569 {
4570 int ret;
4571 char *tmp;
4572 pid_t pid;
4573 char chrootpath[PATH_MAX];
4574 char *directory_path = NULL;
4575
4576 pid = fork();
4577 if (pid < 0) {
4578 SYSERROR("Failed to fork()");
4579 return false;
4580 }
4581
4582 if (pid) {
4583 ret = wait_for_pid(pid);
4584 if (ret != 0) {
4585 ERROR("Failed to create device node");
4586 return false;
4587 }
4588
4589 return true;
4590 }
4591
4592 /* prepare the path */
4593 ret = snprintf(chrootpath, PATH_MAX, "/proc/%d/root", init_pid);
4594 if (ret < 0 || ret >= PATH_MAX)
4595 return false;
4596
4597 ret = chroot(chrootpath);
4598 if (ret < 0)
4599 _exit(EXIT_FAILURE);
4600
4601 ret = chdir("/");
4602 if (ret < 0)
4603 _exit(EXIT_FAILURE);
4604
4605 /* remove path if it exists */
4606 ret = faccessat(AT_FDCWD, path, F_OK, AT_SYMLINK_NOFOLLOW);
4607 if(ret == 0) {
4608 ret = unlink(path);
4609 if (ret < 0) {
4610 SYSERROR("Failed to remove \"%s\"", path);
4611 _exit(EXIT_FAILURE);
4612 }
4613 }
4614
4615 if (!add)
4616 _exit(EXIT_SUCCESS);
4617
4618 /* create any missing directories */
4619 tmp = strdup(path);
4620 if (!tmp)
4621 _exit(EXIT_FAILURE);
4622
4623 directory_path = dirname(tmp);
4624 ret = mkdir_p(directory_path, 0755);
4625 if (ret < 0 && errno != EEXIST) {
4626 SYSERROR("Failed to create path \"%s\"", directory_path);
4627 free(tmp);
4628 _exit(EXIT_FAILURE);
4629 }
4630
4631 /* create the device node */
4632 ret = mknod(path, st->st_mode, st->st_rdev);
4633 free(tmp);
4634 if (ret < 0) {
4635 SYSERROR("Failed to create device node at \"%s\"", path);
4636 _exit(EXIT_FAILURE);
4637 }
4638
4639 _exit(EXIT_SUCCESS);
4640 }
4641
4642 static bool add_remove_device_node(struct lxc_container *c, const char *src_path, const char *dest_path, bool add)
4643 {
4644 int ret;
4645 struct stat st;
4646 char value[LXC_MAX_BUFFER];
4647 const char *p;
4648 pid_t init_pid;
4649
4650 /* make sure container is running */
4651 if (!do_lxcapi_is_running(c)) {
4652 ERROR("container is not running");
4653 return false;
4654 }
4655
4656 /* use src_path if dest_path is NULL otherwise use dest_path */
4657 p = dest_path ? dest_path : src_path;
4658
4659 /* make sure we can access p */
4660 if(access(p, F_OK) < 0 || stat(p, &st) < 0)
4661 return false;
4662
4663 /* continue if path is character device or block device */
4664 if (S_ISCHR(st.st_mode))
4665 ret = snprintf(value, LXC_MAX_BUFFER, "c %d:%d rwm", major(st.st_rdev), minor(st.st_rdev));
4666 else if (S_ISBLK(st.st_mode))
4667 ret = snprintf(value, LXC_MAX_BUFFER, "b %d:%d rwm", major(st.st_rdev), minor(st.st_rdev));
4668 else
4669 return false;
4670
4671 /* check snprintf return code */
4672 if (ret < 0 || ret >= LXC_MAX_BUFFER)
4673 return false;
4674
4675 init_pid = do_lxcapi_init_pid(c);
4676 if (init_pid < 0) {
4677 ERROR("Failed to get init pid");
4678 return false;
4679 }
4680
4681 if (!do_add_remove_node(init_pid, p, add, &st))
4682 return false;
4683
4684 /* add or remove device to/from cgroup access list */
4685 if (add) {
4686 if (!do_lxcapi_set_cgroup_item(c, "devices.allow", value)) {
4687 ERROR("set_cgroup_item failed while adding the device node");
4688 return false;
4689 }
4690 } else {
4691 if (!do_lxcapi_set_cgroup_item(c, "devices.deny", value)) {
4692 ERROR("set_cgroup_item failed while removing the device node");
4693 return false;
4694 }
4695 }
4696
4697 return true;
4698 }
4699
4700 static bool do_lxcapi_add_device_node(struct lxc_container *c, const char *src_path, const char *dest_path)
4701 {
4702 // cannot mknod if we're not privileged wrt init_user_ns
4703 if (am_host_unpriv()) {
4704 ERROR(LXC_UNPRIV_EOPNOTSUPP, __FUNCTION__);
4705 return false;
4706 }
4707
4708 return add_remove_device_node(c, src_path, dest_path, true);
4709 }
4710
4711 WRAP_API_2(bool, lxcapi_add_device_node, const char *, const char *)
4712
4713 static bool do_lxcapi_remove_device_node(struct lxc_container *c, const char *src_path, const char *dest_path)
4714 {
4715 if (am_guest_unpriv()) {
4716 ERROR(LXC_UNPRIV_EOPNOTSUPP, __FUNCTION__);
4717 return false;
4718 }
4719
4720 return add_remove_device_node(c, src_path, dest_path, false);
4721 }
4722
4723 WRAP_API_2(bool, lxcapi_remove_device_node, const char *, const char *)
4724
4725 static bool do_lxcapi_attach_interface(struct lxc_container *c,
4726 const char *ifname,
4727 const char *dst_ifname)
4728 {
4729 pid_t init_pid;
4730 int ret = 0;
4731
4732 if (am_guest_unpriv()) {
4733 ERROR(LXC_UNPRIV_EOPNOTSUPP, __FUNCTION__);
4734 return false;
4735 }
4736
4737 if (!ifname) {
4738 ERROR("No source interface name given");
4739 return false;
4740 }
4741
4742 ret = lxc_netdev_isup(ifname);
4743 if (ret > 0) {
4744 /* netdev of ifname is up. */
4745 ret = lxc_netdev_down(ifname);
4746 if (ret)
4747 goto err;
4748 }
4749
4750 init_pid = do_lxcapi_init_pid(c);
4751 if (init_pid < 0) {
4752 ERROR("Failed to get init pid");
4753 goto err;
4754 }
4755
4756 ret = lxc_netdev_move_by_name(ifname, init_pid, dst_ifname);
4757 if (ret)
4758 goto err;
4759
4760 INFO("Moved network device \"%s\" to network namespace of %d", ifname, init_pid);
4761 return true;
4762
4763 err:
4764 return false;
4765 }
4766
4767 WRAP_API_2(bool, lxcapi_attach_interface, const char *, const char *)
4768
4769 static bool do_lxcapi_detach_interface(struct lxc_container *c,
4770 const char *ifname,
4771 const char *dst_ifname)
4772 {
4773 int ret;
4774 pid_t pid, pid_outside;
4775
4776 /*
4777 * TODO - if this is a physical device, then we need am_host_unpriv.
4778 * But for other types guest privilege suffices.
4779 */
4780 if (am_guest_unpriv()) {
4781 ERROR(LXC_UNPRIV_EOPNOTSUPP, __FUNCTION__);
4782 return false;
4783 }
4784
4785 if (!ifname) {
4786 ERROR("No source interface name given");
4787 return false;
4788 }
4789
4790 pid_outside = lxc_raw_getpid();
4791 pid = fork();
4792 if (pid < 0) {
4793 ERROR("Failed to fork");
4794 return false;
4795 }
4796
4797 if (pid == 0) { /* child */
4798 pid_t init_pid;
4799
4800 init_pid = do_lxcapi_init_pid(c);
4801 if (init_pid < 0) {
4802 ERROR("Failed to get init pid");
4803 _exit(EXIT_FAILURE);
4804 }
4805 if (!switch_to_ns(init_pid, "net")) {
4806 ERROR("Failed to enter network namespace");
4807 _exit(EXIT_FAILURE);
4808 }
4809
4810 ret = lxc_netdev_isup(ifname);
4811 if (ret < 0) {
4812 ERROR("Failed to determine whether network device \"%s\" is up", ifname);
4813 _exit(EXIT_FAILURE);
4814 }
4815
4816 /* netdev of ifname is up. */
4817 if (ret) {
4818 ret = lxc_netdev_down(ifname);
4819 if (ret) {
4820 ERROR("Failed to set network device \"%s\" down", ifname);
4821 _exit(EXIT_FAILURE);
4822 }
4823 }
4824
4825 ret = lxc_netdev_move_by_name(ifname, pid_outside, dst_ifname);
4826 /* -EINVAL means there is no netdev named as ifname. */
4827 if (ret < 0) {
4828 if (ret == -EINVAL)
4829 ERROR("Network device \"%s\" not found", ifname);
4830 else
4831 ERROR("Failed to remove network device \"%s\"", ifname);
4832
4833 _exit(EXIT_FAILURE);
4834 }
4835
4836 _exit(EXIT_SUCCESS);
4837 }
4838
4839 ret = wait_for_pid(pid);
4840 if (ret != 0)
4841 return false;
4842
4843 INFO("Moved network device \"%s\" to network namespace of %d", ifname, pid_outside);
4844 return true;
4845 }
4846
4847 WRAP_API_2(bool, lxcapi_detach_interface, const char *, const char *)
4848
4849 static int do_lxcapi_migrate(struct lxc_container *c, unsigned int cmd,
4850 struct migrate_opts *opts, unsigned int size)
4851 {
4852 int ret = -1;
4853 struct migrate_opts *valid_opts = opts;
4854 uint64_t features_to_check = 0;
4855
4856 /* If the caller has a bigger (newer) struct migrate_opts, let's make
4857 * sure that the stuff on the end is zero, i.e. that they didn't ask us
4858 * to do anything special.
4859 */
4860 if (size > sizeof(*opts)) {
4861 unsigned char *addr;
4862 unsigned char *end;
4863
4864 addr = (void *)opts + sizeof(*opts);
4865 end = (void *)opts + size;
4866
4867 for (; addr < end; addr++)
4868 if (*addr)
4869 return -E2BIG;
4870 }
4871
4872 /* If the caller has a smaller struct, let's zero out the end for them
4873 * so we don't accidentally use bits of it that they didn't know about
4874 * to initialize.
4875 */
4876 if (size < sizeof(*opts)) {
4877 valid_opts = malloc(sizeof(*opts));
4878 if (!valid_opts)
4879 return -ENOMEM;
4880
4881 memset(valid_opts, 0, sizeof(*opts));
4882 memcpy(valid_opts, opts, size);
4883 }
4884
4885 switch (cmd) {
4886 case MIGRATE_PRE_DUMP:
4887 if (!do_lxcapi_is_running(c)) {
4888 ERROR("container is not running");
4889 goto on_error;
4890 }
4891
4892 ret = !__criu_pre_dump(c, valid_opts);
4893 break;
4894 case MIGRATE_DUMP:
4895 if (!do_lxcapi_is_running(c)) {
4896 ERROR("container is not running");
4897 goto on_error;
4898 }
4899
4900 ret = !__criu_dump(c, valid_opts);
4901 break;
4902 case MIGRATE_RESTORE:
4903 if (do_lxcapi_is_running(c)) {
4904 ERROR("container is already running");
4905 goto on_error;
4906 }
4907
4908 ret = !__criu_restore(c, valid_opts);
4909 break;
4910 case MIGRATE_FEATURE_CHECK:
4911 features_to_check = valid_opts->features_to_check;
4912 ret = !__criu_check_feature(&features_to_check);
4913 if (ret) {
4914 /* Something went wrong. Let's let the caller
4915 * know which feature checks failed. */
4916 valid_opts->features_to_check = features_to_check;
4917 }
4918 break;
4919 default:
4920 ERROR("invalid migrate command %u", cmd);
4921 ret = -EINVAL;
4922 }
4923
4924 on_error:
4925 if (size < sizeof(*opts))
4926 free(valid_opts);
4927
4928 return ret;
4929 }
4930
4931 WRAP_API_3(int, lxcapi_migrate, unsigned int, struct migrate_opts *, unsigned int)
4932
4933 static bool do_lxcapi_checkpoint(struct lxc_container *c, char *directory, bool stop, bool verbose)
4934 {
4935 struct migrate_opts opts;
4936
4937 memset(&opts, 0, sizeof(opts));
4938
4939 opts.directory = directory;
4940 opts.stop = stop;
4941 opts.verbose = verbose;
4942
4943 return !do_lxcapi_migrate(c, MIGRATE_DUMP, &opts, sizeof(opts));
4944 }
4945
4946 WRAP_API_3(bool, lxcapi_checkpoint, char *, bool, bool)
4947
4948 static bool do_lxcapi_restore(struct lxc_container *c, char *directory, bool verbose)
4949 {
4950 struct migrate_opts opts;
4951
4952 memset(&opts, 0, sizeof(opts));
4953
4954 opts.directory = directory;
4955 opts.verbose = verbose;
4956
4957 return !do_lxcapi_migrate(c, MIGRATE_RESTORE, &opts, sizeof(opts));
4958 }
4959
4960 WRAP_API_2(bool, lxcapi_restore, char *, bool)
4961
4962 /* @st_mode is the st_mode field of the stat(source) return struct */
4963 static int create_mount_target(const char *dest, mode_t st_mode)
4964 {
4965 char *dirdup, *destdirname;
4966 int ret;
4967
4968 dirdup = strdup(dest);
4969 if (!dirdup) {
4970 SYSERROR("Failed to duplicate target name \"%s\"", dest);
4971 return -1;
4972 }
4973 destdirname = dirname(dirdup);
4974
4975 ret = mkdir_p(destdirname, 0755);
4976 if (ret < 0) {
4977 SYSERROR("Failed to create \"%s\"", destdirname);
4978 free(dirdup);
4979 return ret;
4980 }
4981 free(dirdup);
4982
4983 (void)remove(dest);
4984
4985 if (S_ISDIR(st_mode))
4986 ret = mkdir(dest, 0000);
4987 else
4988 ret = mknod(dest, S_IFREG | 0000, 0);
4989
4990 if (ret == 0)
4991 TRACE("Created mount target \"%s\"", dest);
4992 else if (ret < 0 && errno != EEXIST) {
4993 SYSERROR("Failed to create mount target \"%s\"", dest);
4994 return -1;
4995 }
4996
4997 return 0;
4998 }
4999
5000 static int do_lxcapi_mount(struct lxc_container *c, const char *source,
5001 const char *target, const char *filesystemtype,
5002 unsigned long mountflags, const void *data,
5003 struct lxc_mount *mnt)
5004 {
5005 char *suff, *sret;
5006 char template[PATH_MAX], path[PATH_MAX];
5007 pid_t pid, init_pid;
5008 struct stat sb;
5009 bool is_dir;
5010 int ret = -1, fd = -EBADF;
5011
5012 if (!c || !c->lxc_conf) {
5013 ERROR("Container or configuration is NULL");
5014 return -EINVAL;
5015 }
5016
5017 if (!c->lxc_conf->shmount.path_host) {
5018 ERROR("Host path to shared mountpoint must be specified in the config\n");
5019 return -EINVAL;
5020 }
5021
5022 ret = snprintf(template, sizeof(template), "%s/.lxcmount_XXXXXX", c->lxc_conf->shmount.path_host);
5023 if (ret < 0 || (size_t)ret >= sizeof(template)) {
5024 SYSERROR("Error writing shmounts tempdir name");
5025 goto out;
5026 }
5027
5028 /* Create a temporary file / dir under the shared mountpoint */
5029 if (!source || strcmp(source, "") == 0) {
5030 /* If source is not specified, maybe we want to mount a filesystem? */
5031 sb.st_mode = S_IFDIR;
5032 } else {
5033 ret = stat(source, &sb);
5034 if (ret < 0) {
5035 SYSERROR("Error getting stat info about the source \"%s\"", source);
5036 goto out;
5037 }
5038 }
5039
5040 is_dir = (S_ISDIR(sb.st_mode) != 0);
5041 if (is_dir) {
5042 sret = mkdtemp(template);
5043 if (!sret) {
5044 SYSERROR("Could not create shmounts temporary dir");
5045 goto out;
5046 }
5047 } else {
5048 fd = lxc_make_tmpfile(template, false);
5049 if (fd < 0) {
5050 SYSERROR("Could not create shmounts temporary file");
5051 goto out;
5052 }
5053 }
5054
5055 /* Do the fork */
5056 pid = fork();
5057 if (pid < 0) {
5058 SYSERROR("Could not fork");
5059 goto out;
5060 }
5061
5062 if (pid == 0) {
5063 /* Do the mount */
5064 ret = mount(source, template, filesystemtype, mountflags, data);
5065 if (ret < 0) {
5066 SYSERROR("Failed to mount onto \"%s\"", template);
5067 _exit(EXIT_FAILURE);
5068 }
5069 TRACE("Mounted \"%s\" onto \"%s\"", source, template);
5070
5071 init_pid = do_lxcapi_init_pid(c);
5072 if (init_pid < 0) {
5073 ERROR("Failed to obtain container's init pid");
5074 _exit(EXIT_FAILURE);
5075 }
5076
5077 /* Enter the container namespaces */
5078 if (!lxc_list_empty(&c->lxc_conf->id_map)) {
5079 if (!switch_to_ns(init_pid, "user")) {
5080 ERROR("Failed to enter user namespace");
5081 _exit(EXIT_FAILURE);
5082 }
5083
5084 if (!lxc_switch_uid_gid(0, 0))
5085 _exit(EXIT_FAILURE);
5086 }
5087
5088 if (!switch_to_ns(init_pid, "mnt")) {
5089 ERROR("Failed to enter mount namespace");
5090 _exit(EXIT_FAILURE);
5091 }
5092
5093 ret = create_mount_target(target, sb.st_mode);
5094 if (ret < 0)
5095 _exit(EXIT_FAILURE);
5096
5097 suff = strrchr(template, '/');
5098 if (!suff)
5099 _exit(EXIT_FAILURE);
5100
5101 ret = snprintf(path, sizeof(path), "%s%s", c->lxc_conf->shmount.path_cont, suff);
5102 if (ret < 0 || (size_t)ret >= sizeof(path)) {
5103 SYSERROR("Error writing container mountpoint name");
5104 _exit(EXIT_FAILURE);
5105 }
5106
5107 ret = mount(path, target, NULL, MS_MOVE | MS_REC, NULL);
5108 if (ret < 0) {
5109 SYSERROR("Failed to move the mount from \"%s\" to \"%s\"", path, target);
5110 _exit(EXIT_FAILURE);
5111 }
5112 TRACE("Moved mount from \"%s\" to \"%s\"", path, target);
5113
5114 _exit(EXIT_SUCCESS);
5115 }
5116
5117 ret = wait_for_pid(pid);
5118 if (ret < 0) {
5119 SYSERROR("Wait for the child with pid %ld failed", (long) pid);
5120 goto out;
5121 }
5122
5123 ret = 0;
5124
5125 (void)umount2(template, MNT_DETACH);
5126 if (is_dir)
5127 (void)rmdir(template);
5128 else
5129 (void)unlink(template);
5130
5131 out:
5132 if (fd >= 0)
5133 close(fd);
5134
5135 return ret;
5136 }
5137
5138 WRAP_API_6(int, lxcapi_mount, const char *, const char *, const char *,
5139 unsigned long, const void *, struct lxc_mount *)
5140
5141 static int do_lxcapi_umount(struct lxc_container *c, const char *target,
5142 unsigned long flags, struct lxc_mount *mnt)
5143 {
5144 pid_t pid, init_pid;
5145 int ret = -1;
5146
5147 if (!c || !c->lxc_conf) {
5148 ERROR("Container or configuration is NULL");
5149 return -EINVAL;
5150 }
5151
5152 /* Do the fork */
5153 pid = fork();
5154 if (pid < 0) {
5155 SYSERROR("Could not fork");
5156 return -1;
5157 }
5158
5159 if (pid == 0) {
5160 init_pid = do_lxcapi_init_pid(c);
5161 if (init_pid < 0) {
5162 ERROR("Failed to obtain container's init pid");
5163 _exit(EXIT_FAILURE);
5164 }
5165
5166 /* Enter the container namespaces */
5167 if (!lxc_list_empty(&c->lxc_conf->id_map)) {
5168 if (!switch_to_ns(init_pid, "user")) {
5169 ERROR("Failed to enter user namespace");
5170 _exit(EXIT_FAILURE);
5171 }
5172 }
5173
5174 if (!switch_to_ns(init_pid, "mnt")) {
5175 ERROR("Failed to enter mount namespace");
5176 _exit(EXIT_FAILURE);
5177 }
5178
5179 /* Do the unmount */
5180 ret = umount2(target, flags);
5181 if (ret < 0) {
5182 SYSERROR("Failed to umount \"%s\"", target);
5183 _exit(EXIT_FAILURE);
5184 }
5185
5186 _exit(EXIT_SUCCESS);
5187 }
5188
5189 ret = wait_for_pid(pid);
5190 if (ret < 0) {
5191 SYSERROR("Wait for the child with pid %ld failed", (long)pid);
5192 return -ret;
5193 }
5194
5195 return 0;
5196 }
5197
5198 WRAP_API_3(int, lxcapi_umount, const char *, unsigned long, struct lxc_mount*)
5199
5200 static int lxcapi_attach_run_waitl(struct lxc_container *c, lxc_attach_options_t *options, const char *program, const char *arg, ...)
5201 {
5202 va_list ap;
5203 const char **argv;
5204 int ret;
5205
5206 if (!c)
5207 return -1;
5208
5209 current_config = c->lxc_conf;
5210
5211 va_start(ap, arg);
5212 argv = lxc_va_arg_list_to_argv_const(ap, 1);
5213 va_end(ap);
5214
5215 if (!argv) {
5216 ERROR("Memory allocation error.");
5217 ret = -1;
5218 goto out;
5219 }
5220 argv[0] = arg;
5221
5222 ret = do_lxcapi_attach_run_wait(c, options, program, (const char * const *)argv);
5223 free((void*)argv);
5224
5225 out:
5226 current_config = NULL;
5227 return ret;
5228 }
5229
5230 static int do_lxcapi_seccomp_notify(struct lxc_container *c, unsigned int cmd, int fd)
5231 {
5232 #if HAVE_DECL_SECCOMP_NOTIF_GET_FD
5233 if (!c || !c->lxc_conf)
5234 return minus_one_set_errno(-EINVAL);
5235
5236 switch (cmd) {
5237 case LXC_SECCOMP_NOTIFY_GET_FD:
5238 if (fd)
5239 return minus_one_set_errno(EINVAL);
5240
5241 return c->lxc_conf->seccomp_notify_fd;
5242 }
5243
5244 return minus_one_set_errno(EINVAL);
5245 #else
5246 return minus_one_set_errno(ENOSYS);
5247 #endif
5248 }
5249
5250 WRAP_API_2(int, lxcapi_seccomp_notify, unsigned int, int)
5251
5252 struct lxc_container *lxc_container_new(const char *name, const char *configpath)
5253 {
5254 struct lxc_container *c;
5255 size_t len;
5256
5257 if (!name)
5258 return NULL;
5259
5260 c = malloc(sizeof(*c));
5261 if (!c) {
5262 fprintf(stderr, "Failed to allocate memory for %s\n", name);
5263 return NULL;
5264 }
5265 memset(c, 0, sizeof(*c));
5266
5267 if (configpath)
5268 c->config_path = strdup(configpath);
5269 else
5270 c->config_path = strdup(lxc_global_config_value("lxc.lxcpath"));
5271 if (!c->config_path) {
5272 fprintf(stderr, "Failed to allocate memory for %s\n", name);
5273 goto err;
5274 }
5275
5276 remove_trailing_slashes(c->config_path);
5277
5278 len = strlen(name);
5279 c->name = malloc(len + 1);
5280 if (!c->name) {
5281 fprintf(stderr, "Failed to allocate memory for %s\n", name);
5282 goto err;
5283 }
5284 (void)strlcpy(c->name, name, len + 1);
5285
5286 c->numthreads = 1;
5287 c->slock = lxc_newlock(c->config_path, name);
5288 if (!c->slock) {
5289 fprintf(stderr, "Failed to create lock for %s\n", name);
5290 goto err;
5291 }
5292
5293 c->privlock = lxc_newlock(NULL, NULL);
5294 if (!c->privlock) {
5295 fprintf(stderr, "Failed to create private lock for %s\n", name);
5296 goto err;
5297 }
5298
5299 if (!set_config_filename(c)) {
5300 fprintf(stderr, "Failed to create config file name for %s\n", name);
5301 goto err;
5302 }
5303
5304 if (file_exists(c->configfile) && !lxcapi_load_config(c, NULL)) {
5305 fprintf(stderr, "Failed to load config for %s\n", name);
5306 goto err;
5307 }
5308
5309 if (ongoing_create(c) == 2) {
5310 ERROR("Failed to complete container creation for %s", c->name);
5311 container_destroy(c, NULL);
5312 lxcapi_clear_config(c);
5313 }
5314
5315 c->daemonize = true;
5316 c->pidfile = NULL;
5317
5318 /* Assign the member functions. */
5319 c->is_defined = lxcapi_is_defined;
5320 c->state = lxcapi_state;
5321 c->is_running = lxcapi_is_running;
5322 c->freeze = lxcapi_freeze;
5323 c->unfreeze = lxcapi_unfreeze;
5324 c->console = lxcapi_console;
5325 c->console_getfd = lxcapi_console_getfd;
5326 c->init_pid = lxcapi_init_pid;
5327 c->load_config = lxcapi_load_config;
5328 c->want_daemonize = lxcapi_want_daemonize;
5329 c->want_close_all_fds = lxcapi_want_close_all_fds;
5330 c->start = lxcapi_start;
5331 c->startl = lxcapi_startl;
5332 c->stop = lxcapi_stop;
5333 c->config_file_name = lxcapi_config_file_name;
5334 c->wait = lxcapi_wait;
5335 c->set_config_item = lxcapi_set_config_item;
5336 c->destroy = lxcapi_destroy;
5337 c->destroy_with_snapshots = lxcapi_destroy_with_snapshots;
5338 c->rename = lxcapi_rename;
5339 c->save_config = lxcapi_save_config;
5340 c->get_keys = lxcapi_get_keys;
5341 c->create = lxcapi_create;
5342 c->createl = lxcapi_createl;
5343 c->shutdown = lxcapi_shutdown;
5344 c->reboot = lxcapi_reboot;
5345 c->reboot2 = lxcapi_reboot2;
5346 c->clear_config = lxcapi_clear_config;
5347 c->clear_config_item = lxcapi_clear_config_item;
5348 c->get_config_item = lxcapi_get_config_item;
5349 c->get_running_config_item = lxcapi_get_running_config_item;
5350 c->get_cgroup_item = lxcapi_get_cgroup_item;
5351 c->set_cgroup_item = lxcapi_set_cgroup_item;
5352 c->get_config_path = lxcapi_get_config_path;
5353 c->set_config_path = lxcapi_set_config_path;
5354 c->clone = lxcapi_clone;
5355 c->get_interfaces = lxcapi_get_interfaces;
5356 c->get_ips = lxcapi_get_ips;
5357 c->attach = lxcapi_attach;
5358 c->attach_run_wait = lxcapi_attach_run_wait;
5359 c->attach_run_waitl = lxcapi_attach_run_waitl;
5360 c->snapshot = lxcapi_snapshot;
5361 c->snapshot_list = lxcapi_snapshot_list;
5362 c->snapshot_restore = lxcapi_snapshot_restore;
5363 c->snapshot_destroy = lxcapi_snapshot_destroy;
5364 c->snapshot_destroy_all = lxcapi_snapshot_destroy_all;
5365 c->may_control = lxcapi_may_control;
5366 c->add_device_node = lxcapi_add_device_node;
5367 c->remove_device_node = lxcapi_remove_device_node;
5368 c->attach_interface = lxcapi_attach_interface;
5369 c->detach_interface = lxcapi_detach_interface;
5370 c->checkpoint = lxcapi_checkpoint;
5371 c->restore = lxcapi_restore;
5372 c->migrate = lxcapi_migrate;
5373 c->console_log = lxcapi_console_log;
5374 c->mount = lxcapi_mount;
5375 c->umount = lxcapi_umount;
5376 c->seccomp_notify = lxcapi_seccomp_notify;
5377
5378 return c;
5379
5380 err:
5381 lxc_container_free(c);
5382 return NULL;
5383 }
5384
5385 int lxc_get_wait_states(const char **states)
5386 {
5387 int i;
5388
5389 if (states)
5390 for (i=0; i<MAX_STATE; i++)
5391 states[i] = lxc_state2str(i);
5392
5393 return MAX_STATE;
5394 }
5395
5396 /*
5397 * These next two could probably be done smarter with reusing a common function
5398 * with different iterators and tests...
5399 */
5400 int list_defined_containers(const char *lxcpath, char ***names, struct lxc_container ***cret)
5401 {
5402 DIR *dir;
5403 int i, cfound = 0, nfound = 0;
5404 struct dirent *direntp;
5405 struct lxc_container *c;
5406
5407 if (!lxcpath)
5408 lxcpath = lxc_global_config_value("lxc.lxcpath");
5409
5410 dir = opendir(lxcpath);
5411 if (!dir) {
5412 SYSERROR("opendir on lxcpath");
5413 return -1;
5414 }
5415
5416 if (cret)
5417 *cret = NULL;
5418
5419 if (names)
5420 *names = NULL;
5421
5422 while ((direntp = readdir(dir))) {
5423 /* Ignore '.', '..' and any hidden directory. */
5424 if (!strncmp(direntp->d_name, ".", 1))
5425 continue;
5426
5427 if (!config_file_exists(lxcpath, direntp->d_name))
5428 continue;
5429
5430 if (names)
5431 if (!add_to_array(names, direntp->d_name, cfound))
5432 goto free_bad;
5433
5434 cfound++;
5435
5436 if (!cret) {
5437 nfound++;
5438 continue;
5439 }
5440
5441 c = lxc_container_new(direntp->d_name, lxcpath);
5442 if (!c) {
5443 INFO("Container %s:%s has a config but could not be loaded",
5444 lxcpath, direntp->d_name);
5445
5446 if (names)
5447 if(!remove_from_array(names, direntp->d_name, cfound--))
5448 goto free_bad;
5449
5450 continue;
5451 }
5452
5453 if (!do_lxcapi_is_defined(c)) {
5454 INFO("Container %s:%s has a config but is not defined",
5455 lxcpath, direntp->d_name);
5456
5457 if (names)
5458 if(!remove_from_array(names, direntp->d_name, cfound--))
5459 goto free_bad;
5460
5461 lxc_container_put(c);
5462 continue;
5463 }
5464
5465 if (!add_to_clist(cret, c, nfound, true)) {
5466 lxc_container_put(c);
5467 goto free_bad;
5468 }
5469
5470 nfound++;
5471 }
5472
5473 closedir(dir);
5474 return nfound;
5475
5476 free_bad:
5477 if (names && *names) {
5478 for (i=0; i<cfound; i++)
5479 free((*names)[i]);
5480 free(*names);
5481 }
5482
5483 if (cret && *cret) {
5484 for (i=0; i<nfound; i++)
5485 lxc_container_put((*cret)[i]);
5486 free(*cret);
5487 }
5488
5489 closedir(dir);
5490 return -1;
5491 }
5492
/*
 * List the active containers that belong to @lxcpath.
 *
 * @lxcpath : lxcpath to match; when NULL the global "lxc.lxcpath" value is
 *            used
 * @nret    : optional output; receives an array of container names
 * @cret    : optional output; receives an array of container objects
 *
 * Active containers are discovered by scanning /proc/net/unix for socket
 * names of the form "@<lxcpath>/<name>/command..." or
 * "@lxc/<hash>/command...". For the second form the lxcpath and name are
 * obtained through lxc_cmd_get_lxcpath() and lxc_cmd_get_name().
 *
 * Returns the number of containers found, or -1 on error. On error the
 * collected names and containers are released and *cret is reset to NULL;
 * *nret is only written on success.
 */
int list_active_containers(const char *lxcpath, char ***nret,
			   struct lxc_container ***cret)
{
	int i, ret = -1, cret_cnt = 0, ct_name_cnt = 0;
	int lxcpath_len;
	char *line = NULL;
	char **ct_name = NULL;
	size_t len = 0;
	struct lxc_container *c = NULL;
	bool is_hashed;
	FILE *f;

	if (!lxcpath)
		lxcpath = lxc_global_config_value("lxc.lxcpath");
	lxcpath_len = strlen(lxcpath);

	if (cret)
		*cret = NULL;

	if (nret)
		*nret = NULL;

	f = fopen("/proc/net/unix", "r");
	if (!f)
		return -1;

	while (getline(&line, &len, f) != -1) {
		/* The socket path is the last space-separated field. */
		char *p = strrchr(line, ' '), *p2;
		if (!p)
			continue;
		p++;

		/* Only names starting with '@' (0x40) are of interest. */
		if (*p != 0x40)
			continue;
		p++;

		is_hashed = false;

		if (strncmp(p, lxcpath, lxcpath_len) == 0) {
			p += lxcpath_len;
		} else if (strncmp(p, "lxc/", 4) == 0) {
			p += 4;
			is_hashed = true;
		} else {
			continue;
		}

		while (*p == '/')
			p++;

		/* Now p is the start of lxc_name. */
		p2 = strchr(p, '/');
		if (!p2 || strncmp(p2, "/command", 8) != 0)
			continue;
		*p2 = '\0';

		if (is_hashed) {
			char *recvpath = lxc_cmd_get_lxcpath(p);
			if (!recvpath)
				continue;

			if (strncmp(lxcpath, recvpath, lxcpath_len) != 0) {
				free(recvpath);
				continue;
			}
			free(recvpath);

			/* From here on p is heap-allocated and must be freed. */
			p = lxc_cmd_get_name(p);
			if (!p)
				continue;
		}

		if (array_contains(&ct_name, p, ct_name_cnt)) {
			if (is_hashed)
				free(p);
			continue;
		}

		if (!add_to_array(&ct_name, p, ct_name_cnt)) {
			if (is_hashed)
				free(p);
			goto free_cret_list;
		}

		ct_name_cnt++;

		if (!cret) {
			if (is_hashed)
				free(p);
			continue;
		}

		c = lxc_container_new(p, lxcpath);
		if (!c) {
			INFO("Container %s:%s is running but could not be loaded",
			     lxcpath, p);

			remove_from_array(&ct_name, p, ct_name_cnt--);
			if (is_hashed)
				free(p);

			continue;
		}

		if (is_hashed)
			free(p);

		/*
		 * If this is an anonymous container, then is_defined *can*
		 * return false. So we don't do that check. Count on the
		 * fact that the command socket exists.
		 */

		if (!add_to_clist(cret, c, cret_cnt, true)) {
			lxc_container_put(c);
			goto free_cret_list;
		}

		cret_cnt++;
	}

	/*
	 * Every container that reaches this point is already stored in *cret
	 * and is released by the loop under free_cret_list, so it must not be
	 * put a second time here.
	 */
	if (nret && cret && cret_cnt != ct_name_cnt)
		goto free_cret_list;

	ret = ct_name_cnt;
	if (nret)
		*nret = ct_name;
	else
		goto free_ct_name;

	goto out;

free_cret_list:
	if (cret && *cret) {
		for (i = 0; i < cret_cnt; i++)
			lxc_container_put((*cret)[i]);
		free(*cret);
		/* Do not hand a dangling pointer back to the caller. */
		*cret = NULL;
	}

free_ct_name:
	if (ct_name) {
		for (i = 0; i < ct_name_cnt; i++)
			free(ct_name[i]);
		free(ct_name);
	}

out:
	free(line);
	fclose(f);
	return ret;
}
5646
5647 int list_all_containers(const char *lxcpath, char ***nret,
5648 struct lxc_container ***cret)
5649 {
5650 int i, ret, active_cnt, ct_cnt, ct_list_cnt;
5651 char **active_name;
5652 char **ct_name;
5653 struct lxc_container **ct_list = NULL;
5654
5655 ct_cnt = list_defined_containers(lxcpath, &ct_name, NULL);
5656 if (ct_cnt < 0)
5657 return ct_cnt;
5658
5659 active_cnt = list_active_containers(lxcpath, &active_name, NULL);
5660 if (active_cnt < 0) {
5661 ret = active_cnt;
5662 goto free_ct_name;
5663 }
5664
5665 for (i = 0; i < active_cnt; i++) {
5666 if (!array_contains(&ct_name, active_name[i], ct_cnt)) {
5667 if (!add_to_array(&ct_name, active_name[i], ct_cnt)) {
5668 ret = -1;
5669 goto free_active_name;
5670 }
5671
5672 ct_cnt++;
5673 }
5674
5675 free(active_name[i]);
5676 active_name[i] = NULL;
5677 }
5678
5679 free(active_name);
5680 active_name = NULL;
5681 active_cnt = 0;
5682
5683 for (i = 0, ct_list_cnt = 0; i < ct_cnt && cret; i++) {
5684 struct lxc_container *c;
5685
5686 c = lxc_container_new(ct_name[i], lxcpath);
5687 if (!c) {
5688 WARN("Container %s:%s could not be loaded", lxcpath, ct_name[i]);
5689 remove_from_array(&ct_name, ct_name[i], ct_cnt--);
5690 continue;
5691 }
5692
5693 if (!add_to_clist(&ct_list, c, ct_list_cnt, false)) {
5694 lxc_container_put(c);
5695 ret = -1;
5696 goto free_ct_list;
5697 }
5698
5699 ct_list_cnt++;
5700 }
5701
5702 if (cret)
5703 *cret = ct_list;
5704
5705 if (nret) {
5706 *nret = ct_name;
5707 } else {
5708 ret = ct_cnt;
5709 goto free_ct_name;
5710 }
5711
5712 return ct_cnt;
5713
5714 free_ct_list:
5715 for (i = 0; i < ct_list_cnt; i++) {
5716 lxc_container_put(ct_list[i]);
5717 }
5718 free(ct_list);
5719
5720 free_active_name:
5721 for (i = 0; i < active_cnt; i++) {
5722 free(active_name[i]);
5723 }
5724 free(active_name);
5725
5726 free_ct_name:
5727 for (i = 0; i < ct_cnt; i++) {
5728 free(ct_name[i]);
5729 }
5730 free(ct_name);
5731 return ret;
5732 }
5733
/*
 * Tell whether the configuration key @key is supported.
 *
 * Returns true when lxc_get_config() yields a non-zero result for @key and
 * false otherwise.
 */
bool lxc_config_item_is_supported(const char *key)
{
	if (lxc_get_config(key))
		return true;

	return false;
}
5738
5739 bool lxc_has_api_extension(const char *extension)
5740 {
5741 /* The NULL API extension is always present. :) */
5742 if (!extension)
5743 return true;
5744
5745 for (size_t i = 0; i < nr_api_extensions; i++)
5746 if (strcmp(api_extensions[i], extension) == 0)
5747 return true;
5748
5749 return false;
5750 }