]> git.proxmox.com Git - mirror_lxc.git/blob - src/lxc/lxccontainer.c
utils: move useful helper functions from lxccontainer to utils.
[mirror_lxc.git] / src / lxc / lxccontainer.c
1 /* liblxcapi
2 *
3 * Copyright © 2012 Serge Hallyn <serge.hallyn@ubuntu.com>.
4 * Copyright © 2012 Canonical Ltd.
5 *
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
10
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 */
20
21 #define _GNU_SOURCE
22 #include <assert.h>
23 #include <stdarg.h>
24 #include <pthread.h>
25 #include <unistd.h>
26 #include <sys/types.h>
27 #include <sys/wait.h>
28 #include <sys/mount.h>
29 #include <errno.h>
30 #include <fcntl.h>
31 #include <sched.h>
32 #include <dirent.h>
33 #include <sched.h>
34 #include <arpa/inet.h>
35 #include <libgen.h>
36 #include <stdint.h>
37 #include <grp.h>
38 #include <sys/syscall.h>
39
40 #include <lxc/lxccontainer.h>
41 #include <lxc/version.h>
42
43 #include "config.h"
44 #include "lxc.h"
45 #include "state.h"
46 #include "conf.h"
47 #include "confile.h"
48 #include "console.h"
49 #include "cgroup.h"
50 #include "commands.h"
51 #include "log.h"
52 #include "bdev.h"
53 #include "utils.h"
54 #include "attach.h"
55 #include "monitor.h"
56 #include "namespace.h"
57 #include "lxclock.h"
58 #include "sync.h"
59
60 #if HAVE_IFADDRS_H
61 #include <ifaddrs.h>
62 #else
63 #include <../include/ifaddrs.h>
64 #endif
65
66 #define MAX_BUFFER 4096
67
68 #define NOT_SUPPORTED_ERROR "the requested function %s is not currently supported with unprivileged containers"
69
70 /* Define faccessat() if missing from the C library */
#ifndef HAVE_FACCESSAT
/*
 * Stand-in for faccessat() when the C library does not provide it.
 * Forwards the four arguments to the raw system call when __NR_faccessat
 * is defined; otherwise sets errno to ENOSYS and returns -1.
 */
static int faccessat(int dirfd, const char *pathname, int mode, int flags)
{
#ifdef __NR_faccessat
	return syscall(__NR_faccessat, dirfd, pathname, mode, flags);
#else
	errno = ENOSYS;
	return -1;
#endif
}
#endif
82
83
84 lxc_log_define(lxc_container, lxc);
85
/*
 * Report whether "<lxcpath>/<cname>/config" exists according to
 * file_exists(). Returns false when the path cannot be formatted.
 */
static bool config_file_exists(const char *lxcpath, const char *cname)
{
	/* strlen("/") + strlen("/config") + terminating NUL == 9 */
	int bufsz = strlen(lxcpath) + strlen(cname) + 9;
	char *cfgpath = alloca(bufsz);
	int written;

	written = snprintf(cfgpath, bufsz, "%s/%s/config", lxcpath, cname);
	if (written >= 0 && written < bufsz)
		return file_exists(cfgpath);

	return false;
}
98
99 /*
100 * A few functions to help detect when a container creation failed.
101 * If a container creation was killed partway through, then trying
102 * to actually start that container could harm the host. We detect
103 * this by creating a 'partial' file under the container directory,
104 * and keeping an advisory lock. When container creation completes,
105 * we remove that file. When we load or try to start a container, if
106 * we find that file, without a flock, we remove the container.
107 */
108 static int ongoing_create(struct lxc_container *c)
109 {
110 int len = strlen(c->config_path) + strlen(c->name) + 10;
111 char *path = alloca(len);
112 int fd, ret;
113 struct flock lk;
114
115 ret = snprintf(path, len, "%s/%s/partial", c->config_path, c->name);
116 if (ret < 0 || ret >= len) {
117 ERROR("Error writing partial pathname");
118 return -1;
119 }
120
121 if (!file_exists(path))
122 return 0;
123 fd = open(path, O_RDWR);
124 if (fd < 0) {
125 // give benefit of the doubt
126 SYSERROR("Error opening partial file");
127 return 0;
128 }
129 lk.l_type = F_WRLCK;
130 lk.l_whence = SEEK_SET;
131 lk.l_start = 0;
132 lk.l_len = 0;
133 lk.l_pid = -1;
134 if (fcntl(fd, F_GETLK, &lk) == 0 && lk.l_pid != -1) {
135 // create is still ongoing
136 close(fd);
137 return 1;
138 }
139 // create completed but partial is still there.
140 close(fd);
141 return 2;
142 }
143
144 static int create_partial(struct lxc_container *c)
145 {
146 // $lxcpath + '/' + $name + '/partial' + \0
147 int len = strlen(c->config_path) + strlen(c->name) + 10;
148 char *path = alloca(len);
149 int fd, ret;
150 struct flock lk;
151
152 ret = snprintf(path, len, "%s/%s/partial", c->config_path, c->name);
153 if (ret < 0 || ret >= len) {
154 ERROR("Error writing partial pathname");
155 return -1;
156 }
157 if ((fd=open(path, O_RDWR | O_CREAT | O_EXCL, 0755)) < 0) {
158 SYSERROR("Erorr creating partial file");
159 return -1;
160 }
161 lk.l_type = F_WRLCK;
162 lk.l_whence = SEEK_SET;
163 lk.l_start = 0;
164 lk.l_len = 0;
165 if (fcntl(fd, F_SETLKW, &lk) < 0) {
166 SYSERROR("Error locking partial file %s", path);
167 close(fd);
168 return -1;
169 }
170
171 return fd;
172 }
173
174 static void remove_partial(struct lxc_container *c, int fd)
175 {
176 // $lxcpath + '/' + $name + '/partial' + \0
177 int len = strlen(c->config_path) + strlen(c->name) + 10;
178 char *path = alloca(len);
179 int ret;
180
181 close(fd);
182 ret = snprintf(path, len, "%s/%s/partial", c->config_path, c->name);
183 if (ret < 0 || ret >= len) {
184 ERROR("Error writing partial pathname");
185 return;
186 }
187 if (unlink(path) < 0)
188 SYSERROR("Error unlink partial file %s", path);
189 }
190
191 /* LOCKING
192 * 1. container_mem_lock(c) protects the struct lxc_container from multiple threads.
193 * 2. container_disk_lock(c) protects the on-disk container data - in particular the
194 * container configuration file.
195 * The container_disk_lock also takes the container_mem_lock.
196 * 3. thread_mutex protects process data (ex: fd table) from multiple threads.
197 * NOTHING mutexes two independent programs with their own struct
198 * lxc_container for the same c->name, between API calls. For instance,
199 * c->config_read(); c->start(); Between those calls, data on disk
200 * could change (which shouldn't bother the caller unless for instance
201 * the rootfs get moved). c->config_read(); update; c->config_write();
202 * Two such updaters could race. The callers should therefore check their
203 * results. Trying to prevent that would necessarily expose us to deadlocks
204 * due to hung callers. So I prefer to keep the locks only within our own
205 * functions, not across functions.
206 *
207 * If you're going to clone while holding a lxccontainer, increment
208 * c->numthreads (under privlock) before forking. When deleting,
209 * decrement numthreads under privlock, then if it hits 0 you can delete.
210 * Do not ever use a lxccontainer whose numthreads you did not bump.
211 */
212
213 static void lxc_container_free(struct lxc_container *c)
214 {
215 if (!c)
216 return;
217
218 if (c->configfile) {
219 free(c->configfile);
220 c->configfile = NULL;
221 }
222 if (c->error_string) {
223 free(c->error_string);
224 c->error_string = NULL;
225 }
226 if (c->slock) {
227 lxc_putlock(c->slock);
228 c->slock = NULL;
229 }
230 if (c->privlock) {
231 lxc_putlock(c->privlock);
232 c->privlock = NULL;
233 }
234 if (c->name) {
235 free(c->name);
236 c->name = NULL;
237 }
238 if (c->lxc_conf) {
239 lxc_conf_free(c->lxc_conf);
240 c->lxc_conf = NULL;
241 }
242 if (c->config_path) {
243 free(c->config_path);
244 c->config_path = NULL;
245 }
246
247 free(c);
248 }
249
250 /*
251 * Consider the following case:
252 freer | racing get()er
253 ==================================================================
254 lxc_container_put() | lxc_container_get()
255 \ lxclock(c->privlock) | c->numthreads < 1? (no)
256 \ c->numthreads = 0 | \ lxclock(c->privlock) -> waits
257 \ lxcunlock() | \
258 \ lxc_container_free() | \ lxclock() returns
259 | \ c->numthreads < 1 -> return 0
260 \ \ (free stuff) |
261 \ \ sem_destroy(privlock) |
262
263 * When the get()er checks numthreads the first time, one of the following
264 * is true:
265 * 1. freer has set numthreads = 0. get() returns 0
266 * 2. freer is between lxclock and setting numthreads to 0. get()er will
267 * sem_wait on privlock, get lxclock after freer() drops it, then see
268 * numthreads is 0 and exit without touching lxclock again..
269 * 3. freer has not yet locked privlock. If get()er runs first, then put()er
270 * will see --numthreads = 1 and not call lxc_container_free().
271 */
272
273 int lxc_container_get(struct lxc_container *c)
274 {
275 if (!c)
276 return 0;
277
278 // if someone else has already started freeing the container, don't
279 // try to take the lock, which may be invalid
280 if (c->numthreads < 1)
281 return 0;
282
283 if (container_mem_lock(c))
284 return 0;
285 if (c->numthreads < 1) {
286 // bail without trying to unlock, bc the privlock is now probably
287 // in freed memory
288 return 0;
289 }
290 c->numthreads++;
291 container_mem_unlock(c);
292 return 1;
293 }
294
295 int lxc_container_put(struct lxc_container *c)
296 {
297 if (!c)
298 return -1;
299 if (container_mem_lock(c))
300 return -1;
301 if (--c->numthreads < 1) {
302 container_mem_unlock(c);
303 lxc_container_free(c);
304 return 1;
305 }
306 container_mem_unlock(c);
307 return 0;
308 }
309
310 static bool lxcapi_is_defined(struct lxc_container *c)
311 {
312 struct stat statbuf;
313 bool ret = false;
314 int statret;
315
316 if (!c)
317 return false;
318
319 if (container_mem_lock(c))
320 return false;
321 if (!c->configfile)
322 goto out;
323 statret = stat(c->configfile, &statbuf);
324 if (statret != 0)
325 goto out;
326 ret = true;
327
328 out:
329 container_mem_unlock(c);
330 return ret;
331 }
332
333 static const char *lxcapi_state(struct lxc_container *c)
334 {
335 lxc_state_t s;
336
337 if (!c)
338 return NULL;
339 s = lxc_getstate(c->name, c->config_path);
340 return lxc_state2str(s);
341 }
342
343 static bool is_stopped(struct lxc_container *c)
344 {
345 lxc_state_t s;
346 s = lxc_getstate(c->name, c->config_path);
347 return (s == STOPPED);
348 }
349
/*
 * A container is treated as running whenever its state string is available
 * and is anything other than "STOPPED".
 */
static bool lxcapi_is_running(struct lxc_container *c)
{
	const char *state;

	if (!c)
		return false;

	state = lxcapi_state(c);
	if (!state)
		return false;

	return strcmp(state, "STOPPED") != 0;
}
361
362 static bool lxcapi_freeze(struct lxc_container *c)
363 {
364 int ret;
365 if (!c)
366 return false;
367
368 ret = lxc_freeze(c->name, c->config_path);
369 if (ret)
370 return false;
371 return true;
372 }
373
374 static bool lxcapi_unfreeze(struct lxc_container *c)
375 {
376 int ret;
377 if (!c)
378 return false;
379
380 ret = lxc_unfreeze(c->name, c->config_path);
381 if (ret)
382 return false;
383 return true;
384 }
385
/*
 * Forward to lxc_console_getfd() and return its result, or -1 when @c
 * is NULL.
 */
static int lxcapi_console_getfd(struct lxc_container *c, int *ttynum, int *masterfd)
{
	return c ? lxc_console_getfd(c, ttynum, masterfd) : -1;
}
395
/*
 * Forward to lxc_console() with the given tty number, stdio descriptors
 * and escape character, returning its result.
 * Returns -1 when @c is NULL, matching the other lxcapi_* wrappers.
 */
static int lxcapi_console(struct lxc_container *c, int ttynum, int stdinfd,
			  int stdoutfd, int stderrfd, int escape)
{
	if (!c)
		return -1;

	return lxc_console(c, ttynum, stdinfd, stdoutfd, stderrfd, escape);
}
401
402 static pid_t lxcapi_init_pid(struct lxc_container *c)
403 {
404 if (!c)
405 return -1;
406
407 return lxc_cmd_get_init_pid(c->name, c->config_path);
408 }
409
410 static bool load_config_locked(struct lxc_container *c, const char *fname)
411 {
412 if (!c->lxc_conf)
413 c->lxc_conf = lxc_conf_init();
414 if (!c->lxc_conf)
415 return false;
416 if (lxc_config_read(fname, c->lxc_conf, false) != 0)
417 return false;
418 return true;
419 }
420
421 static bool lxcapi_load_config(struct lxc_container *c, const char *alt_file)
422 {
423 bool ret = false, need_disklock = false;
424 int lret;
425 const char *fname;
426 if (!c)
427 return false;
428
429 fname = c->configfile;
430 if (alt_file)
431 fname = alt_file;
432 if (!fname)
433 return false;
434 /*
435 * If we're reading something other than the container's config,
436 * we only need to lock the in-memory container. If loading the
437 * container's config file, take the disk lock.
438 */
439 if (strcmp(fname, c->configfile) == 0)
440 need_disklock = true;
441
442 if (need_disklock)
443 lret = container_disk_lock(c);
444 else
445 lret = container_mem_lock(c);
446 if (lret)
447 return false;
448
449 ret = load_config_locked(c, fname);
450
451 if (need_disklock)
452 container_disk_unlock(c);
453 else
454 container_mem_unlock(c);
455 return ret;
456 }
457
458 static bool lxcapi_want_daemonize(struct lxc_container *c, bool state)
459 {
460 if (!c || !c->lxc_conf)
461 return false;
462 if (container_mem_lock(c)) {
463 ERROR("Error getting mem lock");
464 return false;
465 }
466 c->daemonize = state;
467 /* daemonize implies close_all_fds so set it */
468 if (state == 1)
469 c->lxc_conf->close_all_fds = 1;
470 container_mem_unlock(c);
471 return true;
472 }
473
474 static bool lxcapi_want_close_all_fds(struct lxc_container *c, bool state)
475 {
476 if (!c || !c->lxc_conf)
477 return false;
478 if (container_mem_lock(c)) {
479 ERROR("Error getting mem lock");
480 return false;
481 }
482 c->lxc_conf->close_all_fds = state;
483 container_mem_unlock(c);
484 return true;
485 }
486
487 static bool lxcapi_wait(struct lxc_container *c, const char *state, int timeout)
488 {
489 int ret;
490
491 if (!c)
492 return false;
493
494 ret = lxc_wait(c->name, state, timeout, c->config_path);
495 return ret == 0;
496 }
497
498
/*
 * Parent side of a daemonized start: reap the first forked child @pid,
 * then wait for the container to report RUNNING.
 * A failed or unclean reap is only logged; the result comes from
 * lxcapi_wait().
 */
static bool wait_on_daemonized_start(struct lxc_container *c, int pid)
{
	/* we'll probably want to make this timeout configurable? */
	const int timeout = 5;
	int status, reaped;
	bool clean_exit;

	/*
	 * our child is going to fork again, then exit. reap the
	 * child
	 */
	reaped = waitpid(pid, &status, 0);
	clean_exit = reaped != -1 && WIFEXITED(status) &&
		     WEXITSTATUS(status) == 0;
	if (!clean_exit)
		DEBUG("failed waiting for first dual-fork child");

	return lxcapi_wait(c, "RUNNING", timeout);
}
513
/*
 * Decide whether the calling process has exactly one thread by counting
 * the entries of /proc/self/task (ignoring "." and "..").
 * Returns false when the directory cannot be opened.
 */
static bool am_single_threaded(void)
{
	struct dirent *entry;
	DIR *dir;
	int count = 0;

	dir = opendir("/proc/self/task");
	if (!dir) {
		INFO("failed to open /proc/self/task");
		return false;
	}

	/*
	 * readdir() replaces the deprecated readdir_r(): the stream is private
	 * to this call, and no caller-supplied struct dirent can be too small
	 * for the entry name.
	 */
	while ((entry = readdir(dir)) != NULL) {
		if (!strcmp(entry->d_name, ".") || !strcmp(entry->d_name, ".."))
			continue;

		/* two entries are enough to know the answer */
		if (++count > 1)
			break;
	}
	closedir(dir);
	return count == 1;
}
541
542 /*
543 * I can't decide if it'd be more convenient for callers if we accept '...',
544 * or a null-terminated array (i.e. execl vs execv)
545 */
546 static bool lxcapi_start(struct lxc_container *c, int useinit, char * const argv[])
547 {
548 int ret;
549 struct lxc_conf *conf;
550 bool daemonize = false;
551 FILE *pid_fp = NULL;
552 char *default_args[] = {
553 "/sbin/init",
554 NULL,
555 };
556
557 /* container exists */
558 if (!c)
559 return false;
560 /* container has been setup */
561 if (!c->lxc_conf)
562 return false;
563
564 if ((ret = ongoing_create(c)) < 0) {
565 ERROR("Error checking for incomplete creation");
566 return false;
567 }
568 if (ret == 2) {
569 ERROR("Error: %s creation was not completed", c->name);
570 c->destroy(c);
571 return false;
572 } else if (ret == 1) {
573 ERROR("Error: creation of %s is ongoing", c->name);
574 return false;
575 }
576
577 /* is this app meant to be run through lxcinit, as in lxc-execute? */
578 if (useinit && !argv)
579 return false;
580
581 if (container_mem_lock(c))
582 return false;
583 conf = c->lxc_conf;
584 daemonize = c->daemonize;
585 container_mem_unlock(c);
586
587 if (useinit) {
588 ret = lxc_execute(c->name, argv, 1, conf, c->config_path);
589 return ret == 0 ? true : false;
590 }
591
592 if (!argv)
593 argv = default_args;
594
595 /*
596 * say, I'm not sure - what locks do we want here? Any?
597 * Is liblxc's locking enough here to protect the on disk
598 * container? We don't want to exclude things like lxc_info
599 * while container is running...
600 */
601 if (daemonize) {
602 lxc_monitord_spawn(c->config_path);
603
604 pid_t pid = fork();
605 if (pid < 0)
606 return false;
607
608 if (pid != 0) {
609 /* Set to NULL because we don't want father unlink
610 * the PID file, child will do the free and unlink.
611 */
612 c->pidfile = NULL;
613 return wait_on_daemonized_start(c, pid);
614 }
615
616 /* second fork to be reparented by init */
617 pid = fork();
618 if (pid < 0) {
619 SYSERROR("Error doing dual-fork");
620 return false;
621 }
622 if (pid != 0)
623 exit(0);
624 /* like daemon(), chdir to / and redirect 0,1,2 to /dev/null */
625 if (chdir("/")) {
626 SYSERROR("Error chdir()ing to /.");
627 return false;
628 }
629 lxc_check_inherited(conf, -1);
630 close(0);
631 close(1);
632 close(2);
633 open("/dev/zero", O_RDONLY);
634 open("/dev/null", O_RDWR);
635 open("/dev/null", O_RDWR);
636 setsid();
637 } else {
638 if (!am_single_threaded()) {
639 ERROR("Cannot start non-daemonized container when threaded");
640 return false;
641 }
642 }
643
644 /* We need to write PID file after daeminize, so we always
645 * write the right PID.
646 */
647 if (c->pidfile) {
648 pid_fp = fopen(c->pidfile, "w");
649 if (pid_fp == NULL) {
650 SYSERROR("Failed to create pidfile '%s' for '%s'",
651 c->pidfile, c->name);
652 return false;
653 }
654
655 if (fprintf(pid_fp, "%d\n", getpid()) < 0) {
656 SYSERROR("Failed to write '%s'", c->pidfile);
657 fclose(pid_fp);
658 pid_fp = NULL;
659 return false;
660 }
661
662 fclose(pid_fp);
663 pid_fp = NULL;
664 }
665
666 reboot:
667 conf->reboot = 0;
668 ret = lxc_start(c->name, argv, conf, c->config_path);
669 c->error_num = ret;
670
671 if (conf->reboot) {
672 INFO("container requested reboot");
673 conf->reboot = 0;
674 goto reboot;
675 }
676
677 if (c->pidfile) {
678 unlink(c->pidfile);
679 free(c->pidfile);
680 c->pidfile = NULL;
681 }
682
683 if (daemonize)
684 exit (ret == 0 ? true : false);
685 else
686 return (ret == 0 ? true : false);
687 }
688
/*
 * Variadic front end to lxcapi_start(): the arguments after @useinit are
 * collected into an argv array by lxc_va_arg_list_to_argv().
 *
 * note there MUST be an ending NULL
 */
static bool lxcapi_startl(struct lxc_container *c, int useinit, ...)
{
	va_list ap;
	char **args, **it;
	bool started;

	/* container exists */
	if (!c)
		return false;

	va_start(ap, useinit);
	args = lxc_va_arg_list_to_argv(ap, 0, 1);
	va_end(ap);

	if (!args) {
		ERROR("Memory allocation error.");
		return false;
	}

	/* pass NULL if no arguments were supplied */
	started = lxcapi_start(c, useinit, args[0] ? args : NULL);

	/* both the elements and the array itself are released here */
	for (it = args; *it; it++)
		free(*it);
	free(args);

	return started;
}
724
725 static bool lxcapi_stop(struct lxc_container *c)
726 {
727 int ret;
728
729 if (!c)
730 return false;
731
732 ret = lxc_cmd_stop(c->name, c->config_path);
733
734 return ret == 0;
735 }
736
737 static int do_create_container_dir(const char *path, struct lxc_conf *conf)
738 {
739 int ret = -1, lasterr;
740 char *p = alloca(strlen(path)+1);
741 mode_t mask = umask(0002);
742 ret = mkdir(path, 0770);
743 lasterr = errno;
744 umask(mask);
745 errno = lasterr;
746 if (ret) {
747 if (errno == EEXIST)
748 ret = 0;
749 else {
750 SYSERROR("failed to create container path %s", path);
751 return -1;
752 }
753 }
754 strcpy(p, path);
755 if (!lxc_list_empty(&conf->id_map) && chown_mapped_root(p, conf) != 0) {
756 ERROR("Failed to chown container dir");
757 ret = -1;
758 }
759 return ret;
760 }
761
762 /*
763 * create the standard expected container dir
764 */
765 static bool create_container_dir(struct lxc_container *c)
766 {
767 char *s;
768 int len, ret;
769
770 len = strlen(c->config_path) + strlen(c->name) + 2;
771 s = malloc(len);
772 if (!s)
773 return false;
774 ret = snprintf(s, len, "%s/%s", c->config_path, c->name);
775 if (ret < 0 || ret >= len) {
776 free(s);
777 return false;
778 }
779 ret = do_create_container_dir(s, c->lxc_conf);
780 free(s);
781 return ret == 0;
782 }
783
784 static const char *lxcapi_get_config_path(struct lxc_container *c);
785 static bool lxcapi_set_config_item(struct lxc_container *c, const char *key, const char *v);
786
787 /*
788 * do_bdev_create: thin wrapper around bdev_create(). Like bdev_create(),
789 * it returns a mounted bdev on success, NULL on error.
790 */
791 static struct bdev *do_bdev_create(struct lxc_container *c, const char *type,
792 struct bdev_specs *specs)
793 {
794 char *dest;
795 size_t len;
796 struct bdev *bdev;
797 int ret;
798
799 /* rootfs.path or lxcpath/lxcname/rootfs */
800 if (c->lxc_conf->rootfs.path && access(c->lxc_conf->rootfs.path, F_OK) == 0) {
801 const char *rpath = c->lxc_conf->rootfs.path;
802 len = strlen(rpath) + 1;
803 dest = alloca(len);
804 ret = snprintf(dest, len, "%s", rpath);
805 } else {
806 const char *lxcpath = lxcapi_get_config_path(c);
807 len = strlen(c->name) + strlen(lxcpath) + 9;
808 dest = alloca(len);
809 ret = snprintf(dest, len, "%s/%s/rootfs", lxcpath, c->name);
810 }
811 if (ret < 0 || ret >= len)
812 return NULL;
813
814 bdev = bdev_create(dest, type, c->name, specs);
815 if (!bdev) {
816 ERROR("Failed to create backing store type %s", type);
817 return NULL;
818 }
819
820 lxcapi_set_config_item(c, "lxc.rootfs", bdev->src);
821
822 /* if we are not root, chown the rootfs dir to root in the
823 * target uidmap */
824
825 if (geteuid() != 0 || (c->lxc_conf && !lxc_list_empty(&c->lxc_conf->id_map))) {
826 if (chown_mapped_root(bdev->dest, c->lxc_conf) < 0) {
827 ERROR("Error chowning %s to container root", bdev->dest);
828 suggest_default_idmap();
829 bdev_put(bdev);
830 return NULL;
831 }
832 }
833
834 return bdev;
835 }
836
837 /*
838 * Given the '-t' template option to lxc-create, figure out what to
839 * do. If the template is a full executable path, use that. If it
840 * is something like 'sshd', then return $templatepath/lxc-sshd.
841 * On success return the template, on error return NULL.
842 */
843 static char *get_template_path(const char *t)
844 {
845 int ret, len;
846 char *tpath;
847
848 if (t[0] == '/' && access(t, X_OK) == 0) {
849 tpath = strdup(t);
850 return tpath;
851 }
852
853 len = strlen(LXCTEMPLATEDIR) + strlen(t) + strlen("/lxc-") + 1;
854 tpath = malloc(len);
855 if (!tpath)
856 return NULL;
857 ret = snprintf(tpath, len, "%s/lxc-%s", LXCTEMPLATEDIR, t);
858 if (ret < 0 || ret >= len) {
859 free(tpath);
860 return NULL;
861 }
862 if (access(tpath, X_OK) < 0) {
863 SYSERROR("bad template: %s", t);
864 free(tpath);
865 return NULL;
866 }
867
868 return tpath;
869 }
870
/*
 * Return a pointer into @path at its last '/' (the slash itself is part of
 * the result), or @path itself when it contains no '/'.
 * An empty string is returned unchanged; scanning it would otherwise start
 * one byte before the buffer.
 */
static char *lxcbasename(char *path)
{
	char *p;

	if (*path == '\0')
		return path;

	p = path + strlen(path) - 1;
	while (p > path && *p != '/')
		p--;
	return p;
}
878
879 static bool create_run_template(struct lxc_container *c, char *tpath, bool quiet,
880 char *const argv[])
881 {
882 pid_t pid;
883
884 if (!tpath)
885 return true;
886
887 pid = fork();
888 if (pid < 0) {
889 SYSERROR("failed to fork task for container creation template");
890 return false;
891 }
892
893 if (pid == 0) { // child
894 char *patharg, *namearg, *rootfsarg, *src;
895 struct bdev *bdev = NULL;
896 int i;
897 int ret, len, nargs = 0;
898 char **newargv;
899 struct lxc_conf *conf = c->lxc_conf;
900
901 if (quiet) {
902 close(0);
903 close(1);
904 close(2);
905 open("/dev/zero", O_RDONLY);
906 open("/dev/null", O_RDWR);
907 open("/dev/null", O_RDWR);
908 }
909
910 src = c->lxc_conf->rootfs.path;
911 /*
912 * for an overlay create, what the user wants is the template to fill
913 * in what will become the readonly lower layer. So don't mount for
914 * the template
915 */
916 if (strncmp(src, "overlayfs:", 10) == 0)
917 src = overlay_getlower(src+10);
918 if (strncmp(src, "aufs:", 5) == 0)
919 src = overlay_getlower(src+5);
920
921 bdev = bdev_init(c->lxc_conf, src, c->lxc_conf->rootfs.mount, NULL);
922 if (!bdev) {
923 ERROR("Error opening rootfs");
924 exit(1);
925 }
926
927 if (geteuid() == 0) {
928 if (unshare(CLONE_NEWNS) < 0) {
929 ERROR("error unsharing mounts");
930 exit(1);
931 }
932 if (detect_shared_rootfs()) {
933 if (mount(NULL, "/", NULL, MS_SLAVE|MS_REC, NULL)) {
934 SYSERROR("Failed to make / rslave to run template");
935 ERROR("Continuing...");
936 }
937 }
938 }
939 if (strcmp(bdev->type, "dir") && strcmp(bdev->type, "btrfs")) {
940 if (geteuid() != 0) {
941 ERROR("non-root users can only create btrfs and directory-backed containers");
942 exit(1);
943 }
944 if (bdev->ops->mount(bdev) < 0) {
945 ERROR("Error mounting rootfs");
946 exit(1);
947 }
948 } else { // TODO come up with a better way here!
949 if (bdev->dest)
950 free(bdev->dest);
951 bdev->dest = strdup(bdev->src);
952 }
953
954 /*
955 * create our new array, pre-pend the template name and
956 * base args
957 */
958 if (argv)
959 for (nargs = 0; argv[nargs]; nargs++) ;
960 nargs += 4; // template, path, rootfs and name args
961
962 newargv = malloc(nargs * sizeof(*newargv));
963 if (!newargv)
964 exit(1);
965 newargv[0] = lxcbasename(tpath);
966
967 len = strlen(c->config_path) + strlen(c->name) + strlen("--path=") + 2;
968 patharg = malloc(len);
969 if (!patharg)
970 exit(1);
971 ret = snprintf(patharg, len, "--path=%s/%s", c->config_path, c->name);
972 if (ret < 0 || ret >= len)
973 exit(1);
974 newargv[1] = patharg;
975 len = strlen("--name=") + strlen(c->name) + 1;
976 namearg = malloc(len);
977 if (!namearg)
978 exit(1);
979 ret = snprintf(namearg, len, "--name=%s", c->name);
980 if (ret < 0 || ret >= len)
981 exit(1);
982 newargv[2] = namearg;
983
984 len = strlen("--rootfs=") + 1 + strlen(bdev->dest);
985 rootfsarg = malloc(len);
986 if (!rootfsarg)
987 exit(1);
988 ret = snprintf(rootfsarg, len, "--rootfs=%s", bdev->dest);
989 if (ret < 0 || ret >= len)
990 exit(1);
991 newargv[3] = rootfsarg;
992
993 /* add passed-in args */
994 if (argv)
995 for (i = 4; i < nargs; i++)
996 newargv[i] = argv[i-4];
997
998 /* add trailing NULL */
999 nargs++;
1000 newargv = realloc(newargv, nargs * sizeof(*newargv));
1001 if (!newargv)
1002 exit(1);
1003 newargv[nargs - 1] = NULL;
1004
1005 /*
1006 * If we're running the template in a mapped userns, then
1007 * we prepend the template command with:
1008 * lxc-usernsexec <-m map1> ... <-m mapn> --
1009 * and we append "--mapped-uid x", where x is the mapped uid
1010 * for our geteuid()
1011 */
1012 if (!lxc_list_empty(&conf->id_map)) {
1013 int n2args = 1;
1014 char txtuid[20];
1015 char txtgid[20];
1016 char **n2 = malloc(n2args * sizeof(*n2));
1017 struct lxc_list *it;
1018 struct id_map *map;
1019
1020 if (!n2) {
1021 SYSERROR("out of memory");
1022 exit(1);
1023 }
1024 newargv[0] = tpath;
1025 tpath = "lxc-usernsexec";
1026 n2[0] = "lxc-usernsexec";
1027 lxc_list_for_each(it, &conf->id_map) {
1028 map = it->elem;
1029 n2args += 2;
1030 n2 = realloc(n2, n2args * sizeof(char *));
1031 if (!n2)
1032 exit(1);
1033 n2[n2args-2] = "-m";
1034 n2[n2args-1] = malloc(200);
1035 if (!n2[n2args-1])
1036 exit(1);
1037 ret = snprintf(n2[n2args-1], 200, "%c:%lu:%lu:%lu",
1038 map->idtype == ID_TYPE_UID ? 'u' : 'g',
1039 map->nsid, map->hostid, map->range);
1040 if (ret < 0 || ret >= 200)
1041 exit(1);
1042 }
1043 int hostid_mapped = mapped_hostid(geteuid(), conf, ID_TYPE_UID);
1044 int extraargs = hostid_mapped >= 0 ? 1 : 3;
1045 n2 = realloc(n2, (nargs + n2args + extraargs) * sizeof(char *));
1046 if (!n2)
1047 exit(1);
1048 if (hostid_mapped < 0) {
1049 hostid_mapped = find_unmapped_nsuid(conf, ID_TYPE_UID);
1050 n2[n2args++] = "-m";
1051 if (hostid_mapped < 0) {
1052 ERROR("Could not find free uid to map");
1053 exit(1);
1054 }
1055 n2[n2args++] = malloc(200);
1056 if (!n2[n2args-1]) {
1057 SYSERROR("out of memory");
1058 exit(1);
1059 }
1060 ret = snprintf(n2[n2args-1], 200, "u:%d:%d:1",
1061 hostid_mapped, geteuid());
1062 if (ret < 0 || ret >= 200) {
1063 ERROR("string too long");
1064 exit(1);
1065 }
1066 }
1067 int hostgid_mapped = mapped_hostid(getegid(), conf, ID_TYPE_GID);
1068 extraargs = hostgid_mapped >= 0 ? 1 : 3;
1069 n2 = realloc(n2, (nargs + n2args + extraargs) * sizeof(char *));
1070 if (!n2)
1071 exit(1);
1072 if (hostgid_mapped < 0) {
1073 hostgid_mapped = find_unmapped_nsuid(conf, ID_TYPE_GID);
1074 n2[n2args++] = "-m";
1075 if (hostgid_mapped < 0) {
1076 ERROR("Could not find free uid to map");
1077 exit(1);
1078 }
1079 n2[n2args++] = malloc(200);
1080 if (!n2[n2args-1]) {
1081 SYSERROR("out of memory");
1082 exit(1);
1083 }
1084 ret = snprintf(n2[n2args-1], 200, "g:%d:%d:1",
1085 hostgid_mapped, getegid());
1086 if (ret < 0 || ret >= 200) {
1087 ERROR("string too long");
1088 exit(1);
1089 }
1090 }
1091 n2[n2args++] = "--";
1092 for (i = 0; i < nargs; i++)
1093 n2[i + n2args] = newargv[i];
1094 n2args += nargs;
1095 // Finally add "--mapped-uid $uid" to tell template what to chown
1096 // cached images to
1097 n2args += 4;
1098 n2 = realloc(n2, n2args * sizeof(char *));
1099 if (!n2) {
1100 SYSERROR("out of memory");
1101 exit(1);
1102 }
1103 // note n2[n2args-1] is NULL
1104 n2[n2args-5] = "--mapped-uid";
1105 snprintf(txtuid, 20, "%d", hostid_mapped);
1106 n2[n2args-4] = txtuid;
1107 n2[n2args-3] = "--mapped-gid";
1108 snprintf(txtgid, 20, "%d", hostgid_mapped);
1109 n2[n2args-2] = txtgid;
1110 n2[n2args-1] = NULL;
1111 free(newargv);
1112 newargv = n2;
1113 }
1114 /* execute */
1115 execvp(tpath, newargv);
1116 SYSERROR("failed to execute template %s", tpath);
1117 exit(1);
1118 }
1119
1120 if (wait_for_pid(pid) != 0) {
1121 ERROR("container creation template for %s failed", c->name);
1122 return false;
1123 }
1124
1125 return true;
1126 }
1127
/*
 * Rewrite the config file @path so that it begins with a comment header
 * naming the template @t, the template parameters @argv (if any) and, when
 * built with HAVE_LIBGNUTLS, the SHA-1 of the template script. The file's
 * previous contents follow the header.
 *
 * The whole file is read into memory, then the file is reopened for
 * writing (truncating it) and written back.
 *
 * Returns true on success, false on any failure.
 */
static bool prepend_lxc_header(char *path, const char *t, char *const argv[])
{
	long flen;
	char *contents;
	FILE *f;
	int ret = -1;
#if HAVE_LIBGNUTLS
	int i;
	unsigned char md_value[SHA_DIGEST_LENGTH];
	char *tpath;
#endif

	f = fopen(path, "r");
	if (f == NULL)
		return false;

	if (fseek(f, 0, SEEK_END) < 0)
		goto out_error;
	if ((flen = ftell(f)) < 0)
		goto out_error;
	if (fseek(f, 0, SEEK_SET) < 0)
		goto out_error;
	if ((contents = malloc(flen + 1)) == NULL)
		goto out_error;
	if (fread(contents, 1, flen, f) != (size_t)flen)
		goto out_free_contents;

	contents[flen] = '\0';
	ret = fclose(f);
	f = NULL;
	if (ret < 0)
		goto out_free_contents;

#if HAVE_LIBGNUTLS
	tpath = get_template_path(t);
	if (!tpath) {
		ERROR("bad template: %s", t);
		/* ret still holds fclose()'s 0; make the failure visible */
		ret = -1;
		goto out_free_contents;
	}

	ret = sha1sum_file(tpath, md_value);
	if (ret < 0) {
		ERROR("Error getting sha1sum of %s", tpath);
		free(tpath);
		goto out_free_contents;
	}
	free(tpath);
#endif

	f = fopen(path, "w");
	if (f == NULL) {
		SYSERROR("reopening config for writing");
		free(contents);
		return false;
	}
	fprintf(f, "# Template used to create this container: %s\n", t);
	if (argv) {
		fprintf(f, "# Parameters passed to the template:");
		while (*argv) {
			fprintf(f, " %s", *argv);
			argv++;
		}
		fprintf(f, "\n");
	}
#if HAVE_LIBGNUTLS
	fprintf(f, "# Template script checksum (SHA-1): ");
	for (i=0; i<SHA_DIGEST_LENGTH; i++)
		fprintf(f, "%02x", md_value[i]);
	fprintf(f, "\n");
#endif
	fprintf(f, "# For additional config options, please look at lxc.container.conf(5)\n");
	if (fwrite(contents, 1, flen, f) != (size_t)flen) {
		SYSERROR("Writing original contents");
		free(contents);
		fclose(f);
		return false;
	}
	ret = 0;
out_free_contents:
	free(contents);
out_error:
	if (f) {
		int newret;
		/* a failing fclose() on the write stream also counts as failure */
		newret = fclose(f);
		if (ret == 0)
			ret = newret;
	}
	if (ret < 0) {
		SYSERROR("Error prepending header");
		return false;
	}
	return true;
}
1221
1222 static void lxcapi_clear_config(struct lxc_container *c)
1223 {
1224 if (c) {
1225 if (c->lxc_conf) {
1226 lxc_conf_free(c->lxc_conf);
1227 c->lxc_conf = NULL;
1228 }
1229 }
1230 }
1231
1232 static bool lxcapi_destroy(struct lxc_container *c);
1233 static bool container_destroy(struct lxc_container *c);
1234 static bool get_snappath_dir(struct lxc_container *c, char *snappath);
1235 /*
1236 * lxcapi_create:
1237 * create a container with the given parameters.
1238 * @c: container to be created. It has the lxcpath, name, and a starting
1239 * configuration already set
1240 * @t: the template to execute to instantiate the root filesystem and
1241 * adjust the configuration.
1242 * @bdevtype: backing store type to use. If NULL, dir will be used.
1243 * @specs: additional parameters for the backing store, i.e. LVM vg to
1244 * use.
1245 *
1246 * @argv: the arguments to pass to the template, terminated by NULL. If no
1247 * arguments, you can just pass NULL.
1248 */
1249 static bool lxcapi_create(struct lxc_container *c, const char *t,
1250 const char *bdevtype, struct bdev_specs *specs, int flags,
1251 char *const argv[])
1252 {
1253 bool ret = false;
1254 pid_t pid;
1255 char *tpath = NULL;
1256 int partial_fd;
1257
1258 if (!c)
1259 return false;
1260
1261 if (t) {
1262 tpath = get_template_path(t);
1263 if (!tpath) {
1264 ERROR("bad template: %s", t);
1265 goto out;
1266 }
1267 }
1268
1269 /*
1270 * If a template is passed in, and the rootfs already is defined in
1271 * the container config and exists, then * caller is trying to create
1272 * an existing container. Return an error, but do NOT delete the
1273 * container.
1274 */
1275 if (lxcapi_is_defined(c) && c->lxc_conf && c->lxc_conf->rootfs.path &&
1276 access(c->lxc_conf->rootfs.path, F_OK) == 0 && tpath) {
1277 ERROR("Container %s:%s already exists", c->config_path, c->name);
1278 goto free_tpath;
1279 }
1280
1281 if (!c->lxc_conf) {
1282 if (!c->load_config(c, lxc_global_config_value("lxc.default_config"))) {
1283 ERROR("Error loading default configuration file %s", lxc_global_config_value("lxc.default_config"));
1284 goto free_tpath;
1285 }
1286 }
1287
1288 if (!create_container_dir(c))
1289 goto free_tpath;
1290
1291 /*
1292 * either template or rootfs.path should be set.
1293 * if both template and rootfs.path are set, template is setup as rootfs.path.
1294 * container is already created if we have a config and rootfs.path is accessible
1295 */
1296 if (!c->lxc_conf->rootfs.path && !tpath)
1297 /* no template passed in and rootfs does not exist: error */
1298 goto out;
1299 if (c->lxc_conf->rootfs.path && access(c->lxc_conf->rootfs.path, F_OK) != 0)
1300 /* rootfs passed into configuration, but does not exist: error */
1301 goto out;
1302 if (lxcapi_is_defined(c) && c->lxc_conf->rootfs.path && !tpath) {
1303 /* Rootfs already existed, user just wanted to save the
1304 * loaded configuration */
1305 ret = true;
1306 goto out;
1307 }
1308
1309 /* Mark that this container is being created */
1310 if ((partial_fd = create_partial(c)) < 0)
1311 goto out;
1312
1313 /* no need to get disk lock bc we have the partial locked */
1314
1315 /*
1316 * Create the backing store
1317 * Note we can't do this in the same task as we use to execute the
1318 * template because of the way zfs works.
1319 * After you 'zfs create', zfs mounts the fs only in the initial
1320 * namespace.
1321 */
1322 pid = fork();
1323 if (pid < 0) {
1324 SYSERROR("failed to fork task for container creation template");
1325 goto out_unlock;
1326 }
1327
1328 if (pid == 0) { // child
1329 struct bdev *bdev = NULL;
1330
1331 if (!(bdev = do_bdev_create(c, bdevtype, specs))) {
1332 ERROR("Error creating backing store type %s for %s",
1333 bdevtype ? bdevtype : "(none)", c->name);
1334 exit(1);
1335 }
1336
1337 /* save config file again to store the new rootfs location */
1338 if (!c->save_config(c, NULL)) {
1339 ERROR("failed to save starting configuration for %s", c->name);
1340 // parent task won't see bdev in config so we delete it
1341 bdev->ops->umount(bdev);
1342 bdev->ops->destroy(bdev);
1343 exit(1);
1344 }
1345 exit(0);
1346 }
1347 if (wait_for_pid(pid) != 0)
1348 goto out_unlock;
1349
1350 /* reload config to get the rootfs */
1351 lxc_conf_free(c->lxc_conf);
1352 c->lxc_conf = NULL;
1353 if (!load_config_locked(c, c->configfile))
1354 goto out_unlock;
1355
1356 if (!create_run_template(c, tpath, !!(flags & LXC_CREATE_QUIET), argv))
1357 goto out_unlock;
1358
1359 // now clear out the lxc_conf we have, reload from the created
1360 // container
1361 lxcapi_clear_config(c);
1362
1363 if (t) {
1364 if (!prepend_lxc_header(c->configfile, tpath, argv)) {
1365 ERROR("Error prepending header to configuration file");
1366 goto out_unlock;
1367 }
1368 }
1369 ret = load_config_locked(c, c->configfile);
1370
1371 out_unlock:
1372 if (partial_fd >= 0)
1373 remove_partial(c, partial_fd);
1374 out:
1375 if (!ret && c)
1376 container_destroy(c);
1377 free_tpath:
1378 if (tpath)
1379 free(tpath);
1380 return ret;
1381 }
1382
1383 static bool lxcapi_reboot(struct lxc_container *c)
1384 {
1385 pid_t pid;
1386
1387 if (!c)
1388 return false;
1389 if (!c->is_running(c))
1390 return false;
1391 pid = c->init_pid(c);
1392 if (pid <= 0)
1393 return false;
1394 if (kill(pid, SIGINT) < 0)
1395 return false;
1396 return true;
1397
1398 }
1399
1400 static bool lxcapi_shutdown(struct lxc_container *c, int timeout)
1401 {
1402 bool retv;
1403 pid_t pid;
1404 int haltsignal = SIGPWR;
1405
1406 if (!c)
1407 return false;
1408
1409 if (!c->is_running(c))
1410 return true;
1411 pid = c->init_pid(c);
1412 if (pid <= 0)
1413 return true;
1414 if (c->lxc_conf && c->lxc_conf->haltsignal)
1415 haltsignal = c->lxc_conf->haltsignal;
1416 kill(pid, haltsignal);
1417 retv = c->wait(c, "STOPPED", timeout);
1418 return retv;
1419 }
1420
1421 static bool lxcapi_createl(struct lxc_container *c, const char *t,
1422 const char *bdevtype, struct bdev_specs *specs, int flags, ...)
1423 {
1424 bool bret = false;
1425 char **args = NULL;
1426 va_list ap;
1427
1428 if (!c)
1429 return false;
1430
1431 /*
1432 * since we're going to wait for create to finish, I don't think we
1433 * need to get a copy of the arguments.
1434 */
1435 va_start(ap, flags);
1436 args = lxc_va_arg_list_to_argv(ap, 0, 0);
1437 va_end(ap);
1438 if (!args) {
1439 ERROR("Memory allocation error.");
1440 goto out;
1441 }
1442
1443 bret = c->create(c, t, bdevtype, specs, flags, args);
1444
1445 out:
1446 free(args);
1447 return bret;
1448 }
1449
/*
 * Remove @key from the unexpanded configuration and record an empty
 * assignment for it.
 *
 * For the group keys "lxc.cgroup", "lxc.network" and "lxc.hook" the third
 * argument of clear_unexp_config_line() is true, for every other key it is
 * false (presumably this selects removal of all sub-keys -- confirm against
 * clear_unexp_config_line()). A failure to append the empty line is only
 * logged.
 */
static void do_clear_unexp_config_line(struct lxc_conf *conf, const char *key)
{
	bool is_group_key = strcmp(key, "lxc.cgroup") == 0 ||
			    strcmp(key, "lxc.network") == 0 ||
			    strcmp(key, "lxc.hook") == 0;

	clear_unexp_config_line(conf, key, is_group_key);

	if (!do_append_unexp_config_line(conf, key, ""))
		WARN("Error clearing configuration for %s", key);
}
1463
1464 static bool lxcapi_clear_config_item(struct lxc_container *c, const char *key)
1465 {
1466 int ret;
1467
1468 if (!c || !c->lxc_conf)
1469 return false;
1470 if (container_mem_lock(c))
1471 return false;
1472 ret = lxc_clear_config_item(c->lxc_conf, key);
1473 if (!ret)
1474 do_clear_unexp_config_line(c->lxc_conf, key);
1475 container_mem_unlock(c);
1476 return ret == 0;
1477 }
1478
1479 static inline bool enter_to_ns(struct lxc_container *c)
1480 {
1481 pid_t pid = c->init_pid(c);
1482
1483 if ((geteuid() != 0 || (c->lxc_conf && !lxc_list_empty(&c->lxc_conf->id_map))) && access("/proc/self/ns/user", F_OK) == 0) {
1484 if (!switch_to_ns(pid, "user"))
1485 return false;
1486 }
1487 return switch_to_ns(pid, "net");
1488 }
1489
// qsort/bsearch comparator for arrays of C strings: both arguments point
// at array elements (char *), which are compared with strcmp()
static inline int string_cmp(char **first, char **second)
{
	const char *lhs = *first;
	const char *rhs = *second;

	return strcmp(lhs, rhs);
}
1495
1496 // used by qsort and bsearch functions for comparing container names
1497 static inline int container_cmp(struct lxc_container **first, struct lxc_container **second)
1498 {
1499 return strcmp((*first)->name, (*second)->name);
1500 }
1501
1502 static bool add_to_array(char ***names, char *cname, int pos)
1503 {
1504 char **newnames = realloc(*names, (pos+1) * sizeof(char *));
1505 if (!newnames) {
1506 ERROR("Out of memory");
1507 return false;
1508 }
1509
1510 *names = newnames;
1511 newnames[pos] = strdup(cname);
1512 if (!newnames[pos])
1513 return false;
1514
1515 // sort the arrray as we will use binary search on it
1516 qsort(newnames, pos + 1, sizeof(char *), (int (*)(const void *,const void *))string_cmp);
1517
1518 return true;
1519 }
1520
1521 static bool add_to_clist(struct lxc_container ***list, struct lxc_container *c, int pos, bool sort)
1522 {
1523 struct lxc_container **newlist = realloc(*list, (pos+1) * sizeof(struct lxc_container *));
1524 if (!newlist) {
1525 ERROR("Out of memory");
1526 return false;
1527 }
1528
1529 *list = newlist;
1530 newlist[pos] = c;
1531
1532 // sort the arrray as we will use binary search on it
1533 if (sort)
1534 qsort(newlist, pos + 1, sizeof(struct lxc_container *), (int (*)(const void *,const void *))container_cmp);
1535
1536 return true;
1537 }
1538
1539 static char** get_from_array(char ***names, char *cname, int size)
1540 {
1541 return (char **)bsearch(&cname, *names, size, sizeof(char *), (int (*)(const void *, const void *))string_cmp);
1542 }
1543
1544
/*
 * Tell whether the sorted string array *names (@size entries) holds @cname.
 */
static bool array_contains(char ***names, char *cname, int size)
{
	return get_from_array(names, cname, size) != NULL;
}
1550
/*
 * Remove @cname from the sorted string array *names.
 *
 * @size is the number of entries before the removal. The matching string
 * is freed and the following entries are shifted down by one, so the first
 * size - 1 slots stay sorted and valid; the vacated last slot is set to
 * NULL. The array itself is not shrunk. The caller is expected to
 * decrement its own element count when true is returned.
 *
 * Returns false when @cname is not in the array.
 */
static bool remove_from_array(char ***names, char *cname, int size)
{
	char **slot = get_from_array(names, cname, size);
	char **end;

	if (!slot)
		return false;

	/*
	 * slot points INTO the array: free the string it refers to, never
	 * the slot address itself.
	 */
	free(*slot);

	end = *names + size;
	memmove(slot, slot + 1, (size_t)(end - (slot + 1)) * sizeof(char *));
	end[-1] = NULL;

	return true;
}
1560
1561 static char** lxcapi_get_interfaces(struct lxc_container *c)
1562 {
1563 pid_t pid;
1564 int i, count = 0, pipefd[2];
1565 char **interfaces = NULL;
1566 char interface[IFNAMSIZ];
1567
1568 if(pipe(pipefd) < 0) {
1569 SYSERROR("pipe failed");
1570 return NULL;
1571 }
1572
1573 pid = fork();
1574 if (pid < 0) {
1575 SYSERROR("failed to fork task to get interfaces information");
1576 close(pipefd[0]);
1577 close(pipefd[1]);
1578 return NULL;
1579 }
1580
1581 if (pid == 0) { // child
1582 int ret = 1, nbytes;
1583 struct ifaddrs *interfaceArray = NULL, *tempIfAddr = NULL;
1584
1585 /* close the read-end of the pipe */
1586 close(pipefd[0]);
1587
1588 if (!enter_to_ns(c)) {
1589 SYSERROR("failed to enter namespace");
1590 goto out;
1591 }
1592
1593 /* Grab the list of interfaces */
1594 if (getifaddrs(&interfaceArray)) {
1595 SYSERROR("failed to get interfaces list");
1596 goto out;
1597 }
1598
1599 /* Iterate through the interfaces */
1600 for (tempIfAddr = interfaceArray; tempIfAddr != NULL; tempIfAddr = tempIfAddr->ifa_next) {
1601 nbytes = write(pipefd[1], tempIfAddr->ifa_name, IFNAMSIZ);
1602 if (nbytes < 0) {
1603 ERROR("write failed");
1604 goto out;
1605 }
1606 count++;
1607 }
1608 ret = 0;
1609
1610 out:
1611 if (interfaceArray)
1612 freeifaddrs(interfaceArray);
1613
1614 /* close the write-end of the pipe, thus sending EOF to the reader */
1615 close(pipefd[1]);
1616 exit(ret);
1617 }
1618
1619 /* close the write-end of the pipe */
1620 close(pipefd[1]);
1621
1622 while (read(pipefd[0], &interface, IFNAMSIZ) == IFNAMSIZ) {
1623 if (array_contains(&interfaces, interface, count))
1624 continue;
1625
1626 if(!add_to_array(&interfaces, interface, count))
1627 ERROR("PARENT: add_to_array failed");
1628 count++;
1629 }
1630
1631 if (wait_for_pid(pid) != 0) {
1632 for(i=0;i<count;i++)
1633 free(interfaces[i]);
1634 free(interfaces);
1635 interfaces = NULL;
1636 }
1637
1638 /* close the read-end of the pipe */
1639 close(pipefd[0]);
1640
1641 /* Append NULL to the array */
1642 if(interfaces)
1643 interfaces = (char **)lxc_append_null_to_array((void **)interfaces, count);
1644
1645 return interfaces;
1646 }
1647
/*
 * List the IP addresses configured inside container @c.
 *
 * @interface: only report addresses of this interface; when NULL every
 *             interface except "lo" is reported.
 * @family:    "inet" for IPv4 only, "inet6" for IPv6 only, NULL for both.
 * @scope:     IPv6 addresses are only reported when their sin6_scope_id
 *             equals this value.
 *
 * A child process enters the container's namespaces (see enter_to_ns()),
 * walks getifaddrs() and sends each address in text form to the parent over
 * a pipe as a fixed-size, NUL-padded record of INET6_ADDRSTRLEN bytes.
 *
 * Returns a NULL-terminated, sorted array of strings, or NULL when nothing
 * was collected or the child failed.
 */
static char** lxcapi_get_ips(struct lxc_container *c, const char* interface, const char* family, int scope)
{
	pid_t pid;
	int i, count = 0, pipefd[2];
	char **addresses = NULL;
	char address[INET6_ADDRSTRLEN];

	if (pipe(pipefd) < 0) {
		SYSERROR("pipe failed");
		return NULL;
	}

	pid = fork();
	if (pid < 0) {
		SYSERROR("failed to fork task to get container ips");
		close(pipefd[0]);
		close(pipefd[1]);
		return NULL;
	}

	if (pid == 0) { // child
		int ret = 1, nbytes;
		struct ifaddrs *interfaceArray = NULL, *tempIfAddr = NULL;
		char addressOutputBuffer[INET6_ADDRSTRLEN];
		void *tempAddrPtr = NULL;
		const char *text = NULL;

		/* close the read-end of the pipe */
		close(pipefd[0]);

		if (!enter_to_ns(c)) {
			SYSERROR("failed to enter namespace");
			goto out;
		}

		/* Grab the list of interfaces */
		if (getifaddrs(&interfaceArray)) {
			SYSERROR("failed to get interfaces list");
			goto out;
		}

		/* Iterate through the interfaces */
		for (tempIfAddr = interfaceArray; tempIfAddr != NULL; tempIfAddr = tempIfAddr->ifa_next) {
			if (tempIfAddr->ifa_addr == NULL)
				continue;

			if (tempIfAddr->ifa_addr->sa_family == AF_INET) {
				if (family && strcmp(family, "inet"))
					continue;
				tempAddrPtr = &((struct sockaddr_in *)tempIfAddr->ifa_addr)->sin_addr;
			} else if (tempIfAddr->ifa_addr->sa_family == AF_INET6) {
				if (family && strcmp(family, "inet6"))
					continue;

				if (((struct sockaddr_in6 *)tempIfAddr->ifa_addr)->sin6_scope_id != scope)
					continue;

				tempAddrPtr = &((struct sockaddr_in6 *)tempIfAddr->ifa_addr)->sin6_addr;
			} else {
				/*
				 * Other families (e.g. link-level addresses)
				 * are not sockaddr_in6 and must not be read
				 * as such; inet_ntop() could not format them
				 * anyway.
				 */
				continue;
			}

			if (interface && strcmp(interface, tempIfAddr->ifa_name))
				continue;
			else if (!interface && strcmp("lo", tempIfAddr->ifa_name) == 0)
				continue;

			/* zero-pad the record so no stale stack bytes are sent */
			memset(addressOutputBuffer, 0, sizeof(addressOutputBuffer));
			text = inet_ntop(tempIfAddr->ifa_addr->sa_family,
					 tempAddrPtr,
					 addressOutputBuffer,
					 sizeof(addressOutputBuffer));
			if (!text)
				continue;

			nbytes = write(pipefd[1], addressOutputBuffer, INET6_ADDRSTRLEN);
			if (nbytes < 0) {
				ERROR("write failed");
				goto out;
			}
		}
		ret = 0;

	out:
		if (interfaceArray)
			freeifaddrs(interfaceArray);

		/* close the write-end of the pipe, thus sending EOF to the reader */
		close(pipefd[1]);
		exit(ret);
	}

	/* close the write-end of the pipe */
	close(pipefd[1]);

	while (read(pipefd[0], &address, INET6_ADDRSTRLEN) == INET6_ADDRSTRLEN) {
		/* never trust the peer to have terminated the record */
		address[INET6_ADDRSTRLEN - 1] = '\0';

		if (!add_to_array(&addresses, address, count)) {
			ERROR("PARENT: add_to_array failed");
			/* the slot was not filled: do not count it */
			continue;
		}
		count++;
	}

	if (wait_for_pid(pid) != 0) {
		for (i = 0; i < count; i++)
			free(addresses[i]);
		free(addresses);
		addresses = NULL;
	}

	/* close the read-end of the pipe */
	close(pipefd[0]);

	/* Append NULL to the array */
	if (addresses)
		addresses = (char **)lxc_append_null_to_array((void **)addresses, count);

	return addresses;
}
1764
1765 static int lxcapi_get_config_item(struct lxc_container *c, const char *key, char *retv, int inlen)
1766 {
1767 int ret;
1768
1769 if (!c || !c->lxc_conf)
1770 return -1;
1771 if (container_mem_lock(c))
1772 return -1;
1773 ret = lxc_get_config_item(c->lxc_conf, key, retv, inlen);
1774 container_mem_unlock(c);
1775 return ret;
1776 }
1777
1778 static char* lxcapi_get_running_config_item(struct lxc_container *c, const char *key)
1779 {
1780 char *ret;
1781
1782 if (!c || !c->lxc_conf)
1783 return NULL;
1784 if (container_mem_lock(c))
1785 return NULL;
1786 ret = lxc_cmd_get_config_item(c->name, key, c->get_config_path(c));
1787 container_mem_unlock(c);
1788 return ret;
1789 }
1790
1791 static int lxcapi_get_keys(struct lxc_container *c, const char *key, char *retv, int inlen)
1792 {
1793 if (!key)
1794 return lxc_listconfigs(retv, inlen);
1795 /*
1796 * Support 'lxc.network.<idx>', i.e. 'lxc.network.0'
1797 * This is an intelligent result to show which keys are valid given
1798 * the type of nic it is
1799 */
1800 if (!c || !c->lxc_conf)
1801 return -1;
1802 if (container_mem_lock(c))
1803 return -1;
1804 int ret = -1;
1805 if (strncmp(key, "lxc.network.", 12) == 0)
1806 ret = lxc_list_nicconfigs(c->lxc_conf, key, retv, inlen);
1807 container_mem_unlock(c);
1808 return ret;
1809 }
1810
1811 static bool lxcapi_save_config(struct lxc_container *c, const char *alt_file)
1812 {
1813 FILE *fout;
1814 bool ret = false, need_disklock = false;
1815 int lret;
1816
1817 if (!alt_file)
1818 alt_file = c->configfile;
1819 if (!alt_file)
1820 return false; // should we write to stdout if no file is specified?
1821
1822 // If we haven't yet loaded a config, load the stock config
1823 if (!c->lxc_conf) {
1824 if (!c->load_config(c, lxc_global_config_value("lxc.default_config"))) {
1825 ERROR("Error loading default configuration file %s while saving %s", lxc_global_config_value("lxc.default_config"), c->name);
1826 return false;
1827 }
1828 }
1829
1830 if (!create_container_dir(c))
1831 return false;
1832
1833 /*
1834 * If we're writing to the container's config file, take the
1835 * disk lock. Otherwise just take the memlock to protect the
1836 * struct lxc_container while we're traversing it.
1837 */
1838 if (strcmp(c->configfile, alt_file) == 0)
1839 need_disklock = true;
1840
1841 if (need_disklock)
1842 lret = container_disk_lock(c);
1843 else
1844 lret = container_mem_lock(c);
1845
1846 if (lret)
1847 return false;
1848
1849 fout = fopen(alt_file, "w");
1850 if (!fout)
1851 goto out;
1852 write_config(fout, c->lxc_conf);
1853 fclose(fout);
1854 ret = true;
1855
1856 out:
1857 if (need_disklock)
1858 container_disk_unlock(c);
1859 else
1860 container_mem_unlock(c);
1861 return ret;
1862 }
1863
1864 static bool mod_rdep(struct lxc_container *c, bool inc)
1865 {
1866 char path[MAXPATHLEN];
1867 int ret, v = 0;
1868 FILE *f;
1869 bool bret = false;
1870
1871 if (container_disk_lock(c))
1872 return false;
1873 ret = snprintf(path, MAXPATHLEN, "%s/%s/lxc_snapshots", c->config_path,
1874 c->name);
1875 if (ret < 0 || ret > MAXPATHLEN)
1876 goto out;
1877 f = fopen(path, "r");
1878 if (f) {
1879 ret = fscanf(f, "%d", &v);
1880 fclose(f);
1881 if (ret != 1) {
1882 ERROR("Corrupted file %s", path);
1883 goto out;
1884 }
1885 }
1886 v += inc ? 1 : -1;
1887 f = fopen(path, "w");
1888 if (!f)
1889 goto out;
1890 if (fprintf(f, "%d\n", v) < 0) {
1891 ERROR("Error writing new snapshots value");
1892 fclose(f);
1893 goto out;
1894 }
1895 ret = fclose(f);
1896 if (ret != 0) {
1897 SYSERROR("Error writing to or closing snapshots file");
1898 goto out;
1899 }
1900
1901 bret = true;
1902
1903 out:
1904 container_disk_unlock(c);
1905 return bret;
1906 }
1907
/*
 * Remove one trailing '\n' from the string @p, in place.
 * Empty strings and strings not ending in a newline are left unchanged.
 */
static void strip_newline(char *p)
{
	size_t n = strlen(p);

	if (n > 0 && p[n - 1] == '\n')
		p[n - 1] = '\0';
}
1916
1917 static void mod_all_rdeps(struct lxc_container *c, bool inc)
1918 {
1919 struct lxc_container *p;
1920 char *lxcpath = NULL, *lxcname = NULL, path[MAXPATHLEN];
1921 size_t pathlen = 0, namelen = 0;
1922 FILE *f;
1923 int ret;
1924
1925 ret = snprintf(path, MAXPATHLEN, "%s/%s/lxc_rdepends",
1926 c->config_path, c->name);
1927 if (ret < 0 || ret >= MAXPATHLEN) {
1928 ERROR("Path name too long");
1929 return;
1930 }
1931 f = fopen(path, "r");
1932 if (f == NULL)
1933 return;
1934 while (getline(&lxcpath, &pathlen, f) != -1) {
1935 if (getline(&lxcname, &namelen, f) == -1) {
1936 ERROR("badly formatted file %s", path);
1937 goto out;
1938 }
1939 strip_newline(lxcpath);
1940 strip_newline(lxcname);
1941 if ((p = lxc_container_new(lxcname, lxcpath)) == NULL) {
1942 ERROR("Unable to find dependent container %s:%s",
1943 lxcpath, lxcname);
1944 continue;
1945 }
1946 if (!mod_rdep(p, inc))
1947 ERROR("Failed to increase numsnapshots for %s:%s",
1948 lxcpath, lxcname);
1949 lxc_container_put(p);
1950 }
1951 out:
1952 if (lxcpath) free(lxcpath);
1953 if (lxcname) free(lxcname);
1954 fclose(f);
1955 }
1956
1957 static bool has_fs_snapshots(struct lxc_container *c)
1958 {
1959 char path[MAXPATHLEN];
1960 int ret, v;
1961 FILE *f;
1962 bool bret = false;
1963
1964 ret = snprintf(path, MAXPATHLEN, "%s/%s/lxc_snapshots", c->config_path,
1965 c->name);
1966 if (ret < 0 || ret > MAXPATHLEN)
1967 goto out;
1968 f = fopen(path, "r");
1969 if (!f)
1970 goto out;
1971 ret = fscanf(f, "%d", &v);
1972 fclose(f);
1973 if (ret != 1)
1974 goto out;
1975 bret = v != 0;
1976
1977 out:
1978 return bret;
1979 }
1980
/*
 * Tell whether the snapshot directory of container @c (as given by
 * get_snappath_dir()) contains any entry other than "." and "..".
 *
 * Returns false when the path cannot be determined or the directory cannot
 * be opened.
 */
static bool has_snapshots(struct lxc_container *c)
{
	char snapdir[MAXPATHLEN];
	struct dirent entry, *cur;
	bool found = false;
	DIR *dir;

	if (!get_snappath_dir(c, snapdir))
		return false;

	dir = opendir(snapdir);
	if (!dir)
		return false;

	while (readdir_r(dir, &entry, &cur) == 0 && cur) {
		if (strcmp(cur->d_name, ".") == 0 ||
		    strcmp(cur->d_name, "..") == 0)
			continue;

		/* one real entry is enough */
		found = true;
		break;
	}

	closedir(dir);

	return found;
}
2008
/*
 * Callback adapter with an int (*)(void *) signature: @data is the path
 * string handed to lxc_rmdir_onedev(), with "snaps" as second argument.
 */
static int lxc_rmdir_onedev_wrapper(void *data)
{
	return lxc_rmdir_onedev((char *)data, "snaps");
}
2014
2015 static int do_bdev_destroy(struct lxc_conf *conf)
2016 {
2017 struct bdev *r;
2018 int ret = 0;
2019
2020 r = bdev_init(conf, conf->rootfs.path, conf->rootfs.mount, NULL);
2021 if (!r)
2022 return -1;
2023
2024 if (r->ops->destroy(r) < 0)
2025 ret = -1;
2026 bdev_put(r);
2027 return ret;
2028 }
2029
/*
 * Callback adapter around do_bdev_destroy(); @data is the struct lxc_conf.
 *
 * Before destroying the backing store the task switches to gid 0, drops
 * its supplementary groups (failure is only a warning) and switches to
 * uid 0. Returns -1 if setgid() or setuid() fails, otherwise the result
 * of do_bdev_destroy().
 */
static int bdev_destroy_wrapper(void *data)
{
	if (setgid(0) < 0) {
		ERROR("Failed to setgid to 0");
		return -1;
	}

	if (setgroups(0, NULL) < 0)
		WARN("Failed to clear groups");

	if (setuid(0) < 0) {
		ERROR("Failed to setuid to 0");
		return -1;
	}

	return do_bdev_destroy((struct lxc_conf *)data);
}
2046
2047 static bool container_destroy(struct lxc_container *c)
2048 {
2049 bool bret = false;
2050 int ret;
2051
2052 if (!c || !lxcapi_is_defined(c))
2053 return false;
2054
2055 if (container_disk_lock(c))
2056 return false;
2057
2058 if (!is_stopped(c)) {
2059 // we should queue some sort of error - in c->error_string?
2060 ERROR("container %s is not stopped", c->name);
2061 goto out;
2062 }
2063
2064 if (c->lxc_conf && c->lxc_conf->rootfs.path && c->lxc_conf->rootfs.mount) {
2065 if (am_unpriv())
2066 ret = userns_exec_1(c->lxc_conf, bdev_destroy_wrapper, c->lxc_conf);
2067 else
2068 ret = do_bdev_destroy(c->lxc_conf);
2069 if (ret < 0) {
2070 ERROR("Error destroying rootfs for %s", c->name);
2071 goto out;
2072 }
2073 }
2074
2075 mod_all_rdeps(c, false);
2076
2077 const char *p1 = lxcapi_get_config_path(c);
2078 char *path = alloca(strlen(p1) + strlen(c->name) + 2);
2079 sprintf(path, "%s/%s", p1, c->name);
2080 if (am_unpriv())
2081 ret = userns_exec_1(c->lxc_conf, lxc_rmdir_onedev_wrapper, path);
2082 else
2083 ret = lxc_rmdir_onedev(path, "snaps");
2084 if (ret < 0) {
2085 ERROR("Error destroying container directory for %s", c->name);
2086 goto out;
2087 }
2088 bret = true;
2089
2090 out:
2091 container_disk_unlock(c);
2092 return bret;
2093 }
2094
2095 static bool lxcapi_destroy(struct lxc_container *c)
2096 {
2097 if (!c || !lxcapi_is_defined(c))
2098 return false;
2099 if (has_snapshots(c)) {
2100 ERROR("Container %s has snapshots; not removing", c->name);
2101 return false;
2102 }
2103
2104 if (has_fs_snapshots(c)) {
2105 ERROR("container %s has snapshots on its rootfs", c->name);
2106 return false;
2107 }
2108
2109 return container_destroy(c);
2110 }
2111
2112 static bool lxcapi_snapshot_destroy_all(struct lxc_container *c);
2113
/*
 * Destroy container @c together with all of its snapshots.
 *
 * All snapshots are removed first with lxcapi_snapshot_destroy_all(); if
 * that fails nothing else is attempted. Returns false for a NULL or
 * undefined container, otherwise the result of lxcapi_destroy().
 */
static bool lxcapi_destroy_with_snapshots(struct lxc_container *c)
{
	if (!c)
		return false;

	if (!lxcapi_is_defined(c))
		return false;

	if (!lxcapi_snapshot_destroy_all(c)) {
		ERROR("Error deleting all snapshots");
		return false;
	}

	return lxcapi_destroy(c);
}
2124
2125 static bool set_config_item_locked(struct lxc_container *c, const char *key, const char *v)
2126 {
2127 struct lxc_config_t *config;
2128
2129 if (!c->lxc_conf)
2130 c->lxc_conf = lxc_conf_init();
2131 if (!c->lxc_conf)
2132 return false;
2133 config = lxc_getconfig(key);
2134 if (!config)
2135 return false;
2136 if (config->cb(key, v, c->lxc_conf) != 0)
2137 return false;
2138 return do_append_unexp_config_line(c->lxc_conf, key, v);
2139 }
2140
/*
 * Set configuration item @key to @v on container @c under the container
 * memory lock.
 *
 * Returns false for a NULL container or when the lock cannot be taken,
 * otherwise the result of set_config_item_locked().
 */
static bool lxcapi_set_config_item(struct lxc_container *c, const char *key, const char *v)
{
	bool ok;

	if (!c || container_mem_lock(c))
		return false;

	ok = set_config_item_locked(c, key, v);
	container_mem_unlock(c);

	return ok;
}
2156
2157 static char *lxcapi_config_file_name(struct lxc_container *c)
2158 {
2159 if (!c || !c->configfile)
2160 return NULL;
2161 return strdup(c->configfile);
2162 }
2163
2164 static const char *lxcapi_get_config_path(struct lxc_container *c)
2165 {
2166 if (!c || !c->config_path)
2167 return NULL;
2168 return (const char *)(c->config_path);
2169 }
2170
2171 /*
2172 * not for export
2173 * Just recalculate the c->configfile based on the
2174 * c->config_path, which must be set.
2175 * The lxc_container must be locked or not yet public.
2176 */
2177 static bool set_config_filename(struct lxc_container *c)
2178 {
2179 char *newpath;
2180 int len, ret;
2181
2182 if (!c->config_path)
2183 return false;
2184
2185 /* $lxc_path + "/" + c->name + "/" + "config" + '\0' */
2186 len = strlen(c->config_path) + strlen(c->name) + strlen("config") + 3;
2187 newpath = malloc(len);
2188 if (!newpath)
2189 return false;
2190
2191 ret = snprintf(newpath, len, "%s/%s/config", c->config_path, c->name);
2192 if (ret < 0 || ret >= len) {
2193 fprintf(stderr, "Error printing out config file name\n");
2194 free(newpath);
2195 return false;
2196 }
2197
2198 if (c->configfile)
2199 free(c->configfile);
2200 c->configfile = newpath;
2201
2202 return true;
2203 }
2204
2205 static bool lxcapi_set_config_path(struct lxc_container *c, const char *path)
2206 {
2207 char *p;
2208 bool b = false;
2209 char *oldpath = NULL;
2210
2211 if (!c)
2212 return b;
2213
2214 if (container_mem_lock(c))
2215 return b;
2216
2217 p = strdup(path);
2218 if (!p) {
2219 ERROR("Out of memory setting new lxc path");
2220 goto err;
2221 }
2222
2223 b = true;
2224 if (c->config_path)
2225 oldpath = c->config_path;
2226 c->config_path = p;
2227
2228 /* Since we've changed the config path, we have to change the
2229 * config file name too */
2230 if (!set_config_filename(c)) {
2231 ERROR("Out of memory setting new config filename");
2232 b = false;
2233 free(c->config_path);
2234 c->config_path = oldpath;
2235 oldpath = NULL;
2236 }
2237 err:
2238 if (oldpath)
2239 free(oldpath);
2240 container_mem_unlock(c);
2241 return b;
2242 }
2243
2244
2245 static bool lxcapi_set_cgroup_item(struct lxc_container *c, const char *subsys, const char *value)
2246 {
2247 int ret;
2248
2249 if (!c)
2250 return false;
2251
2252 if (is_stopped(c))
2253 return false;
2254
2255 if (container_disk_lock(c))
2256 return false;
2257
2258 ret = lxc_cgroup_set(subsys, value, c->name, c->config_path);
2259
2260 container_disk_unlock(c);
2261 return ret == 0;
2262 }
2263
2264 static int lxcapi_get_cgroup_item(struct lxc_container *c, const char *subsys, char *retv, int inlen)
2265 {
2266 int ret;
2267
2268 if (!c)
2269 return -1;
2270
2271 if (is_stopped(c))
2272 return -1;
2273
2274 if (container_disk_lock(c))
2275 return -1;
2276
2277 ret = lxc_cgroup_get(subsys, retv, inlen, c->name, c->config_path);
2278
2279 container_disk_unlock(c);
2280 return ret;
2281 }
2282
/*
 * Exported accessor for global configuration values: forwards @key to
 * lxc_global_config_value() and returns its result unchanged.
 */
const char *lxc_get_global_config_item(const char *key)
{
	const char *value = lxc_global_config_value(key);

	return value;
}
2287
2288 const char *lxc_get_version(void)
2289 {
2290 return LXC_VERSION;
2291 }
2292
/*
 * Copy regular file @old to the new file @new.
 *
 * The destination must not exist yet (it is created with O_CREAT|O_EXCL).
 * The contents are copied in chunks; short writes are continued and
 * reads/writes interrupted by a signal (EINTR) are retried. Afterwards the
 * destination gets the mode of the source; owner and group are not copied.
 *
 * Returns 0 on success, -1 on any error. On a read/write error the
 * partially written destination file is left in place.
 */
static int copy_file(const char *old, const char *new)
{
	int in, out;
	ssize_t len, ret;
	char buf[8096];
	struct stat sbuf;

	if (file_exists(new)) {
		ERROR("copy destination %s exists", new);
		return -1;
	}
	if (stat(old, &sbuf) < 0) {
		INFO("Error stat'ing %s", old);
		return -1;
	}

	in = open(old, O_RDONLY);
	if (in < 0) {
		SYSERROR("Error opening original file %s", old);
		return -1;
	}
	out = open(new, O_CREAT | O_EXCL | O_WRONLY, 0644);
	if (out < 0) {
		SYSERROR("Error opening new file %s", new);
		close(in);
		return -1;
	}

	while (1) {
		char *pos = buf;

		len = read(in, buf, sizeof(buf));
		if (len < 0) {
			if (errno == EINTR)
				continue;
			SYSERROR("Error reading old file %s", old);
			goto err;
		}
		if (len == 0)
			break;

		/* write() may accept fewer bytes than asked: keep going */
		while (len > 0) {
			ret = write(out, pos, len);
			if (ret < 0 && errno == EINTR)
				continue;
			if (ret <= 0) {
				SYSERROR("Error writing to new file %s", new);
				goto err;
			}
			pos += ret;
			len -= ret;
		}
	}
	close(in);
	close(out);

	// we set mode, but not owner/group
	if (chmod(new, sbuf.st_mode)) {
		SYSERROR("Error setting mode on %s", new);
		return -1;
	}

	return 0;

err:
	close(in);
	close(out);
	return -1;
}
2353
2354 static int copyhooks(struct lxc_container *oldc, struct lxc_container *c)
2355 {
2356 int i, len, ret;
2357 struct lxc_list *it;
2358 char *cpath;
2359
2360 len = strlen(oldc->config_path) + strlen(oldc->name) + 3;
2361 cpath = alloca(len);
2362 ret = snprintf(cpath, len, "%s/%s/", oldc->config_path, oldc->name);
2363 if (ret < 0 || ret >= len)
2364 return -1;
2365
2366 for (i=0; i<NUM_LXC_HOOKS; i++) {
2367 lxc_list_for_each(it, &c->lxc_conf->hooks[i]) {
2368 char *hookname = it->elem;
2369 char *fname = strrchr(hookname, '/');
2370 char tmppath[MAXPATHLEN];
2371 if (!fname) // relative path - we don't support, but maybe we should
2372 return 0;
2373 if (strncmp(hookname, cpath, len - 1) != 0) {
2374 // this hook is public - ignore
2375 continue;
2376 }
2377 // copy the script, and change the entry in confile
2378 ret = snprintf(tmppath, MAXPATHLEN, "%s/%s/%s",
2379 c->config_path, c->name, fname+1);
2380 if (ret < 0 || ret >= MAXPATHLEN)
2381 return -1;
2382 ret = copy_file(it->elem, tmppath);
2383 if (ret < 0)
2384 return -1;
2385 free(it->elem);
2386 it->elem = strdup(tmppath);
2387 if (!it->elem) {
2388 ERROR("out of memory copying hook path");
2389 return -1;
2390 }
2391 }
2392 }
2393
2394 if (!clone_update_unexp_hooks(c->lxc_conf, oldc->config_path,
2395 c->config_path, oldc->name, c->name)) {
2396 ERROR("Error saving new hooks in clone");
2397 return -1;
2398 }
2399 c->save_config(c, NULL);
2400 return 0;
2401 }
2402
2403
2404 static int copy_fstab(struct lxc_container *oldc, struct lxc_container *c)
2405 {
2406 char newpath[MAXPATHLEN];
2407 char *oldpath = oldc->lxc_conf->fstab;
2408 int ret;
2409
2410 if (!oldpath)
2411 return 0;
2412
2413 clear_unexp_config_line(c->lxc_conf, "lxc.mount", false);
2414
2415 char *p = strrchr(oldpath, '/');
2416 if (!p)
2417 return -1;
2418 ret = snprintf(newpath, MAXPATHLEN, "%s/%s%s",
2419 c->config_path, c->name, p);
2420 if (ret < 0 || ret >= MAXPATHLEN) {
2421 ERROR("error printing new path for %s", oldpath);
2422 return -1;
2423 }
2424 if (file_exists(newpath)) {
2425 ERROR("error: fstab file %s exists", newpath);
2426 return -1;
2427 }
2428
2429 if (copy_file(oldpath, newpath) < 0) {
2430 ERROR("error: copying %s to %s", oldpath, newpath);
2431 return -1;
2432 }
2433 free(c->lxc_conf->fstab);
2434 c->lxc_conf->fstab = strdup(newpath);
2435 if (!c->lxc_conf->fstab) {
2436 ERROR("error: allocating pathname");
2437 return -1;
2438 }
2439 if (!do_append_unexp_config_line(c->lxc_conf, "lxc.mount", newpath)) {
2440 ERROR("error saving new lxctab");
2441 return -1;
2442 }
2443
2444 return 0;
2445 }
2446
2447 static void copy_rdepends(struct lxc_container *c, struct lxc_container *c0)
2448 {
2449 char path0[MAXPATHLEN], path1[MAXPATHLEN];
2450 int ret;
2451
2452 ret = snprintf(path0, MAXPATHLEN, "%s/%s/lxc_rdepends", c0->config_path,
2453 c0->name);
2454 if (ret < 0 || ret >= MAXPATHLEN) {
2455 WARN("Error copying reverse dependencies");
2456 return;
2457 }
2458 ret = snprintf(path1, MAXPATHLEN, "%s/%s/lxc_rdepends", c->config_path,
2459 c->name);
2460 if (ret < 0 || ret >= MAXPATHLEN) {
2461 WARN("Error copying reverse dependencies");
2462 return;
2463 }
2464 if (copy_file(path0, path1) < 0) {
2465 INFO("Error copying reverse dependencies");
2466 return;
2467 }
2468 }
2469
2470 static bool add_rdepends(struct lxc_container *c, struct lxc_container *c0)
2471 {
2472 int ret;
2473 char path[MAXPATHLEN];
2474 FILE *f;
2475 bool bret;
2476
2477 ret = snprintf(path, MAXPATHLEN, "%s/%s/lxc_rdepends", c->config_path,
2478 c->name);
2479 if (ret < 0 || ret >= MAXPATHLEN)
2480 return false;
2481 f = fopen(path, "a");
2482 if (!f)
2483 return false;
2484 bret = true;
2485 // if anything goes wrong, just return an error
2486 if (fprintf(f, "%s\n%s\n", c0->config_path, c0->name) < 0)
2487 bret = false;
2488 if (fclose(f) != 0)
2489 bret = false;
2490 return bret;
2491 }
2492
2493 static int copy_storage(struct lxc_container *c0, struct lxc_container *c,
2494 const char *newtype, int flags, const char *bdevdata, uint64_t newsize)
2495 {
2496 struct bdev *bdev;
2497 int need_rdep;
2498
2499 bdev = bdev_copy(c0, c->name, c->config_path, newtype, flags,
2500 bdevdata, newsize, &need_rdep);
2501 if (!bdev) {
2502 ERROR("Error copying storage");
2503 return -1;
2504 }
2505 free(c->lxc_conf->rootfs.path);
2506 c->lxc_conf->rootfs.path = strdup(bdev->src);
2507 bdev_put(bdev);
2508 if (!c->lxc_conf->rootfs.path) {
2509 ERROR("Out of memory while setting storage path");
2510 return -1;
2511 }
2512 // We will simply append a new lxc.rootfs entry to the unexpanded config
2513 clear_unexp_config_line(c->lxc_conf, "lxc.rootfs", false);
2514 if (!do_append_unexp_config_line(c->lxc_conf, "lxc.rootfs", c->lxc_conf->rootfs.path)) {
2515 ERROR("Error saving new rootfs to cloend config");
2516 return -1;
2517 }
2518 if (flags & LXC_CLONE_SNAPSHOT)
2519 copy_rdepends(c, c0);
2520 if (need_rdep) {
2521 if (!add_rdepends(c, c0))
2522 WARN("Error adding reverse dependency from %s to %s",
2523 c->name, c0->name);
2524 }
2525
2526 mod_all_rdeps(c, true);
2527
2528 return 0;
2529 }
2530
/* Argument bundle handed to clone_update_rootfs(). */
struct clone_update_data {
	struct lxc_container *c0;	/* container being cloned from */
	struct lxc_container *c1;	/* newly created clone */
	int flags;			/* LXC_CLONE_* flags of the request */
	char **hookargs;		/* extra arguments passed on to the clone hooks */
};
2537
2538 static int clone_update_rootfs(struct clone_update_data *data)
2539 {
2540 struct lxc_container *c0 = data->c0;
2541 struct lxc_container *c = data->c1;
2542 int flags = data->flags;
2543 char **hookargs = data->hookargs;
2544 int ret = -1;
2545 char path[MAXPATHLEN];
2546 struct bdev *bdev;
2547 FILE *fout;
2548 struct lxc_conf *conf = c->lxc_conf;
2549
2550 /* update hostname in rootfs */
2551 /* we're going to mount, so run in a clean namespace to simplify cleanup */
2552
2553 if (setgid(0) < 0) {
2554 ERROR("Failed to setgid to 0");
2555 return -1;
2556 }
2557 if (setuid(0) < 0) {
2558 ERROR("Failed to setuid to 0");
2559 return -1;
2560 }
2561 if (setgroups(0, NULL) < 0)
2562 WARN("Failed to clear groups");
2563
2564 if (unshare(CLONE_NEWNS) < 0)
2565 return -1;
2566 bdev = bdev_init(c->lxc_conf, c->lxc_conf->rootfs.path, c->lxc_conf->rootfs.mount, NULL);
2567 if (!bdev)
2568 return -1;
2569 if (strcmp(bdev->type, "dir") != 0) {
2570 if (unshare(CLONE_NEWNS) < 0) {
2571 ERROR("error unsharing mounts");
2572 bdev_put(bdev);
2573 return -1;
2574 }
2575 if (detect_shared_rootfs()) {
2576 if (mount(NULL, "/", NULL, MS_SLAVE|MS_REC, NULL)) {
2577 SYSERROR("Failed to make / rslave");
2578 ERROR("Continuing...");
2579 }
2580 }
2581 if (bdev->ops->mount(bdev) < 0) {
2582 bdev_put(bdev);
2583 return -1;
2584 }
2585 } else { // TODO come up with a better way
2586 if (bdev->dest)
2587 free(bdev->dest);
2588 bdev->dest = strdup(bdev->src);
2589 }
2590
2591 if (!lxc_list_empty(&conf->hooks[LXCHOOK_CLONE])) {
2592 /* Start of environment variable setup for hooks */
2593 if (setenv("LXC_SRC_NAME", c0->name, 1)) {
2594 SYSERROR("failed to set environment variable for source container name");
2595 }
2596 if (setenv("LXC_NAME", c->name, 1)) {
2597 SYSERROR("failed to set environment variable for container name");
2598 }
2599 if (setenv("LXC_CONFIG_FILE", conf->rcfile, 1)) {
2600 SYSERROR("failed to set environment variable for config path");
2601 }
2602 if (setenv("LXC_ROOTFS_MOUNT", bdev->dest, 1)) {
2603 SYSERROR("failed to set environment variable for rootfs mount");
2604 }
2605 if (setenv("LXC_ROOTFS_PATH", conf->rootfs.path, 1)) {
2606 SYSERROR("failed to set environment variable for rootfs mount");
2607 }
2608
2609 if (run_lxc_hooks(c->name, "clone", conf, c->get_config_path(c), hookargs)) {
2610 ERROR("Error executing clone hook for %s", c->name);
2611 bdev_put(bdev);
2612 return -1;
2613 }
2614 }
2615
2616 if (!(flags & LXC_CLONE_KEEPNAME)) {
2617 ret = snprintf(path, MAXPATHLEN, "%s/etc/hostname", bdev->dest);
2618 bdev_put(bdev);
2619
2620 if (ret < 0 || ret >= MAXPATHLEN)
2621 return -1;
2622 if (!file_exists(path))
2623 return 0;
2624 if (!(fout = fopen(path, "w"))) {
2625 SYSERROR("unable to open %s: ignoring", path);
2626 return 0;
2627 }
2628 if (fprintf(fout, "%s", c->name) < 0) {
2629 fclose(fout);
2630 return -1;
2631 }
2632 if (fclose(fout) < 0)
2633 return -1;
2634 }
2635 else
2636 bdev_put(bdev);
2637
2638 return 0;
2639 }
2640
/*
 * Adapter with an int (*)(void *) signature: forwards the opaque argument,
 * which must point to a struct clone_update_data, to clone_update_rootfs().
 */
static int clone_update_rootfs_wrapper(void *data)
{
	struct clone_update_data *update = data;

	return clone_update_rootfs(update);
}
2646
/*
 * We want to support:
 *
 *   sudo lxc-clone -o o1 -n n1 -s -L|--fssize fssize -v|--vgname vgname \
 *        -p|--lvprefix lvprefix -t|--fstype fstype -B backingstore
 *
 *   -s [implies overlayfs]
 *   -s -B overlayfs
 *   -s -B aufs
 *
 * Only the rootfs gets converted (copied/snapshotted) on clone.
 */
2658
/*
 * Create the directory that contains the file named by path, using
 * do_create_container_dir().  The string is cut at its last '/' for the
 * duration of the call and restored afterwards.
 *
 * Returns -1 if path contains no '/', otherwise whatever
 * do_create_container_dir() returns.
 */
static int create_file_dirname(char *path, struct lxc_conf *conf)
{
	char *slash;
	int rc;

	slash = strrchr(path, '/');
	if (slash == NULL)
		return -1;

	*slash = '\0';
	rc = do_create_container_dir(path, conf);
	*slash = '/';

	return rc;
}
2671
2672 static struct lxc_container *lxcapi_clone(struct lxc_container *c, const char *newname,
2673 const char *lxcpath, int flags,
2674 const char *bdevtype, const char *bdevdata, uint64_t newsize,
2675 char **hookargs)
2676 {
2677 struct lxc_container *c2 = NULL;
2678 char newpath[MAXPATHLEN];
2679 int ret, storage_copied = 0;
2680 char *origroot = NULL;
2681 struct clone_update_data data;
2682 FILE *fout;
2683 pid_t pid;
2684
2685 if (!c || !c->is_defined(c))
2686 return NULL;
2687
2688 if (container_mem_lock(c))
2689 return NULL;
2690
2691 if (!is_stopped(c)) {
2692 ERROR("error: Original container (%s) is running", c->name);
2693 goto out;
2694 }
2695
2696 // Make sure the container doesn't yet exist.
2697 if (!newname)
2698 newname = c->name;
2699 if (!lxcpath)
2700 lxcpath = c->get_config_path(c);
2701 ret = snprintf(newpath, MAXPATHLEN, "%s/%s/config", lxcpath, newname);
2702 if (ret < 0 || ret >= MAXPATHLEN) {
2703 SYSERROR("clone: failed making config pathname");
2704 goto out;
2705 }
2706 if (file_exists(newpath)) {
2707 ERROR("error: clone: %s exists", newpath);
2708 goto out;
2709 }
2710
2711 ret = create_file_dirname(newpath, c->lxc_conf);
2712 if (ret < 0 && errno != EEXIST) {
2713 ERROR("Error creating container dir for %s", newpath);
2714 goto out;
2715 }
2716
2717 // copy the configuration, tweak it as needed,
2718 if (c->lxc_conf->rootfs.path) {
2719 origroot = c->lxc_conf->rootfs.path;
2720 c->lxc_conf->rootfs.path = NULL;
2721 }
2722 fout = fopen(newpath, "w");
2723 if (!fout) {
2724 SYSERROR("open %s", newpath);
2725 goto out;
2726 }
2727 write_config(fout, c->lxc_conf);
2728 fclose(fout);
2729 c->lxc_conf->rootfs.path = origroot;
2730
2731 sprintf(newpath, "%s/%s/rootfs", lxcpath, newname);
2732 if (mkdir(newpath, 0755) < 0) {
2733 SYSERROR("error creating %s", newpath);
2734 goto out;
2735 }
2736
2737 if (am_unpriv()) {
2738 if (chown_mapped_root(newpath, c->lxc_conf) < 0) {
2739 ERROR("Error chowning %s to container root", newpath);
2740 goto out;
2741 }
2742 }
2743
2744 c2 = lxc_container_new(newname, lxcpath);
2745 if (!c2) {
2746 ERROR("clone: failed to create new container (%s %s)", newname,
2747 lxcpath);
2748 goto out;
2749 }
2750
2751 // copy/snapshot rootfs's
2752 ret = copy_storage(c, c2, bdevtype, flags, bdevdata, newsize);
2753 if (ret < 0)
2754 goto out;
2755
2756 clear_unexp_config_line(c2->lxc_conf, "lxc.utsname", false);
2757
2758 // update utsname
2759 if (!set_config_item_locked(c2, "lxc.utsname", newname)) {
2760 ERROR("Error setting new hostname");
2761 goto out;
2762 }
2763
2764 // copy hooks
2765 ret = copyhooks(c, c2);
2766 if (ret < 0) {
2767 ERROR("error copying hooks");
2768 goto out;
2769 }
2770
2771 if (copy_fstab(c, c2) < 0) {
2772 ERROR("error copying fstab");
2773 goto out;
2774 }
2775
2776 // update macaddrs
2777 if (!(flags & LXC_CLONE_KEEPMACADDR)) {
2778 if (!network_new_hwaddrs(c2->lxc_conf)) {
2779 ERROR("Error updating mac addresses");
2780 goto out;
2781 }
2782 }
2783
2784 // We've now successfully created c2's storage, so clear it out if we
2785 // fail after this
2786 storage_copied = 1;
2787
2788 if (!c2->save_config(c2, NULL))
2789 goto out;
2790
2791 if ((pid = fork()) < 0) {
2792 SYSERROR("fork");
2793 goto out;
2794 }
2795 if (pid > 0) {
2796 ret = wait_for_pid(pid);
2797 if (ret)
2798 goto out;
2799 container_mem_unlock(c);
2800 return c2;
2801 }
2802 data.c0 = c;
2803 data.c1 = c2;
2804 data.flags = flags;
2805 data.hookargs = hookargs;
2806 if (am_unpriv())
2807 ret = userns_exec_1(c->lxc_conf, clone_update_rootfs_wrapper,
2808 &data);
2809 else
2810 ret = clone_update_rootfs(&data);
2811 if (ret < 0)
2812 exit(1);
2813
2814 container_mem_unlock(c);
2815 exit(0);
2816
2817 out:
2818 container_mem_unlock(c);
2819 if (c2) {
2820 if (!storage_copied)
2821 c2->lxc_conf->rootfs.path = NULL;
2822 c2->destroy(c2);
2823 lxc_container_put(c2);
2824 }
2825
2826 return NULL;
2827 }
2828
2829 static bool lxcapi_rename(struct lxc_container *c, const char *newname)
2830 {
2831 struct bdev *bdev;
2832 struct lxc_container *newc;
2833
2834 if (!c || !c->name || !c->config_path || !c->lxc_conf)
2835 return false;
2836
2837 if (has_fs_snapshots(c) || has_snapshots(c)) {
2838 ERROR("Renaming a container with snapshots is not supported");
2839 return false;
2840 }
2841 bdev = bdev_init(c->lxc_conf, c->lxc_conf->rootfs.path, c->lxc_conf->rootfs.mount, NULL);
2842 if (!bdev) {
2843 ERROR("Failed to find original backing store type");
2844 return false;
2845 }
2846
2847 newc = lxcapi_clone(c, newname, c->config_path, LXC_CLONE_KEEPMACADDR, NULL, bdev->type, 0, NULL);
2848 bdev_put(bdev);
2849 if (!newc) {
2850 lxc_container_put(newc);
2851 return false;
2852 }
2853
2854 if (newc && lxcapi_is_defined(newc))
2855 lxc_container_put(newc);
2856
2857 if (!container_destroy(c)) {
2858 ERROR("Could not destroy existing container %s", c->name);
2859 return false;
2860 }
2861 return true;
2862 }
2863
2864 static int lxcapi_attach(struct lxc_container *c, lxc_attach_exec_t exec_function, void *exec_payload, lxc_attach_options_t *options, pid_t *attached_process)
2865 {
2866 if (!c)
2867 return -1;
2868
2869 return lxc_attach(c->name, c->config_path, exec_function, exec_payload, options, attached_process);
2870 }
2871
2872 static int lxcapi_attach_run_wait(struct lxc_container *c, lxc_attach_options_t *options, const char *program, const char * const argv[])
2873 {
2874 lxc_attach_command_t command;
2875 pid_t pid;
2876 int r;
2877
2878 if (!c)
2879 return -1;
2880
2881 command.program = (char*)program;
2882 command.argv = (char**)argv;
2883 r = lxc_attach(c->name, c->config_path, lxc_attach_run_command, &command, options, &pid);
2884 if (r < 0) {
2885 ERROR("ups");
2886 return r;
2887 }
2888 return lxc_wait_for_pid_status(pid);
2889 }
2890
/*
 * Return the smallest i >= 0 for which stat() on "<lxcpath>/snap<i>" fails.
 * cname is not used.
 */
static int get_next_index(const char *lxcpath, char *cname)
{
	struct stat sb;
	char *candidate;
	int idx;

	/* 20 extra bytes hold "/snap", the decimal index and the NUL. */
	candidate = alloca(strlen(lxcpath) + 20);

	for (idx = 0; ; idx++) {
		sprintf(candidate, "%s/snap%d", lxcpath, idx);
		if (stat(candidate, &sb) != 0)
			return idx;
	}
}
2906
2907 static bool get_snappath_dir(struct lxc_container *c, char *snappath)
2908 {
2909 int ret;
2910 /*
2911 * If the old style snapshot path exists, use it
2912 * /var/lib/lxc -> /var/lib/lxcsnaps
2913 */
2914 ret = snprintf(snappath, MAXPATHLEN, "%ssnaps", c->config_path);
2915 if (ret < 0 || ret >= MAXPATHLEN)
2916 return false;
2917 if (dir_exists(snappath)) {
2918 ret = snprintf(snappath, MAXPATHLEN, "%ssnaps/%s", c->config_path, c->name);
2919 if (ret < 0 || ret >= MAXPATHLEN)
2920 return false;
2921 return true;
2922 }
2923
2924 /*
2925 * Use the new style path
2926 * /var/lib/lxc -> /var/lib/lxc + c->name + /snaps + \0
2927 */
2928 ret = snprintf(snappath, MAXPATHLEN, "%s/%s/snaps", c->config_path, c->name);
2929 if (ret < 0 || ret >= MAXPATHLEN)
2930 return false;
2931 return true;
2932 }
2933
2934 static int lxcapi_snapshot(struct lxc_container *c, const char *commentfile)
2935 {
2936 int i, flags, ret;
2937 struct lxc_container *c2;
2938 char snappath[MAXPATHLEN], newname[20];
2939
2940 if (!c || !lxcapi_is_defined(c))
2941 return -1;
2942
2943 if (!bdev_can_backup(c->lxc_conf)) {
2944 ERROR("%s's backing store cannot be backed up.", c->name);
2945 ERROR("Your container must use another backing store type.");
2946 return -1;
2947 }
2948
2949 if (!get_snappath_dir(c, snappath))
2950 return -1;
2951
2952 i = get_next_index(snappath, c->name);
2953
2954 if (mkdir_p(snappath, 0755) < 0) {
2955 ERROR("Failed to create snapshot directory %s", snappath);
2956 return -1;
2957 }
2958
2959 ret = snprintf(newname, 20, "snap%d", i);
2960 if (ret < 0 || ret >= 20)
2961 return -1;
2962
2963 /*
2964 * We pass LXC_CLONE_SNAPSHOT to make sure that a rdepends file entry is
2965 * created in the original container
2966 */
2967 flags = LXC_CLONE_SNAPSHOT | LXC_CLONE_KEEPMACADDR | LXC_CLONE_KEEPNAME |
2968 LXC_CLONE_KEEPBDEVTYPE | LXC_CLONE_MAYBE_SNAPSHOT;
2969 if (bdev_is_dir(c->lxc_conf, c->lxc_conf->rootfs.path)) {
2970 ERROR("Snapshot of directory-backed container requested.");
2971 ERROR("Making a copy-clone. If you do want snapshots, then");
2972 ERROR("please create an aufs or overlayfs clone first, snapshot that");
2973 ERROR("and keep the original container pristine.");
2974 flags &= ~LXC_CLONE_SNAPSHOT | LXC_CLONE_MAYBE_SNAPSHOT;
2975 }
2976 c2 = c->clone(c, newname, snappath, flags, NULL, NULL, 0, NULL);
2977 if (!c2) {
2978 ERROR("clone of %s:%s failed", c->config_path, c->name);
2979 return -1;
2980 }
2981
2982 lxc_container_put(c2);
2983
2984 // Now write down the creation time
2985 time_t timer;
2986 char buffer[25];
2987 struct tm* tm_info;
2988 FILE *f;
2989
2990 time(&timer);
2991 tm_info = localtime(&timer);
2992
2993 strftime(buffer, 25, "%Y:%m:%d %H:%M:%S", tm_info);
2994
2995 char *dfnam = alloca(strlen(snappath) + strlen(newname) + 5);
2996 sprintf(dfnam, "%s/%s/ts", snappath, newname);
2997 f = fopen(dfnam, "w");
2998 if (!f) {
2999 ERROR("Failed to open %s", dfnam);
3000 return -1;
3001 }
3002 if (fprintf(f, "%s", buffer) < 0) {
3003 SYSERROR("Writing timestamp");
3004 fclose(f);
3005 return -1;
3006 }
3007 ret = fclose(f);
3008 if (ret != 0) {
3009 SYSERROR("Writing timestamp");
3010 return -1;
3011 }
3012
3013 if (commentfile) {
3014 // $p / $name / comment \0
3015 int len = strlen(snappath) + strlen(newname) + 10;
3016 char *path = alloca(len);
3017 sprintf(path, "%s/%s/comment", snappath, newname);
3018 return copy_file(commentfile, path) < 0 ? -1 : i;
3019 }
3020
3021 return i;
3022 }
3023
3024 static void lxcsnap_free(struct lxc_snapshot *s)
3025 {
3026 if (s->name)
3027 free(s->name);
3028 if (s->comment_pathname)
3029 free(s->comment_pathname);
3030 if (s->timestamp)
3031 free(s->timestamp);
3032 if (s->lxcpath)
3033 free(s->lxcpath);
3034 }
3035
/*
 * Build "<snappath>/<name>/comment" in a freshly allocated string.
 * Returns NULL if allocation or formatting fails; the caller frees the result.
 */
static char *get_snapcomment_path(char* snappath, char *name)
{
	/* 10 extra bytes: '/' + "/comment" + NUL */
	int len = strlen(snappath) + strlen(name) + 10;
	char *path;
	int n;

	path = malloc(len);
	if (path == NULL)
		return NULL;

	n = snprintf(path, len, "%s/%s/comment", snappath, name);
	if (n < 0 || n >= len) {
		free(path);
		return NULL;
	}

	return path;
}
3051
3052 static char *get_timestamp(char* snappath, char *name)
3053 {
3054 char path[MAXPATHLEN], *s = NULL;
3055 int ret, len;
3056 FILE *fin;
3057
3058 ret = snprintf(path, MAXPATHLEN, "%s/%s/ts", snappath, name);
3059 if (ret < 0 || ret >= MAXPATHLEN)
3060 return NULL;
3061 fin = fopen(path, "r");
3062 if (!fin)
3063 return NULL;
3064 (void) fseek(fin, 0, SEEK_END);
3065 len = ftell(fin);
3066 (void) fseek(fin, 0, SEEK_SET);
3067 if (len > 0) {
3068 s = malloc(len+1);
3069 if (s) {
3070 s[len] = '\0';
3071 if (fread(s, 1, len, fin) != len) {
3072 SYSERROR("reading timestamp");
3073 free(s);
3074 s = NULL;
3075 }
3076 }
3077 }
3078 fclose(fin);
3079 return s;
3080 }
3081
3082 static int lxcapi_snapshot_list(struct lxc_container *c, struct lxc_snapshot **ret_snaps)
3083 {
3084 char snappath[MAXPATHLEN], path2[MAXPATHLEN];
3085 int count = 0, ret;
3086 struct dirent dirent, *direntp;
3087 struct lxc_snapshot *snaps =NULL, *nsnaps;
3088 DIR *dir;
3089
3090 if (!c || !lxcapi_is_defined(c))
3091 return -1;
3092
3093 if (!get_snappath_dir(c, snappath)) {
3094 ERROR("path name too long");
3095 return -1;
3096 }
3097 dir = opendir(snappath);
3098 if (!dir) {
3099 INFO("failed to open %s - assuming no snapshots", snappath);
3100 return 0;
3101 }
3102
3103 while (!readdir_r(dir, &dirent, &direntp)) {
3104 if (!direntp)
3105 break;
3106
3107 if (!strcmp(direntp->d_name, "."))
3108 continue;
3109
3110 if (!strcmp(direntp->d_name, ".."))
3111 continue;
3112
3113 ret = snprintf(path2, MAXPATHLEN, "%s/%s/config", snappath, direntp->d_name);
3114 if (ret < 0 || ret >= MAXPATHLEN) {
3115 ERROR("pathname too long");
3116 goto out_free;
3117 }
3118 if (!file_exists(path2))
3119 continue;
3120 nsnaps = realloc(snaps, (count + 1)*sizeof(*snaps));
3121 if (!nsnaps) {
3122 SYSERROR("Out of memory");
3123 goto out_free;
3124 }
3125 snaps = nsnaps;
3126 snaps[count].free = lxcsnap_free;
3127 snaps[count].name = strdup(direntp->d_name);
3128 if (!snaps[count].name)
3129 goto out_free;
3130 snaps[count].lxcpath = strdup(snappath);
3131 if (!snaps[count].lxcpath) {
3132 free(snaps[count].name);
3133 goto out_free;
3134 }
3135 snaps[count].comment_pathname = get_snapcomment_path(snappath, direntp->d_name);
3136 snaps[count].timestamp = get_timestamp(snappath, direntp->d_name);
3137 count++;
3138 }
3139
3140 if (closedir(dir))
3141 WARN("failed to close directory");
3142
3143 *ret_snaps = snaps;
3144 return count;
3145
3146 out_free:
3147 if (snaps) {
3148 int i;
3149 for (i=0; i<count; i++)
3150 lxcsnap_free(&snaps[i]);
3151 free(snaps);
3152 }
3153 if (closedir(dir))
3154 WARN("failed to close directory");
3155 return -1;
3156 }
3157
3158 static bool lxcapi_snapshot_restore(struct lxc_container *c, const char *snapname, const char *newname)
3159 {
3160 char clonelxcpath[MAXPATHLEN];
3161 int flags = 0;
3162 struct lxc_container *snap, *rest;
3163 struct bdev *bdev;
3164 bool b = false;
3165
3166 if (!c || !c->name || !c->config_path)
3167 return false;
3168
3169 if (has_fs_snapshots(c)) {
3170 ERROR("container rootfs has dependent snapshots");
3171 return false;
3172 }
3173
3174 bdev = bdev_init(c->lxc_conf, c->lxc_conf->rootfs.path, c->lxc_conf->rootfs.mount, NULL);
3175 if (!bdev) {
3176 ERROR("Failed to find original backing store type");
3177 return false;
3178 }
3179
3180 if (!newname)
3181 newname = c->name;
3182
3183 if (!get_snappath_dir(c, clonelxcpath)) {
3184 bdev_put(bdev);
3185 return false;
3186 }
3187 // how should we lock this?
3188
3189 snap = lxc_container_new(snapname, clonelxcpath);
3190 if (!snap || !lxcapi_is_defined(snap)) {
3191 ERROR("Could not open snapshot %s", snapname);
3192 if (snap) lxc_container_put(snap);
3193 bdev_put(bdev);
3194 return false;
3195 }
3196
3197 if (strcmp(c->name, newname) == 0) {
3198 if (!container_destroy(c)) {
3199 ERROR("Could not destroy existing container %s", newname);
3200 lxc_container_put(snap);
3201 bdev_put(bdev);
3202 return false;
3203 }
3204 }
3205
3206 if (strcmp(bdev->type, "dir") != 0 && strcmp(bdev->type, "loop") != 0)
3207 flags = LXC_CLONE_SNAPSHOT | LXC_CLONE_MAYBE_SNAPSHOT;
3208 rest = lxcapi_clone(snap, newname, c->config_path, flags,
3209 bdev->type, NULL, 0, NULL);
3210 bdev_put(bdev);
3211 if (rest && lxcapi_is_defined(rest))
3212 b = true;
3213 if (rest)
3214 lxc_container_put(rest);
3215 lxc_container_put(snap);
3216 return b;
3217 }
3218
/*
 * Open the container snapname under clonelxcpath and destroy it.
 * Returns true only if the container could be opened and destroyed.
 */
static bool do_snapshot_destroy(const char *snapname, const char *clonelxcpath)
{
	struct lxc_container *snap;
	bool destroyed;

	snap = lxc_container_new(snapname, clonelxcpath);
	if (snap == NULL) {
		ERROR("Could not find snapshot %s", snapname);
		return false;
	}

	destroyed = lxcapi_destroy(snap) ? true : false;
	if (!destroyed)
		ERROR("Could not destroy snapshot %s", snapname);

	lxc_container_put(snap);
	return destroyed;
}
3241
/*
 * Destroy every entry (other than "." and "..") of the snapshot directory
 * path via do_snapshot_destroy(), then try to remove the directory itself.
 *
 * Returns false if the directory cannot be opened or any entry could not be
 * destroyed.  A failing rmdir() is only logged.
 */
static bool remove_all_snapshots(const char *path)
{
	struct dirent entry, *result;
	bool all_removed = true;
	DIR *snapdir;

	snapdir = opendir(path);
	if (snapdir == NULL) {
		SYSERROR("opendir on snapshot path %s", path);
		return false;
	}

	while (readdir_r(snapdir, &entry, &result) == 0 && result != NULL) {
		const char *name = result->d_name;

		if (strcmp(name, ".") == 0 || strcmp(name, "..") == 0)
			continue;

		/* Keep going after a failure so the remaining entries are still tried. */
		if (!do_snapshot_destroy(name, path))
			all_removed = false;
	}

	closedir(snapdir);

	if (rmdir(path))
		SYSERROR("Error removing directory %s", path);

	return all_removed;
}
3273
3274 static bool lxcapi_snapshot_destroy(struct lxc_container *c, const char *snapname)
3275 {
3276 char clonelxcpath[MAXPATHLEN];
3277
3278 if (!c || !c->name || !c->config_path || !snapname)
3279 return false;
3280
3281 if (!get_snappath_dir(c, clonelxcpath))
3282 return false;
3283
3284 return do_snapshot_destroy(snapname, clonelxcpath);
3285 }
3286
3287 static bool lxcapi_snapshot_destroy_all(struct lxc_container *c)
3288 {
3289 char clonelxcpath[MAXPATHLEN];
3290
3291 if (!c || !c->name || !c->config_path)
3292 return false;
3293
3294 if (!get_snappath_dir(c, clonelxcpath))
3295 return false;
3296
3297 return remove_all_snapshots(clonelxcpath);
3298 }
3299
3300 static bool lxcapi_may_control(struct lxc_container *c)
3301 {
3302 return lxc_try_cmd(c->name, c->config_path) == 0;
3303 }
3304
3305 static bool do_add_remove_node(pid_t init_pid, const char *path, bool add,
3306 struct stat *st)
3307 {
3308 char chrootpath[MAXPATHLEN];
3309 char *directory_path = NULL;
3310 pid_t pid;
3311 int ret;
3312
3313 if ((pid = fork()) < 0) {
3314 SYSERROR("failed to fork a child helper");
3315 return false;
3316 }
3317 if (pid) {
3318 if (wait_for_pid(pid) != 0) {
3319 ERROR("Failed to create note in guest");
3320 return false;
3321 }
3322 return true;
3323 }
3324
3325 /* prepare the path */
3326 ret = snprintf(chrootpath, MAXPATHLEN, "/proc/%d/root", init_pid);
3327 if (ret < 0 || ret >= MAXPATHLEN)
3328 return false;
3329
3330 if (chroot(chrootpath) < 0)
3331 exit(1);
3332 if (chdir("/") < 0)
3333 exit(1);
3334 /* remove path if it exists */
3335 if(faccessat(AT_FDCWD, path, F_OK, AT_SYMLINK_NOFOLLOW) == 0) {
3336 if (unlink(path) < 0) {
3337 ERROR("unlink failed");
3338 exit(1);
3339 }
3340 }
3341 if (!add)
3342 exit(0);
3343
3344 /* create any missing directories */
3345 directory_path = dirname(strdup(path));
3346 if (mkdir_p(directory_path, 0755) < 0 && errno != EEXIST) {
3347 ERROR("failed to create directory");
3348 exit(1);
3349 }
3350
3351 /* create the device node */
3352 if (mknod(path, st->st_mode, st->st_rdev) < 0) {
3353 ERROR("mknod failed");
3354 exit(1);
3355 }
3356
3357 exit(0);
3358 }
3359
3360 static bool add_remove_device_node(struct lxc_container *c, const char *src_path, const char *dest_path, bool add)
3361 {
3362 int ret;
3363 struct stat st;
3364 char value[MAX_BUFFER];
3365 const char *p;
3366
3367 /* make sure container is running */
3368 if (!c->is_running(c)) {
3369 ERROR("container is not running");
3370 return false;
3371 }
3372
3373 /* use src_path if dest_path is NULL otherwise use dest_path */
3374 p = dest_path ? dest_path : src_path;
3375
3376 /* make sure we can access p */
3377 if(access(p, F_OK) < 0 || stat(p, &st) < 0)
3378 return false;
3379
3380 /* continue if path is character device or block device */
3381 if (S_ISCHR(st.st_mode))
3382 ret = snprintf(value, MAX_BUFFER, "c %d:%d rwm", major(st.st_rdev), minor(st.st_rdev));
3383 else if (S_ISBLK(st.st_mode))
3384 ret = snprintf(value, MAX_BUFFER, "b %d:%d rwm", major(st.st_rdev), minor(st.st_rdev));
3385 else
3386 return false;
3387
3388 /* check snprintf return code */
3389 if (ret < 0 || ret >= MAX_BUFFER)
3390 return false;
3391
3392 if (!do_add_remove_node(c->init_pid(c), p, add, &st))
3393 return false;
3394
3395 /* add or remove device to/from cgroup access list */
3396 if (add) {
3397 if (!c->set_cgroup_item(c, "devices.allow", value)) {
3398 ERROR("set_cgroup_item failed while adding the device node");
3399 return false;
3400 }
3401 } else {
3402 if (!c->set_cgroup_item(c, "devices.deny", value)) {
3403 ERROR("set_cgroup_item failed while removing the device node");
3404 return false;
3405 }
3406 }
3407
3408 return true;
3409 }
3410
3411 static bool lxcapi_add_device_node(struct lxc_container *c, const char *src_path, const char *dest_path)
3412 {
3413 if (am_unpriv()) {
3414 ERROR(NOT_SUPPORTED_ERROR, __FUNCTION__);
3415 return false;
3416 }
3417 return add_remove_device_node(c, src_path, dest_path, true);
3418 }
3419
3420 static bool lxcapi_remove_device_node(struct lxc_container *c, const char *src_path, const char *dest_path)
3421 {
3422 if (am_unpriv()) {
3423 ERROR(NOT_SUPPORTED_ERROR, __FUNCTION__);
3424 return false;
3425 }
3426 return add_remove_device_node(c, src_path, dest_path, false);
3427 }
3428
/* Options describing one criu invocation, consumed by exec_criu(). */
struct criu_opts {
	/* The type of criu invocation, one of "dump" or "restore" */
	char *action;

	/* The directory to pass to criu (-D); the log file is placed there too */
	char *directory;

	/* The container to dump or restore */
	struct lxc_container *c;

	/* Enable criu verbose mode? */
	bool verbose;

	/* dump: stop the container or not after dumping? */
	bool stop;

	/* restore: the file to write the init process' pid into */
	char *pidfile;

	/* restore: value passed to criu as --cgroup-root */
	const char *cgroup_path;
};
3449
3450 /*
3451 * @out must be 128 bytes long
3452 */
3453 static int read_criu_file(const char *directory, const char *file, int netnr, char *out)
3454 {
3455 char path[PATH_MAX];
3456 int ret;
3457 FILE *f;
3458
3459 ret = snprintf(path, PATH_MAX, "%s/%s%d", directory, file, netnr);
3460 if (ret < 0 || ret >= PATH_MAX) {
3461 ERROR("%s: path too long", __func__);
3462 return -1;
3463 }
3464
3465 f = fopen(path, "r");
3466 if (!f)
3467 return -1;
3468
3469 ret = fscanf(f, "%127s", out);
3470 fclose(f);
3471 if (ret <= 0)
3472 return -1;
3473
3474 return 0;
3475 }
3476
3477 static void exec_criu(struct criu_opts *opts)
3478 {
3479 char **argv, log[PATH_MAX];
3480 int static_args = 14, argc = 0, i, ret;
3481
3482 /* The command line always looks like:
3483 * criu $(action) --tcp-established --file-locks --link-remap --force-irmap \
3484 * --manage-cgroups action-script foo.sh -D $(directory) \
3485 * -o $(directory)/$(action).log
3486 * +1 for final NULL */
3487
3488 if (strcmp(opts->action, "dump") == 0) {
3489 /* -t pid */
3490 static_args += 2;
3491
3492 /* --leave-running */
3493 if (!opts->stop)
3494 static_args++;
3495 } else if (strcmp(opts->action, "restore") == 0) {
3496 /* --root $(lxc_mount_point) --restore-detached
3497 * --restore-sibling --pidfile $foo --cgroup-root $foo */
3498 static_args += 8;
3499 } else {
3500 return;
3501 }
3502
3503 if (opts->verbose)
3504 static_args++;
3505
3506 ret = snprintf(log, PATH_MAX, "%s/%s.log", opts->directory, opts->action);
3507 if (ret < 0 || ret >= PATH_MAX) {
3508 ERROR("logfile name too long\n");
3509 return;
3510 }
3511
3512 argv = malloc(static_args * sizeof(*argv));
3513 if (!argv)
3514 return;
3515
3516 memset(argv, 0, static_args * sizeof(*argv));
3517
3518 #define DECLARE_ARG(arg) \
3519 do { \
3520 if (arg == NULL) { \
3521 ERROR("Got NULL argument for criu"); \
3522 goto err; \
3523 } \
3524 argv[argc++] = strdup(arg); \
3525 if (!argv[argc-1]) \
3526 goto err; \
3527 } while (0)
3528
3529 argv[argc++] = on_path("criu", NULL);
3530 if (!argv[argc-1]) {
3531 ERROR("Couldn't find criu binary\n");
3532 goto err;
3533 }
3534
3535 DECLARE_ARG(opts->action);
3536 DECLARE_ARG("--tcp-established");
3537 DECLARE_ARG("--file-locks");
3538 DECLARE_ARG("--link-remap");
3539 DECLARE_ARG("--force-irmap");
3540 DECLARE_ARG("--manage-cgroups");
3541 DECLARE_ARG("--action-script");
3542 DECLARE_ARG(LIBEXECDIR "/lxc/lxc-restore-net");
3543 DECLARE_ARG("-D");
3544 DECLARE_ARG(opts->directory);
3545 DECLARE_ARG("-o");
3546 DECLARE_ARG(log);
3547
3548 if (opts->verbose)
3549 DECLARE_ARG("-vvvvvv");
3550
3551 if (strcmp(opts->action, "dump") == 0) {
3552 char pid[32];
3553
3554 if (sprintf(pid, "%d", lxcapi_init_pid(opts->c)) < 0)
3555 goto err;
3556
3557 DECLARE_ARG("-t");
3558 DECLARE_ARG(pid);
3559 if (!opts->stop)
3560 DECLARE_ARG("--leave-running");
3561 } else if (strcmp(opts->action, "restore") == 0) {
3562 int netnr = 0;
3563 struct lxc_list *it;
3564
3565 DECLARE_ARG("--root");
3566 DECLARE_ARG(opts->c->lxc_conf->rootfs.mount);
3567 DECLARE_ARG("--restore-detached");
3568 DECLARE_ARG("--restore-sibling");
3569 DECLARE_ARG("--pidfile");
3570 DECLARE_ARG(opts->pidfile);
3571 DECLARE_ARG("--cgroup-root");
3572 DECLARE_ARG(opts->cgroup_path);
3573
3574 lxc_list_for_each(it, &opts->c->lxc_conf->network) {
3575 char eth[128], veth[128], buf[257];
3576 void *m;
3577
3578 if (read_criu_file(opts->directory, "veth", netnr, veth))
3579 goto err;
3580 if (read_criu_file(opts->directory, "eth", netnr, eth))
3581 goto err;
3582 ret = snprintf(buf, 257, "%s=%s", eth, veth);
3583 if (ret < 0 || ret >= 257)
3584 goto err;
3585
3586 /* final NULL and --veth-pair eth0:vethASDF */
3587 m = realloc(argv, (argc + 1 + 2) * sizeof(*argv));
3588 if (!m)
3589 goto err;
3590 argv = m;
3591
3592 DECLARE_ARG("--veth-pair");
3593 DECLARE_ARG(buf);
3594 argv[argc] = NULL;
3595
3596 netnr++;
3597 }
3598 }
3599
3600 #undef DECLARE_ARG
3601
3602 execv(argv[0], argv);
3603 err:
3604 for (i = 0; argv[i]; i++)
3605 free(argv[i]);
3606 free(argv);
3607 }
3608
3609 /* Check and make sure the container has a configuration that we know CRIU can
3610 * dump. */
3611 static bool criu_ok(struct lxc_container *c)
3612 {
3613 struct lxc_list *it;
3614 bool found_deny_rule = false;
3615
3616 if (geteuid()) {
3617 ERROR("Must be root to checkpoint\n");
3618 return false;
3619 }
3620
3621 /* We only know how to restore containers with veth networks. */
3622 lxc_list_for_each(it, &c->lxc_conf->network) {
3623 struct lxc_netdev *n = it->elem;
3624 if (n->type != LXC_NET_VETH && n->type != LXC_NET_NONE) {
3625 ERROR("Found network that is not VETH or NONE\n");
3626 return false;
3627 }
3628 }
3629
3630 // These requirements come from http://criu.org/LXC
3631 if (c->lxc_conf->console.path &&
3632 strcmp(c->lxc_conf->console.path, "none") != 0) {
3633 ERROR("lxc.console must be none\n");
3634 return false;
3635 }
3636
3637 if (c->lxc_conf->tty != 0) {
3638 ERROR("lxc.tty must be 0\n");
3639 return false;
3640 }
3641
3642 lxc_list_for_each(it, &c->lxc_conf->cgroup) {
3643 struct lxc_cgroup *cg = it->elem;
3644 if (strcmp(cg->subsystem, "devices.deny") == 0 &&
3645 strcmp(cg->value, "c 5:1 rwm") == 0) {
3646
3647 found_deny_rule = true;
3648 break;
3649 }
3650 }
3651
3652 if (!found_deny_rule) {
3653 ERROR("couldn't find devices.deny = c 5:1 rwm");
3654 return false;
3655 }
3656
3657 return true;
3658 }
3659
3660 static bool lxcapi_checkpoint(struct lxc_container *c, char *directory, bool stop, bool verbose)
3661 {
3662 int netnr, status;
3663 struct lxc_list *it;
3664 bool error = false;
3665 pid_t pid;
3666
3667 if (!criu_ok(c))
3668 return false;
3669
3670 if (mkdir(directory, 0700) < 0 && errno != EEXIST)
3671 return false;
3672
3673 netnr = 0;
3674 lxc_list_for_each(it, &c->lxc_conf->network) {
3675 char *veth = NULL, *bridge = NULL, veth_path[PATH_MAX], eth[128];
3676 struct lxc_netdev *n = it->elem;
3677 int pret;
3678
3679 pret = snprintf(veth_path, PATH_MAX, "lxc.network.%d.veth.pair", netnr);
3680 if (pret < 0 || pret >= PATH_MAX) {
3681 error = true;
3682 goto out;
3683 }
3684
3685 veth = lxcapi_get_running_config_item(c, veth_path);
3686 if (!veth) {
3687 /* criu_ok() checks that all interfaces are
3688 * LXC_NET{VETH,NONE}, and VETHs should have this
3689 * config */
3690 assert(n->type == LXC_NET_NONE);
3691 break;
3692 }
3693
3694 pret = snprintf(veth_path, PATH_MAX, "lxc.network.%d.link", netnr);
3695 if (pret < 0 || pret >= PATH_MAX) {
3696 error = true;
3697 goto out;
3698 }
3699
3700 bridge = lxcapi_get_running_config_item(c, veth_path);
3701 if (!bridge) {
3702 error = true;
3703 goto out;
3704 }
3705
3706 pret = snprintf(veth_path, PATH_MAX, "%s/veth%d", directory, netnr);
3707 if (pret < 0 || pret >= PATH_MAX || print_to_file(veth_path, veth) < 0) {
3708 error = true;
3709 goto out;
3710 }
3711
3712 pret = snprintf(veth_path, PATH_MAX, "%s/bridge%d", directory, netnr);
3713 if (pret < 0 || pret >= PATH_MAX || print_to_file(veth_path, bridge) < 0) {
3714 error = true;
3715 goto out;
3716 }
3717
3718 if (n->name) {
3719 if (strlen(n->name) >= 128) {
3720 error = true;
3721 goto out;
3722 }
3723 strncpy(eth, n->name, 128);
3724 } else
3725 sprintf(eth, "eth%d", netnr);
3726
3727 pret = snprintf(veth_path, PATH_MAX, "%s/eth%d", directory, netnr);
3728 if (pret < 0 || pret >= PATH_MAX || print_to_file(veth_path, eth) < 0)
3729 error = true;
3730
3731 out:
3732 free(veth);
3733 free(bridge);
3734 if (error)
3735 return false;
3736 }
3737
3738 pid = fork();
3739 if (pid < 0)
3740 return false;
3741
3742 if (pid == 0) {
3743 struct criu_opts os;
3744
3745 os.action = "dump";
3746 os.directory = directory;
3747 os.c = c;
3748 os.stop = stop;
3749 os.verbose = verbose;
3750
3751 /* exec_criu() returning is an error */
3752 exec_criu(&os);
3753 exit(1);
3754 } else {
3755 pid_t w = waitpid(pid, &status, 0);
3756 if (w == -1) {
3757 perror("waitpid");
3758 return false;
3759 }
3760
3761 if (WIFEXITED(status)) {
3762 return !WEXITSTATUS(status);
3763 }
3764
3765 return false;
3766 }
3767 }
3768
3769 static bool lxcapi_restore(struct lxc_container *c, char *directory, bool verbose)
3770 {
3771 pid_t pid;
3772 struct lxc_list *it;
3773 struct lxc_rootfs *rootfs;
3774 char pidfile[L_tmpnam];
3775 struct lxc_handler *handler;
3776 bool has_error = true;
3777
3778 if (!criu_ok(c))
3779 return false;
3780
3781 if (geteuid()) {
3782 ERROR("Must be root to restore\n");
3783 return false;
3784 }
3785
3786 if (!tmpnam(pidfile))
3787 return false;
3788
3789 handler = lxc_init(c->name, c->lxc_conf, c->config_path);
3790 if (!handler)
3791 return false;
3792
3793 if (!cgroup_init(handler)) {
3794 ERROR("failed initing cgroups");
3795 goto out_fini_handler;
3796 }
3797
3798 if (!cgroup_create(handler)) {
3799 ERROR("failed creating groups");
3800 goto out_fini_handler;
3801 }
3802
3803 pid = fork();
3804 if (pid < 0)
3805 goto out_fini_handler;
3806
3807 if (pid == 0) {
3808 struct criu_opts os;
3809
3810 if (unshare(CLONE_NEWNS))
3811 exit(1);
3812
3813 /* CRIU needs the lxc root bind mounted so that it is the root of some
3814 * mount. */
3815 rootfs = &c->lxc_conf->rootfs;
3816
3817 if (rootfs_is_blockdev(c->lxc_conf)) {
3818 if (do_rootfs_setup(c->lxc_conf, c->name, c->config_path) < 0)
3819 exit(1);
3820 }
3821 else {
3822 if (mkdir(rootfs->mount, 0755) < 0 && errno != EEXIST)
3823 exit(1);
3824
3825 if (mount(rootfs->path, rootfs->mount, NULL, MS_BIND, NULL) < 0) {
3826 rmdir(rootfs->mount);
3827 exit(1);
3828 }
3829 }
3830
3831 os.action = "restore";
3832 os.directory = directory;
3833 os.c = c;
3834 os.pidfile = pidfile;
3835 os.verbose = verbose;
3836 os.cgroup_path = cgroup_canonical_path(handler);
3837
3838 /* exec_criu() returning is an error */
3839 exec_criu(&os);
3840 umount(rootfs->mount);
3841 rmdir(rootfs->mount);
3842 exit(1);
3843 } else {
3844 int status;
3845
3846 pid_t w = waitpid(pid, &status, 0);
3847
3848 if (w == -1) {
3849 perror("waitpid");
3850 goto out_fini_handler;
3851 }
3852
3853 if (WIFEXITED(status)) {
3854 if (WEXITSTATUS(status)) {
3855 goto out_fini_handler;
3856 }
3857 else {
3858 int netnr = 0, ret;
3859 FILE *f = fopen(pidfile, "r");
3860 if (!f) {
3861 perror("reading pidfile");
3862 ERROR("couldn't read restore's init pidfile %s\n", pidfile);
3863 goto out_fini_handler;
3864 }
3865
3866 ret = fscanf(f, "%d", (int*) &handler->pid);
3867 fclose(f);
3868 if (ret != 1) {
3869 ERROR("reading restore pid failed");
3870 goto out_fini_handler;
3871 }
3872
3873 if (container_mem_lock(c))
3874 goto out_fini_handler;
3875
3876 lxc_list_for_each(it, &c->lxc_conf->network) {
3877 char eth[128], veth[128];
3878 struct lxc_netdev *netdev = it->elem;
3879
3880 if (read_criu_file(directory, "veth", netnr, veth)) {
3881 container_mem_unlock(c);
3882 goto out_fini_handler;
3883 }
3884
3885 if (read_criu_file(directory, "eth", netnr, eth)) {
3886 container_mem_unlock(c);
3887 goto out_fini_handler;
3888 }
3889
3890 netdev->priv.veth_attr.pair = strdup(veth);
3891 if (!netdev->priv.veth_attr.pair) {
3892 container_mem_unlock(c);
3893 goto out_fini_handler;
3894 }
3895
3896 netnr++;
3897 }
3898
3899 container_mem_unlock(c);
3900
3901 if (lxc_set_state(c->name, handler, RUNNING))
3902 goto out_fini_handler;
3903 }
3904 } else {
3905 ERROR("CRIU was killed with signal %d\n", WTERMSIG(status));
3906 goto out_fini_handler;
3907 }
3908
3909 if (lxc_poll(c->name, handler)) {
3910 lxc_abort(c->name, handler);
3911 goto out_fini_handler;
3912 }
3913 }
3914
3915 has_error = false;
3916
3917 out_fini_handler:
3918 lxc_fini(c->name, handler);
3919 return !has_error;
3920 }
3921
3922 static int lxcapi_attach_run_waitl(struct lxc_container *c, lxc_attach_options_t *options, const char *program, const char *arg, ...)
3923 {
3924 va_list ap;
3925 const char **argv;
3926 int ret;
3927
3928 if (!c)
3929 return -1;
3930
3931 va_start(ap, arg);
3932 argv = lxc_va_arg_list_to_argv_const(ap, 1);
3933 va_end(ap);
3934
3935 if (!argv) {
3936 ERROR("Memory allocation error.");
3937 return -1;
3938 }
3939 argv[0] = arg;
3940
3941 ret = lxcapi_attach_run_wait(c, options, program, (const char * const *)argv);
3942 free((void*)argv);
3943 return ret;
3944 }
3945
3946 struct lxc_container *lxc_container_new(const char *name, const char *configpath)
3947 {
3948 struct lxc_container *c;
3949
3950 if (!name)
3951 return NULL;
3952
3953 c = malloc(sizeof(*c));
3954 if (!c) {
3955 fprintf(stderr, "failed to malloc lxc_container\n");
3956 return NULL;
3957 }
3958 memset(c, 0, sizeof(*c));
3959
3960 if (configpath)
3961 c->config_path = strdup(configpath);
3962 else
3963 c->config_path = strdup(lxc_global_config_value("lxc.lxcpath"));
3964
3965 if (!c->config_path) {
3966 fprintf(stderr, "Out of memory\n");
3967 goto err;
3968 }
3969
3970 remove_trailing_slashes(c->config_path);
3971 c->name = malloc(strlen(name)+1);
3972 if (!c->name) {
3973 fprintf(stderr, "Error allocating lxc_container name\n");
3974 goto err;
3975 }
3976 strcpy(c->name, name);
3977
3978 c->numthreads = 1;
3979 if (!(c->slock = lxc_newlock(c->config_path, name))) {
3980 fprintf(stderr, "failed to create lock\n");
3981 goto err;
3982 }
3983
3984 if (!(c->privlock = lxc_newlock(NULL, NULL))) {
3985 fprintf(stderr, "failed to alloc privlock\n");
3986 goto err;
3987 }
3988
3989 if (!set_config_filename(c)) {
3990 fprintf(stderr, "Error allocating config file pathname\n");
3991 goto err;
3992 }
3993
3994 if (file_exists(c->configfile) && !lxcapi_load_config(c, NULL))
3995 goto err;
3996
3997 if (ongoing_create(c) == 2) {
3998 ERROR("Error: %s creation was not completed", c->name);
3999 container_destroy(c);
4000 lxcapi_clear_config(c);
4001 }
4002 c->daemonize = true;
4003 c->pidfile = NULL;
4004
4005 // assign the member functions
4006 c->is_defined = lxcapi_is_defined;
4007 c->state = lxcapi_state;
4008 c->is_running = lxcapi_is_running;
4009 c->freeze = lxcapi_freeze;
4010 c->unfreeze = lxcapi_unfreeze;
4011 c->console = lxcapi_console;
4012 c->console_getfd = lxcapi_console_getfd;
4013 c->init_pid = lxcapi_init_pid;
4014 c->load_config = lxcapi_load_config;
4015 c->want_daemonize = lxcapi_want_daemonize;
4016 c->want_close_all_fds = lxcapi_want_close_all_fds;
4017 c->start = lxcapi_start;
4018 c->startl = lxcapi_startl;
4019 c->stop = lxcapi_stop;
4020 c->config_file_name = lxcapi_config_file_name;
4021 c->wait = lxcapi_wait;
4022 c->set_config_item = lxcapi_set_config_item;
4023 c->destroy = lxcapi_destroy;
4024 c->destroy_with_snapshots = lxcapi_destroy_with_snapshots;
4025 c->rename = lxcapi_rename;
4026 c->save_config = lxcapi_save_config;
4027 c->get_keys = lxcapi_get_keys;
4028 c->create = lxcapi_create;
4029 c->createl = lxcapi_createl;
4030 c->shutdown = lxcapi_shutdown;
4031 c->reboot = lxcapi_reboot;
4032 c->clear_config = lxcapi_clear_config;
4033 c->clear_config_item = lxcapi_clear_config_item;
4034 c->get_config_item = lxcapi_get_config_item;
4035 c->get_running_config_item = lxcapi_get_running_config_item;
4036 c->get_cgroup_item = lxcapi_get_cgroup_item;
4037 c->set_cgroup_item = lxcapi_set_cgroup_item;
4038 c->get_config_path = lxcapi_get_config_path;
4039 c->set_config_path = lxcapi_set_config_path;
4040 c->clone = lxcapi_clone;
4041 c->get_interfaces = lxcapi_get_interfaces;
4042 c->get_ips = lxcapi_get_ips;
4043 c->attach = lxcapi_attach;
4044 c->attach_run_wait = lxcapi_attach_run_wait;
4045 c->attach_run_waitl = lxcapi_attach_run_waitl;
4046 c->snapshot = lxcapi_snapshot;
4047 c->snapshot_list = lxcapi_snapshot_list;
4048 c->snapshot_restore = lxcapi_snapshot_restore;
4049 c->snapshot_destroy = lxcapi_snapshot_destroy;
4050 c->snapshot_destroy_all = lxcapi_snapshot_destroy_all;
4051 c->may_control = lxcapi_may_control;
4052 c->add_device_node = lxcapi_add_device_node;
4053 c->remove_device_node = lxcapi_remove_device_node;
4054 c->checkpoint = lxcapi_checkpoint;
4055 c->restore = lxcapi_restore;
4056
4057 /* we'll allow the caller to update these later */
4058 if (lxc_log_init(NULL, "none", NULL, "lxc_container", 0, c->config_path)) {
4059 fprintf(stderr, "failed to open log\n");
4060 goto err;
4061 }
4062
4063 return c;
4064
4065 err:
4066 lxc_container_free(c);
4067 return NULL;
4068 }
4069
4070 int lxc_get_wait_states(const char **states)
4071 {
4072 int i;
4073
4074 if (states)
4075 for (i=0; i<MAX_STATE; i++)
4076 states[i] = lxc_state2str(i);
4077 return MAX_STATE;
4078 }
4079
4080 /*
4081 * These next two could probably be done smarter with reusing a common function
4082 * with different iterators and tests...
4083 */
/*
 * List the containers that have a configuration under @lxcpath.
 *
 * @lxcpath  directory to scan; NULL selects the global "lxc.lxcpath" value
 * @names    if non-NULL, receives an allocated array of container names
 * @cret     if non-NULL, receives an allocated array of container objects
 *
 * Directory entries without a config file are ignored.  When @cret is
 * requested, entries whose container cannot be loaded or is not defined are
 * dropped again (including from @names).
 *
 * Returns the number of containers found, or -1 on error.  On error both
 * output pointers are reset to NULL after their contents have been freed.
 */
int list_defined_containers(const char *lxcpath, char ***names, struct lxc_container ***cret)
{
	DIR *dir;
	int i, cfound = 0, nfound = 0;
	struct dirent dirent, *direntp;
	struct lxc_container *c;

	if (!lxcpath)
		lxcpath = lxc_global_config_value("lxc.lxcpath");
	if (!lxcpath)
		return -1;

	dir = opendir(lxcpath);
	if (!dir) {
		SYSERROR("opendir on lxcpath");
		return -1;
	}

	if (cret)
		*cret = NULL;
	if (names)
		*names = NULL;

	while (!readdir_r(dir, &dirent, &direntp)) {
		if (!direntp)
			break;
		if (!strcmp(direntp->d_name, "."))
			continue;
		if (!strcmp(direntp->d_name, ".."))
			continue;

		if (!config_file_exists(lxcpath, direntp->d_name))
			continue;

		if (names) {
			if (!add_to_array(names, direntp->d_name, cfound))
				goto free_bad;
		}
		cfound++;

		/* Names only: no container object has to be built. */
		if (!cret) {
			nfound++;
			continue;
		}

		c = lxc_container_new(direntp->d_name, lxcpath);
		if (!c) {
			INFO("Container %s:%s has a config but could not be loaded",
				lxcpath, direntp->d_name);
			if (names)
				if(!remove_from_array(names, direntp->d_name, cfound--))
					goto free_bad;
			continue;
		}
		if (!lxcapi_is_defined(c)) {
			INFO("Container %s:%s has a config but is not defined",
				lxcpath, direntp->d_name);
			/* Drop our reference first so it is not leaked if
			 * removing the name fails. */
			lxc_container_put(c);
			if (names)
				if(!remove_from_array(names, direntp->d_name, cfound--))
					goto free_bad;
			continue;
		}

		if (!add_to_clist(cret, c, nfound, true)) {
			lxc_container_put(c);
			goto free_bad;
		}
		nfound++;
	}

	closedir(dir);
	return nfound;

free_bad:
	if (names && *names) {
		for (i=0; i<cfound; i++)
			free((*names)[i]);
		free(*names);
		/* Do not hand a dangling pointer back to the caller. */
		*names = NULL;
	}
	if (cret && *cret) {
		for (i=0; i<nfound; i++)
			lxc_container_put((*cret)[i]);
		free(*cret);
		*cret = NULL;
	}
	closedir(dir);
	return -1;
}
4170
/*
 * List the containers under @lxcpath that currently have a command socket.
 *
 * /proc/net/unix is scanned for socket names of the form
 * "@<lxcpath>/<name>/command" or "@lxc/<hash>/command"; for the hashed form
 * the lxcpath and name are obtained through lxc_cmd_get_lxcpath() and
 * lxc_cmd_get_name().
 *
 * @lxcpath  lxcpath to match; NULL selects the global "lxc.lxcpath" value
 * @nret     if non-NULL, receives an allocated array of container names
 * @cret     if non-NULL, receives an allocated array of container objects
 *
 * Returns the number of active containers, or -1 on error.  On error both
 * output pointers are NULL.
 */
int list_active_containers(const char *lxcpath, char ***nret,
		struct lxc_container ***cret)
{
	int i, ret = -1, cret_cnt = 0, ct_name_cnt = 0;
	int lxcpath_len;
	char *line = NULL;
	char **ct_name = NULL;
	size_t len = 0;
	struct lxc_container *c;
	bool is_hashed;

	if (!lxcpath)
		lxcpath = lxc_global_config_value("lxc.lxcpath");
	if (!lxcpath)
		return -1;
	lxcpath_len = strlen(lxcpath);

	if (cret)
		*cret = NULL;
	if (nret)
		*nret = NULL;

	FILE *f = fopen("/proc/net/unix", "r");
	if (!f)
		return -1;

	while (getline(&line, &len, f) != -1) {

		/* The socket name is the last space-separated field. */
		char *p = strrchr(line, ' '), *p2;
		if (!p)
			continue;
		p++;
		/* 0x40 is '@': only names with that prefix are considered. */
		if (*p != 0x40)
			continue;
		p++;

		is_hashed = false;
		if (strncmp(p, lxcpath, lxcpath_len) == 0) {
			p += lxcpath_len;
		} else if (strncmp(p, "lxc/", 4) == 0) {
			p += 4;
			is_hashed = true;
		} else {
			continue;
		}

		while (*p == '/')
			p++;

		// Now p is the start of lxc_name
		p2 = strchr(p, '/');
		if (!p2 || strncmp(p2, "/command", 8) != 0)
			continue;
		*p2 = '\0';

		if (is_hashed) {
			/* NOTE(review): ownership of the strings returned by
			 * the two lxc_cmd_get_* helpers is not visible here;
			 * confirm whether they need to be freed. */
			char *recvpath = lxc_cmd_get_lxcpath(p);

			if (!recvpath)
				continue;
			if (strncmp(lxcpath, recvpath, lxcpath_len) != 0)
				continue;
			p = lxc_cmd_get_name(p);
			if (!p)
				continue;
		}

		if (array_contains(&ct_name, p, ct_name_cnt))
			continue;

		if (!add_to_array(&ct_name, p, ct_name_cnt))
			goto free_cret_list;

		ct_name_cnt++;

		if (!cret)
			continue;

		c = lxc_container_new(p, lxcpath);
		if (!c) {
			INFO("Container %s:%s is running but could not be loaded",
				lxcpath, p);
			remove_from_array(&ct_name, p, ct_name_cnt--);
			continue;
		}

		/*
		 * If this is an anonymous container, then is_defined *can*
		 * return false.  So we don't do that check.  Count on the
		 * fact that the command socket exists.
		 */

		if (!add_to_clist(cret, c, cret_cnt, true)) {
			lxc_container_put(c);
			goto free_cret_list;
		}
		cret_cnt++;
	}

	assert(!nret || !cret || cret_cnt == ct_name_cnt);
	ret = ct_name_cnt;
	if (nret)
		*nret = ct_name;
	else
		goto free_ct_name;
	goto out;

free_cret_list:
	if (cret && *cret) {
		for (i = 0; i < cret_cnt; i++)
			lxc_container_put((*cret)[i]);
		free(*cret);
		/* Do not hand a dangling pointer back to the caller. */
		*cret = NULL;
	}

free_ct_name:
	if (ct_name) {
		for (i = 0; i < ct_name_cnt; i++)
			free(ct_name[i]);
		free(ct_name);
	}

out:
	free(line);

	fclose(f);
	return ret;
}
4291
/*
 * List every container under @lxcpath that is either defined or active.
 *
 * The names from list_defined_containers() are merged with those from
 * list_active_containers(); when @cret is requested a container object is
 * created for each name, and names whose container cannot be loaded are
 * removed again.
 *
 * @lxcpath  lxcpath to inspect (passed through to the two list functions)
 * @nret     if non-NULL, receives an allocated array of container names
 * @cret     if non-NULL, receives an allocated array of container objects
 *
 * Returns the number of containers, or a negative value on error.  Both
 * output pointers are set to NULL on entry, so they are NULL on error.
 */
int list_all_containers(const char *lxcpath, char ***nret,
		struct lxc_container ***cret)
{
	int i, ret, active_cnt, ct_cnt, ct_list_cnt;
	char **active_name;
	char **ct_name;
	struct lxc_container **ct_list = NULL;

	/* Same contract as the two sibling list functions: outputs are
	 * well defined even when we fail. */
	if (cret)
		*cret = NULL;
	if (nret)
		*nret = NULL;

	ct_cnt = list_defined_containers(lxcpath, &ct_name, NULL);
	if (ct_cnt < 0)
		return ct_cnt;

	active_cnt = list_active_containers(lxcpath, &active_name, NULL);
	if (active_cnt < 0) {
		ret = active_cnt;
		goto free_ct_name;
	}

	/* Merge active names that are not already known, releasing each
	 * active name as soon as it has been handled. */
	for (i = 0; i < active_cnt; i++) {
		if (!array_contains(&ct_name, active_name[i], ct_cnt)) {
			if (!add_to_array(&ct_name, active_name[i], ct_cnt)) {
				ret = -1;
				goto free_active_name;
			}
			ct_cnt++;
		}
		free(active_name[i]);
		active_name[i] = NULL;
	}
	free(active_name);
	active_name = NULL;
	active_cnt = 0;

	for (i = 0, ct_list_cnt = 0; i < ct_cnt && cret; i++) {
		struct lxc_container *c;

		c = lxc_container_new(ct_name[i], lxcpath);
		if (!c) {
			WARN("Container %s:%s could not be loaded", lxcpath, ct_name[i]);
			/* NOTE(review): if remove_from_array() shifts later
			 * entries down, the entry that lands in slot i is
			 * skipped by the loop increment - confirm. */
			remove_from_array(&ct_name, ct_name[i], ct_cnt--);
			continue;
		}

		if (!add_to_clist(&ct_list, c, ct_list_cnt, false)) {
			lxc_container_put(c);
			ret = -1;
			goto free_ct_list;
		}
		ct_list_cnt++;
	}

	if (cret)
		*cret = ct_list;

	if (nret)
		*nret = ct_name;
	else {
		/* The caller does not want the names: release them. */
		ret = ct_cnt;
		goto free_ct_name;
	}
	return ct_cnt;

free_ct_list:
	for (i = 0; i < ct_list_cnt; i++) {
		lxc_container_put(ct_list[i]);
	}
	free(ct_list);

free_active_name:
	/* active_cnt is 0 once the merge loop has completed, so the array is
	 * only touched when we bailed out in the middle of the merge. */
	for (i = 0; i < active_cnt; i++) {
		free(active_name[i]);
	}
	free(active_name);

free_ct_name:
	for (i = 0; i < ct_cnt; i++) {
		free(ct_name[i]);
	}
	free(ct_name);
	return ret;
}