]> git.proxmox.com Git - systemd.git/blame - src/core/main.c
Imported Upstream version 218
[systemd.git] / src / core / main.c
CommitLineData
663996b3
MS
1/*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
2
3/***
4 This file is part of systemd.
5
6 Copyright 2010 Lennart Poettering
7
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
12
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
17
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
20***/
21
663996b3
MS
22#include <stdio.h>
23#include <errno.h>
24#include <string.h>
25#include <unistd.h>
26#include <sys/types.h>
27#include <sys/stat.h>
28#include <getopt.h>
29#include <signal.h>
30#include <sys/wait.h>
31#include <fcntl.h>
32#include <sys/prctl.h>
33#include <sys/mount.h>
34
60f067b4
JS
35#ifdef HAVE_VALGRIND_VALGRIND_H
36#include <valgrind/valgrind.h>
37#endif
38#ifdef HAVE_SECCOMP
39#include <seccomp.h>
40#endif
41
42#include "sd-daemon.h"
43#include "sd-messages.h"
44#include "sd-bus.h"
663996b3
MS
45#include "manager.h"
46#include "log.h"
47#include "load-fragment.h"
48#include "fdset.h"
49#include "special.h"
50#include "conf-parser.h"
663996b3
MS
51#include "missing.h"
52#include "label.h"
5eef597e 53#include "pager.h"
663996b3
MS
54#include "build.h"
55#include "strv.h"
56#include "def.h"
57#include "virt.h"
60f067b4 58#include "architecture.h"
663996b3
MS
59#include "watchdog.h"
60#include "path-util.h"
61#include "switch-root.h"
62#include "capability.h"
63#include "killall.h"
64#include "env-util.h"
60f067b4
JS
65#include "clock-util.h"
66#include "fileio.h"
67#include "dbus-manager.h"
68#include "bus-error.h"
69#include "bus-util.h"
663996b3
MS
70
71#include "mount-setup.h"
72#include "loopback-setup.h"
663996b3
MS
73#include "hostname-setup.h"
74#include "machine-id-setup.h"
663996b3
MS
75#include "selinux-setup.h"
76#include "ima-setup.h"
663996b3 77#include "smack-setup.h"
60f067b4 78#include "kmod-setup.h"
663996b3
MS
79
80static enum {
81 ACTION_RUN,
82 ACTION_HELP,
83 ACTION_VERSION,
84 ACTION_TEST,
85 ACTION_DUMP_CONFIGURATION_ITEMS,
86 ACTION_DONE
87} arg_action = ACTION_RUN;
663996b3
MS
88static char *arg_default_unit = NULL;
89static SystemdRunningAs arg_running_as = _SYSTEMD_RUNNING_AS_INVALID;
663996b3
MS
90static bool arg_dump_core = true;
91static bool arg_crash_shell = false;
92static int arg_crash_chvt = -1;
93static bool arg_confirm_spawn = false;
60f067b4 94static ShowStatus arg_show_status = _SHOW_STATUS_UNSET;
663996b3 95static bool arg_switched_root = false;
5eef597e 96static int arg_no_pager = -1;
663996b3
MS
97static char ***arg_join_controllers = NULL;
98static ExecOutput arg_default_std_output = EXEC_OUTPUT_JOURNAL;
99static ExecOutput arg_default_std_error = EXEC_OUTPUT_INHERIT;
60f067b4
JS
100static usec_t arg_default_restart_usec = DEFAULT_RESTART_USEC;
101static usec_t arg_default_timeout_start_usec = DEFAULT_TIMEOUT_USEC;
102static usec_t arg_default_timeout_stop_usec = DEFAULT_TIMEOUT_USEC;
103static usec_t arg_default_start_limit_interval = DEFAULT_START_LIMIT_INTERVAL;
104static unsigned arg_default_start_limit_burst = DEFAULT_START_LIMIT_BURST;
663996b3
MS
105static usec_t arg_runtime_watchdog = 0;
106static usec_t arg_shutdown_watchdog = 10 * USEC_PER_MINUTE;
14228c0d 107static char **arg_default_environment = NULL;
60f067b4 108static struct rlimit *arg_default_rlimit[_RLIMIT_MAX] = {};
663996b3 109static uint64_t arg_capability_bounding_set_drop = 0;
5eef597e 110static nsec_t arg_timer_slack_nsec = NSEC_INFINITY;
60f067b4
JS
111static usec_t arg_default_timer_accuracy_usec = 1 * USEC_PER_MINUTE;
112static Set* arg_syscall_archs = NULL;
113static FILE* arg_serialization = NULL;
114static bool arg_default_cpu_accounting = false;
115static bool arg_default_blockio_accounting = false;
116static bool arg_default_memory_accounting = false;
663996b3 117
60f067b4 118static void nop_handler(int sig) {}
663996b3 119
5eef597e
MP
120static void pager_open_if_enabled(void) {
121
122 if (arg_no_pager <= 0)
123 return;
124
125 pager_open(false);
126}
127
60f067b4 128noreturn static void crash(int sig) {
663996b3 129
14228c0d
MB
130 if (getpid() != 1)
131 /* Pass this on immediately, if this is not PID 1 */
132 raise(sig);
133 else if (!arg_dump_core)
f47781d8 134 log_emergency("Caught <%s>, not dumping core.", signal_to_string(sig));
663996b3
MS
135 else {
136 struct sigaction sa = {
137 .sa_handler = nop_handler,
138 .sa_flags = SA_NOCLDSTOP|SA_RESTART,
139 };
140 pid_t pid;
141
142 /* We want to wait for the core process, hence let's enable SIGCHLD */
14228c0d 143 sigaction(SIGCHLD, &sa, NULL);
663996b3
MS
144
145 pid = fork();
146 if (pid < 0)
f47781d8 147 log_emergency_errno(errno, "Caught <%s>, cannot fork for core dump: %m", signal_to_string(sig));
663996b3
MS
148
149 else if (pid == 0) {
150 struct rlimit rl = {};
151
152 /* Enable default signal handler for core dump */
153 zero(sa);
154 sa.sa_handler = SIG_DFL;
14228c0d 155 sigaction(sig, &sa, NULL);
663996b3
MS
156
157 /* Don't limit the core dump size */
158 rl.rlim_cur = RLIM_INFINITY;
159 rl.rlim_max = RLIM_INFINITY;
160 setrlimit(RLIMIT_CORE, &rl);
161
162 /* Just to be sure... */
14228c0d 163 chdir("/");
663996b3
MS
164
165 /* Raise the signal again */
166 raise(sig);
167
168 assert_not_reached("We shouldn't be here...");
169 _exit(1);
170
171 } else {
172 siginfo_t status;
173 int r;
174
175 /* Order things nicely. */
176 r = wait_for_terminate(pid, &status);
177 if (r < 0)
f47781d8 178 log_emergency_errno(r, "Caught <%s>, waitpid() failed: %m", signal_to_string(sig));
663996b3 179 else if (status.si_code != CLD_DUMPED)
f47781d8 180 log_emergency("Caught <%s>, core dump failed.", signal_to_string(sig));
663996b3 181 else
f47781d8 182 log_emergency("Caught <%s>, dumped core as pid "PID_FMT".", signal_to_string(sig), pid);
663996b3
MS
183 }
184 }
185
186 if (arg_crash_chvt)
187 chvt(arg_crash_chvt);
188
189 if (arg_crash_shell) {
190 struct sigaction sa = {
191 .sa_handler = SIG_IGN,
192 .sa_flags = SA_NOCLDSTOP|SA_NOCLDWAIT|SA_RESTART,
193 };
194 pid_t pid;
195
196 log_info("Executing crash shell in 10s...");
197 sleep(10);
198
199 /* Let the kernel reap children for us */
200 assert_se(sigaction(SIGCHLD, &sa, NULL) == 0);
201
202 pid = fork();
203 if (pid < 0)
f47781d8 204 log_emergency_errno(errno, "Failed to fork off crash shell: %m");
663996b3
MS
205 else if (pid == 0) {
206 make_console_stdio();
207 execl("/bin/sh", "/bin/sh", NULL);
208
f47781d8 209 log_emergency_errno(errno, "execl() failed: %m");
663996b3
MS
210 _exit(1);
211 }
212
60f067b4 213 log_info("Successfully spawned crash shell as pid "PID_FMT".", pid);
663996b3
MS
214 }
215
f47781d8 216 log_emergency("Freezing execution.");
663996b3
MS
217 freeze();
218}
219
220static void install_crash_handler(void) {
221 struct sigaction sa = {
222 .sa_handler = crash,
223 .sa_flags = SA_NODEFER,
224 };
225
226 sigaction_many(&sa, SIGNALS_CRASH_HANDLER, -1);
227}
228
5eef597e
MP
229static int console_setup(void) {
230 _cleanup_close_ int tty_fd = -1;
231 int r;
663996b3
MS
232
233 tty_fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
f47781d8
MP
234 if (tty_fd < 0)
235 return log_error_errno(tty_fd, "Failed to open /dev/console: %m");
663996b3 236
5eef597e
MP
237 /* We don't want to force text mode. plymouth may be showing
238 * pictures already from initrd. */
663996b3 239 r = reset_terminal_fd(tty_fd, false);
f47781d8
MP
240 if (r < 0)
241 return log_error_errno(r, "Failed to reset /dev/console: %m");
663996b3 242
5eef597e 243 return 0;
663996b3
MS
244}
245
246static int set_default_unit(const char *u) {
247 char *c;
248
249 assert(u);
250
251 c = strdup(u);
252 if (!c)
253 return -ENOMEM;
254
255 free(arg_default_unit);
256 arg_default_unit = c;
257
258 return 0;
259}
260
60f067b4 261static int parse_proc_cmdline_item(const char *key, const char *value) {
663996b3
MS
262
263 static const char * const rlmap[] = {
264 "emergency", SPECIAL_EMERGENCY_TARGET,
265 "-b", SPECIAL_EMERGENCY_TARGET,
5eef597e 266 "rescue", SPECIAL_RESCUE_TARGET,
663996b3
MS
267 "single", SPECIAL_RESCUE_TARGET,
268 "-s", SPECIAL_RESCUE_TARGET,
269 "s", SPECIAL_RESCUE_TARGET,
270 "S", SPECIAL_RESCUE_TARGET,
271 "1", SPECIAL_RESCUE_TARGET,
272 "2", SPECIAL_RUNLEVEL2_TARGET,
273 "3", SPECIAL_RUNLEVEL3_TARGET,
274 "4", SPECIAL_RUNLEVEL4_TARGET,
275 "5", SPECIAL_RUNLEVEL5_TARGET,
276 };
60f067b4 277 int r;
663996b3 278
60f067b4 279 assert(key);
663996b3 280
60f067b4 281 if (streq(key, "systemd.unit") && value) {
663996b3
MS
282
283 if (!in_initrd())
60f067b4 284 return set_default_unit(value);
663996b3 285
60f067b4 286 } else if (streq(key, "rd.systemd.unit") && value) {
663996b3 287
e842803a
MB
288 if (in_initrd())
289 return set_default_unit(value);
663996b3 290
60f067b4 291 } else if (streq(key, "systemd.dump_core") && value) {
663996b3 292
60f067b4
JS
293 r = parse_boolean(value);
294 if (r < 0)
295 log_warning("Failed to parse dump core switch %s. Ignoring.", value);
663996b3
MS
296 else
297 arg_dump_core = r;
298
60f067b4 299 } else if (streq(key, "systemd.crash_shell") && value) {
663996b3 300
60f067b4
JS
301 r = parse_boolean(value);
302 if (r < 0)
303 log_warning("Failed to parse crash shell switch %s. Ignoring.", value);
663996b3
MS
304 else
305 arg_crash_shell = r;
306
60f067b4 307 } else if (streq(key, "systemd.crash_chvt") && value) {
663996b3 308
60f067b4
JS
309 if (safe_atoi(value, &r) < 0)
310 log_warning("Failed to parse crash chvt switch %s. Ignoring.", value);
663996b3 311 else
60f067b4 312 arg_crash_chvt = r;
663996b3 313
60f067b4 314 } else if (streq(key, "systemd.confirm_spawn") && value) {
663996b3 315
60f067b4
JS
316 r = parse_boolean(value);
317 if (r < 0)
318 log_warning("Failed to parse confirm spawn switch %s. Ignoring.", value);
663996b3 319 else
60f067b4 320 arg_confirm_spawn = r;
663996b3 321
60f067b4 322 } else if (streq(key, "systemd.show_status") && value) {
663996b3 323
60f067b4
JS
324 r = parse_show_status(value, &arg_show_status);
325 if (r < 0)
326 log_warning("Failed to parse show status switch %s. Ignoring.", value);
327
328 } else if (streq(key, "systemd.default_standard_output") && value) {
663996b3 329
60f067b4
JS
330 r = exec_output_from_string(value);
331 if (r < 0)
332 log_warning("Failed to parse default standard output switch %s. Ignoring.", value);
663996b3
MS
333 else
334 arg_default_std_output = r;
663996b3 335
60f067b4
JS
336 } else if (streq(key, "systemd.default_standard_error") && value) {
337
338 r = exec_output_from_string(value);
339 if (r < 0)
340 log_warning("Failed to parse default standard error switch %s. Ignoring.", value);
663996b3
MS
341 else
342 arg_default_std_error = r;
663996b3 343
60f067b4 344 } else if (streq(key, "systemd.setenv") && value) {
663996b3 345
60f067b4 346 if (env_assignment_is_valid(value)) {
14228c0d
MB
347 char **env;
348
60f067b4 349 env = strv_env_set(arg_default_environment, value);
14228c0d
MB
350 if (env)
351 arg_default_environment = env;
352 else
f47781d8 353 log_warning_errno(ENOMEM, "Setting environment variable '%s' failed, ignoring: %m", value);
14228c0d 354 } else
60f067b4 355 log_warning("Environment variable name '%s' is not valid. Ignoring.", value);
663996b3 356
60f067b4 357 } else if (streq(key, "quiet") && !value) {
e842803a
MB
358
359 log_set_max_level(LOG_NOTICE);
360
60f067b4
JS
361 if (arg_show_status == _SHOW_STATUS_UNSET)
362 arg_show_status = SHOW_STATUS_AUTO;
363
364 } else if (streq(key, "debug") && !value) {
e842803a 365
5eef597e
MP
366 /* Note that log_parse_environment() handles 'debug'
367 * too, and sets the log level to LOG_DEBUG. */
e842803a 368
60f067b4
JS
369 if (detect_container(NULL) > 0)
370 log_set_target(LOG_TARGET_CONSOLE);
371
372 } else if (!in_initrd() && !value) {
663996b3
MS
373 unsigned i;
374
375 /* SysV compatibility */
376 for (i = 0; i < ELEMENTSOF(rlmap); i += 2)
60f067b4 377 if (streq(key, rlmap[i]))
663996b3
MS
378 return set_default_unit(rlmap[i+1]);
379 }
380
381 return 0;
382}
383
384#define DEFINE_SETTER(name, func, descr) \
385 static int name(const char *unit, \
386 const char *filename, \
387 unsigned line, \
388 const char *section, \
60f067b4 389 unsigned section_line, \
663996b3
MS
390 const char *lvalue, \
391 int ltype, \
392 const char *rvalue, \
393 void *data, \
394 void *userdata) { \
395 \
396 int r; \
397 \
398 assert(filename); \
399 assert(lvalue); \
400 assert(rvalue); \
401 \
402 r = func(rvalue); \
403 if (r < 0) \
404 log_syntax(unit, LOG_ERR, filename, line, -r, \
405 "Invalid " descr "'%s': %s", \
406 rvalue, strerror(-r)); \
407 \
408 return 0; \
409 }
410
411DEFINE_SETTER(config_parse_level2, log_set_max_level_from_string, "log level")
412DEFINE_SETTER(config_parse_target, log_set_target_from_string, "target")
413DEFINE_SETTER(config_parse_color, log_show_color_from_string, "color" )
414DEFINE_SETTER(config_parse_location, log_show_location_from_string, "location")
415
60f067b4
JS
416static int config_parse_cpu_affinity2(
417 const char *unit,
418 const char *filename,
419 unsigned line,
420 const char *section,
421 unsigned section_line,
422 const char *lvalue,
423 int ltype,
424 const char *rvalue,
425 void *data,
426 void *userdata) {
663996b3 427
5eef597e 428 const char *word, *state;
663996b3 429 size_t l;
663996b3
MS
430 cpu_set_t *c = NULL;
431 unsigned ncpus = 0;
432
433 assert(filename);
434 assert(lvalue);
435 assert(rvalue);
436
5eef597e 437 FOREACH_WORD_QUOTED(word, l, rvalue, state) {
663996b3
MS
438 char *t;
439 int r;
440 unsigned cpu;
441
5eef597e 442 if (!(t = strndup(word, l)))
663996b3
MS
443 return log_oom();
444
445 r = safe_atou(t, &cpu);
446 free(t);
447
448 if (!c)
449 if (!(c = cpu_set_malloc(&ncpus)))
450 return log_oom();
451
452 if (r < 0 || cpu >= ncpus) {
453 log_syntax(unit, LOG_ERR, filename, line, -r,
454 "Failed to parse CPU affinity '%s'", rvalue);
455 CPU_FREE(c);
456 return -EBADMSG;
457 }
458
459 CPU_SET_S(cpu, CPU_ALLOC_SIZE(ncpus), c);
460 }
5eef597e
MP
461 if (!isempty(state))
462 log_syntax(unit, LOG_ERR, filename, line, EINVAL,
463 "Trailing garbage, ignoring.");
663996b3
MS
464
465 if (c) {
466 if (sched_setaffinity(0, CPU_ALLOC_SIZE(ncpus), c) < 0)
f47781d8 467 log_unit_warning(unit, "Failed to set CPU affinity: %m");
663996b3
MS
468
469 CPU_FREE(c);
470 }
471
472 return 0;
473}
474
60f067b4
JS
475static int config_parse_show_status(
476 const char* unit,
477 const char *filename,
478 unsigned line,
479 const char *section,
480 unsigned section_line,
481 const char *lvalue,
482 int ltype,
483 const char *rvalue,
484 void *data,
485 void *userdata) {
486
487 int k;
488 ShowStatus *b = data;
489
490 assert(filename);
491 assert(lvalue);
492 assert(rvalue);
493 assert(data);
494
495 k = parse_show_status(rvalue, b);
496 if (k < 0) {
497 log_syntax(unit, LOG_ERR, filename, line, -k,
498 "Failed to parse show status setting, ignoring: %s", rvalue);
499 return 0;
500 }
501
502 return 0;
503}
504
663996b3
MS
505static void strv_free_free(char ***l) {
506 char ***i;
507
508 if (!l)
509 return;
510
511 for (i = l; *i; i++)
512 strv_free(*i);
513
514 free(l);
515}
516
517static void free_join_controllers(void) {
518 strv_free_free(arg_join_controllers);
519 arg_join_controllers = NULL;
520}
521
522static int config_parse_join_controllers(const char *unit,
523 const char *filename,
524 unsigned line,
525 const char *section,
60f067b4 526 unsigned section_line,
663996b3
MS
527 const char *lvalue,
528 int ltype,
529 const char *rvalue,
530 void *data,
531 void *userdata) {
532
533 unsigned n = 0;
5eef597e 534 const char *word, *state;
663996b3
MS
535 size_t length;
536
537 assert(filename);
538 assert(lvalue);
539 assert(rvalue);
540
541 free_join_controllers();
542
5eef597e 543 FOREACH_WORD_QUOTED(word, length, rvalue, state) {
663996b3
MS
544 char *s, **l;
545
5eef597e 546 s = strndup(word, length);
663996b3
MS
547 if (!s)
548 return log_oom();
549
550 l = strv_split(s, ",");
551 free(s);
552
553 strv_uniq(l);
554
555 if (strv_length(l) <= 1) {
556 strv_free(l);
557 continue;
558 }
559
560 if (!arg_join_controllers) {
561 arg_join_controllers = new(char**, 2);
562 if (!arg_join_controllers) {
563 strv_free(l);
564 return log_oom();
565 }
566
567 arg_join_controllers[0] = l;
568 arg_join_controllers[1] = NULL;
569
570 n = 1;
571 } else {
572 char ***a;
573 char ***t;
574
575 t = new0(char**, n+2);
576 if (!t) {
577 strv_free(l);
578 return log_oom();
579 }
580
581 n = 0;
582
583 for (a = arg_join_controllers; *a; a++) {
584
585 if (strv_overlap(*a, l)) {
60f067b4 586 if (strv_extend_strv(&l, *a) < 0) {
663996b3
MS
587 strv_free(l);
588 strv_free_free(t);
589 return log_oom();
590 }
591
663996b3
MS
592 } else {
593 char **c;
594
595 c = strv_copy(*a);
596 if (!c) {
597 strv_free(l);
598 strv_free_free(t);
599 return log_oom();
600 }
601
602 t[n++] = c;
603 }
604 }
605
606 t[n++] = strv_uniq(l);
607
608 strv_free_free(arg_join_controllers);
609 arg_join_controllers = t;
610 }
611 }
5eef597e
MP
612 if (!isempty(state))
613 log_syntax(unit, LOG_ERR, filename, line, EINVAL,
614 "Trailing garbage, ignoring.");
663996b3
MS
615
616 return 0;
617}
618
619static int parse_config_file(void) {
620
621 const ConfigTableItem items[] = {
60f067b4
JS
622 { "Manager", "LogLevel", config_parse_level2, 0, NULL },
623 { "Manager", "LogTarget", config_parse_target, 0, NULL },
624 { "Manager", "LogColor", config_parse_color, 0, NULL },
625 { "Manager", "LogLocation", config_parse_location, 0, NULL },
626 { "Manager", "DumpCore", config_parse_bool, 0, &arg_dump_core },
627 { "Manager", "CrashShell", config_parse_bool, 0, &arg_crash_shell },
628 { "Manager", "ShowStatus", config_parse_show_status, 0, &arg_show_status },
629 { "Manager", "CrashChVT", config_parse_int, 0, &arg_crash_chvt },
630 { "Manager", "CPUAffinity", config_parse_cpu_affinity2, 0, NULL },
631 { "Manager", "JoinControllers", config_parse_join_controllers, 0, &arg_join_controllers },
632 { "Manager", "RuntimeWatchdogSec", config_parse_sec, 0, &arg_runtime_watchdog },
633 { "Manager", "ShutdownWatchdogSec", config_parse_sec, 0, &arg_shutdown_watchdog },
634 { "Manager", "CapabilityBoundingSet", config_parse_bounding_set, 0, &arg_capability_bounding_set_drop },
635#ifdef HAVE_SECCOMP
636 { "Manager", "SystemCallArchitectures", config_parse_syscall_archs, 0, &arg_syscall_archs },
637#endif
638 { "Manager", "TimerSlackNSec", config_parse_nsec, 0, &arg_timer_slack_nsec },
639 { "Manager", "DefaultTimerAccuracySec", config_parse_sec, 0, &arg_default_timer_accuracy_usec },
640 { "Manager", "DefaultStandardOutput", config_parse_output, 0, &arg_default_std_output },
641 { "Manager", "DefaultStandardError", config_parse_output, 0, &arg_default_std_error },
642 { "Manager", "DefaultTimeoutStartSec", config_parse_sec, 0, &arg_default_timeout_start_usec },
643 { "Manager", "DefaultTimeoutStopSec", config_parse_sec, 0, &arg_default_timeout_stop_usec },
644 { "Manager", "DefaultRestartSec", config_parse_sec, 0, &arg_default_restart_usec },
645 { "Manager", "DefaultStartLimitInterval", config_parse_sec, 0, &arg_default_start_limit_interval },
646 { "Manager", "DefaultStartLimitBurst", config_parse_unsigned, 0, &arg_default_start_limit_burst },
647 { "Manager", "DefaultEnvironment", config_parse_environ, 0, &arg_default_environment },
648 { "Manager", "DefaultLimitCPU", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CPU] },
649 { "Manager", "DefaultLimitFSIZE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_FSIZE] },
650 { "Manager", "DefaultLimitDATA", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_DATA] },
651 { "Manager", "DefaultLimitSTACK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_STACK] },
652 { "Manager", "DefaultLimitCORE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CORE] },
653 { "Manager", "DefaultLimitRSS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RSS] },
654 { "Manager", "DefaultLimitNOFILE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NOFILE] },
655 { "Manager", "DefaultLimitAS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_AS] },
656 { "Manager", "DefaultLimitNPROC", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NPROC] },
657 { "Manager", "DefaultLimitMEMLOCK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MEMLOCK] },
658 { "Manager", "DefaultLimitLOCKS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_LOCKS] },
659 { "Manager", "DefaultLimitSIGPENDING", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_SIGPENDING] },
660 { "Manager", "DefaultLimitMSGQUEUE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MSGQUEUE] },
661 { "Manager", "DefaultLimitNICE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NICE] },
662 { "Manager", "DefaultLimitRTPRIO", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTPRIO] },
663 { "Manager", "DefaultLimitRTTIME", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTTIME] },
664 { "Manager", "DefaultCPUAccounting", config_parse_bool, 0, &arg_default_cpu_accounting },
665 { "Manager", "DefaultBlockIOAccounting", config_parse_bool, 0, &arg_default_blockio_accounting },
666 { "Manager", "DefaultMemoryAccounting", config_parse_bool, 0, &arg_default_memory_accounting },
667 {}
663996b3
MS
668 };
669
f47781d8 670 const char *fn, *conf_dirs_nulstr;
663996b3
MS
671
672 fn = arg_running_as == SYSTEMD_SYSTEM ? PKGSYSCONFDIR "/system.conf" : PKGSYSCONFDIR "/user.conf";
f47781d8
MP
673 conf_dirs_nulstr = arg_running_as == SYSTEMD_SYSTEM ? CONF_DIRS_NULSTR("systemd/system.conf") : CONF_DIRS_NULSTR("systemd/user.conf");
674 config_parse_many(fn, conf_dirs_nulstr, "Manager\0",
675 config_item_table_lookup, items, false, NULL);
663996b3
MS
676
677 return 0;
678}
679
663996b3
MS
680static int parse_argv(int argc, char *argv[]) {
681
682 enum {
683 ARG_LOG_LEVEL = 0x100,
684 ARG_LOG_TARGET,
685 ARG_LOG_COLOR,
686 ARG_LOG_LOCATION,
687 ARG_UNIT,
688 ARG_SYSTEM,
689 ARG_USER,
690 ARG_TEST,
5eef597e 691 ARG_NO_PAGER,
663996b3
MS
692 ARG_VERSION,
693 ARG_DUMP_CONFIGURATION_ITEMS,
694 ARG_DUMP_CORE,
695 ARG_CRASH_SHELL,
696 ARG_CONFIRM_SPAWN,
697 ARG_SHOW_STATUS,
698 ARG_DESERIALIZE,
699 ARG_SWITCHED_ROOT,
663996b3
MS
700 ARG_DEFAULT_STD_OUTPUT,
701 ARG_DEFAULT_STD_ERROR
702 };
703
704 static const struct option options[] = {
705 { "log-level", required_argument, NULL, ARG_LOG_LEVEL },
706 { "log-target", required_argument, NULL, ARG_LOG_TARGET },
707 { "log-color", optional_argument, NULL, ARG_LOG_COLOR },
708 { "log-location", optional_argument, NULL, ARG_LOG_LOCATION },
709 { "unit", required_argument, NULL, ARG_UNIT },
710 { "system", no_argument, NULL, ARG_SYSTEM },
711 { "user", no_argument, NULL, ARG_USER },
712 { "test", no_argument, NULL, ARG_TEST },
5eef597e 713 { "no-pager", no_argument, NULL, ARG_NO_PAGER },
663996b3
MS
714 { "help", no_argument, NULL, 'h' },
715 { "version", no_argument, NULL, ARG_VERSION },
716 { "dump-configuration-items", no_argument, NULL, ARG_DUMP_CONFIGURATION_ITEMS },
717 { "dump-core", optional_argument, NULL, ARG_DUMP_CORE },
718 { "crash-shell", optional_argument, NULL, ARG_CRASH_SHELL },
719 { "confirm-spawn", optional_argument, NULL, ARG_CONFIRM_SPAWN },
720 { "show-status", optional_argument, NULL, ARG_SHOW_STATUS },
721 { "deserialize", required_argument, NULL, ARG_DESERIALIZE },
722 { "switched-root", no_argument, NULL, ARG_SWITCHED_ROOT },
663996b3
MS
723 { "default-standard-output", required_argument, NULL, ARG_DEFAULT_STD_OUTPUT, },
724 { "default-standard-error", required_argument, NULL, ARG_DEFAULT_STD_ERROR, },
60f067b4 725 {}
663996b3
MS
726 };
727
728 int c, r;
729
730 assert(argc >= 1);
731 assert(argv);
732
733 if (getpid() == 1)
734 opterr = 0;
735
736 while ((c = getopt_long(argc, argv, "hDbsz:", options, NULL)) >= 0)
737
738 switch (c) {
739
740 case ARG_LOG_LEVEL:
60f067b4
JS
741 r = log_set_max_level_from_string(optarg);
742 if (r < 0) {
663996b3
MS
743 log_error("Failed to parse log level %s.", optarg);
744 return r;
745 }
746
747 break;
748
749 case ARG_LOG_TARGET:
60f067b4
JS
750 r = log_set_target_from_string(optarg);
751 if (r < 0) {
663996b3
MS
752 log_error("Failed to parse log target %s.", optarg);
753 return r;
754 }
755
756 break;
757
758 case ARG_LOG_COLOR:
759
760 if (optarg) {
60f067b4
JS
761 r = log_show_color_from_string(optarg);
762 if (r < 0) {
663996b3
MS
763 log_error("Failed to parse log color setting %s.", optarg);
764 return r;
765 }
766 } else
767 log_show_color(true);
768
769 break;
770
771 case ARG_LOG_LOCATION:
663996b3 772 if (optarg) {
60f067b4
JS
773 r = log_show_location_from_string(optarg);
774 if (r < 0) {
663996b3
MS
775 log_error("Failed to parse log location setting %s.", optarg);
776 return r;
777 }
778 } else
779 log_show_location(true);
780
781 break;
782
783 case ARG_DEFAULT_STD_OUTPUT:
60f067b4
JS
784 r = exec_output_from_string(optarg);
785 if (r < 0) {
663996b3
MS
786 log_error("Failed to parse default standard output setting %s.", optarg);
787 return r;
788 } else
789 arg_default_std_output = r;
790 break;
791
792 case ARG_DEFAULT_STD_ERROR:
60f067b4
JS
793 r = exec_output_from_string(optarg);
794 if (r < 0) {
663996b3
MS
795 log_error("Failed to parse default standard error output setting %s.", optarg);
796 return r;
797 } else
798 arg_default_std_error = r;
799 break;
800
801 case ARG_UNIT:
802
60f067b4 803 r = set_default_unit(optarg);
f47781d8
MP
804 if (r < 0)
805 return log_error_errno(r, "Failed to set default unit %s: %m", optarg);
663996b3
MS
806
807 break;
808
809 case ARG_SYSTEM:
810 arg_running_as = SYSTEMD_SYSTEM;
811 break;
812
813 case ARG_USER:
814 arg_running_as = SYSTEMD_USER;
815 break;
816
817 case ARG_TEST:
818 arg_action = ACTION_TEST;
5eef597e
MP
819 if (arg_no_pager < 0)
820 arg_no_pager = true;
821 break;
822
823 case ARG_NO_PAGER:
824 arg_no_pager = true;
663996b3
MS
825 break;
826
827 case ARG_VERSION:
828 arg_action = ACTION_VERSION;
829 break;
830
831 case ARG_DUMP_CONFIGURATION_ITEMS:
832 arg_action = ACTION_DUMP_CONFIGURATION_ITEMS;
833 break;
834
835 case ARG_DUMP_CORE:
836 r = optarg ? parse_boolean(optarg) : 1;
837 if (r < 0) {
838 log_error("Failed to parse dump core boolean %s.", optarg);
839 return r;
840 }
841 arg_dump_core = r;
842 break;
843
844 case ARG_CRASH_SHELL:
845 r = optarg ? parse_boolean(optarg) : 1;
846 if (r < 0) {
847 log_error("Failed to parse crash shell boolean %s.", optarg);
848 return r;
849 }
850 arg_crash_shell = r;
851 break;
852
853 case ARG_CONFIRM_SPAWN:
854 r = optarg ? parse_boolean(optarg) : 1;
855 if (r < 0) {
856 log_error("Failed to parse confirm spawn boolean %s.", optarg);
857 return r;
858 }
859 arg_confirm_spawn = r;
860 break;
861
862 case ARG_SHOW_STATUS:
60f067b4
JS
863 if (optarg) {
864 r = parse_show_status(optarg, &arg_show_status);
865 if (r < 0) {
866 log_error("Failed to parse show status boolean %s.", optarg);
867 return r;
868 }
869 } else
870 arg_show_status = SHOW_STATUS_YES;
663996b3
MS
871 break;
872
873 case ARG_DESERIALIZE: {
874 int fd;
875 FILE *f;
876
877 r = safe_atoi(optarg, &fd);
878 if (r < 0 || fd < 0) {
879 log_error("Failed to parse deserialize option %s.", optarg);
880 return r < 0 ? r : -EINVAL;
881 }
882
883 fd_cloexec(fd, true);
884
885 f = fdopen(fd, "r");
f47781d8
MP
886 if (!f)
887 return log_error_errno(errno, "Failed to open serialization fd: %m");
663996b3 888
60f067b4
JS
889 if (arg_serialization)
890 fclose(arg_serialization);
663996b3 891
60f067b4 892 arg_serialization = f;
663996b3
MS
893
894 break;
895 }
896
897 case ARG_SWITCHED_ROOT:
898 arg_switched_root = true;
899 break;
900
663996b3
MS
901 case 'h':
902 arg_action = ACTION_HELP;
5eef597e
MP
903 if (arg_no_pager < 0)
904 arg_no_pager = true;
663996b3
MS
905 break;
906
907 case 'D':
908 log_set_max_level(LOG_DEBUG);
909 break;
910
911 case 'b':
912 case 's':
913 case 'z':
914 /* Just to eat away the sysvinit kernel
915 * cmdline args without getopt() error
916 * messages that we'll parse in
917 * parse_proc_cmdline_word() or ignore. */
918
919 case '?':
5eef597e 920 if (getpid() != 1)
663996b3 921 return -EINVAL;
5eef597e
MP
922 else
923 return 0;
663996b3 924
5eef597e
MP
925 default:
926 assert_not_reached("Unhandled option code.");
663996b3
MS
927 }
928
929 if (optind < argc && getpid() != 1) {
930 /* Hmm, when we aren't run as init system
931 * let's complain about excess arguments */
932
933 log_error("Excess arguments.");
934 return -EINVAL;
935 }
936
663996b3
MS
937 return 0;
938}
939
940static int help(void) {
941
942 printf("%s [OPTIONS...]\n\n"
943 "Starts up and maintains the system or user services.\n\n"
944 " -h --help Show this help\n"
945 " --test Determine startup sequence, dump it and exit\n"
5eef597e 946 " --no-pager Do not pipe output into a pager\n"
663996b3 947 " --dump-configuration-items Dump understood unit configuration items\n"
663996b3
MS
948 " --unit=UNIT Set default unit\n"
949 " --system Run a system instance, even if PID != 1\n"
950 " --user Run a user instance\n"
951 " --dump-core[=0|1] Dump core on crash\n"
952 " --crash-shell[=0|1] Run shell on crash\n"
953 " --confirm-spawn[=0|1] Ask for confirmation when spawning processes\n"
954 " --show-status[=0|1] Show status updates on the console during bootup\n"
5eef597e 955 " --log-target=TARGET Set log target (console, journal, kmsg, journal-or-kmsg, null)\n"
663996b3
MS
956 " --log-level=LEVEL Set log level (debug, info, notice, warning, err, crit, alert, emerg)\n"
957 " --log-color[=0|1] Highlight important log messages\n"
958 " --log-location[=0|1] Include code location in log messages\n"
959 " --default-standard-output= Set default standard output for services\n"
960 " --default-standard-error= Set default standard error output for services\n",
961 program_invocation_short_name);
962
963 return 0;
964}
965
966static int version(void) {
967 puts(PACKAGE_STRING);
968 puts(SYSTEMD_FEATURES);
969
970 return 0;
971}
972
973static int prepare_reexecute(Manager *m, FILE **_f, FDSet **_fds, bool switching_root) {
974 FILE *f = NULL;
975 FDSet *fds = NULL;
976 int r;
977
978 assert(m);
979 assert(_f);
980 assert(_fds);
981
663996b3
MS
982 r = manager_open_serialization(m, &f);
983 if (r < 0) {
f47781d8 984 log_error_errno(r, "Failed to create serialization file: %m");
663996b3
MS
985 goto fail;
986 }
987
14228c0d
MB
988 /* Make sure nothing is really destructed when we shut down */
989 m->n_reloading ++;
60f067b4 990 bus_manager_send_reloading(m, true);
14228c0d 991
663996b3
MS
992 fds = fdset_new();
993 if (!fds) {
994 r = -ENOMEM;
f47781d8 995 log_error_errno(r, "Failed to allocate fd set: %m");
663996b3
MS
996 goto fail;
997 }
998
999 r = manager_serialize(m, f, fds, switching_root);
1000 if (r < 0) {
f47781d8 1001 log_error_errno(r, "Failed to serialize state: %m");
663996b3
MS
1002 goto fail;
1003 }
1004
1005 if (fseeko(f, 0, SEEK_SET) < 0) {
f47781d8 1006 log_error_errno(errno, "Failed to rewind serialization fd: %m");
663996b3
MS
1007 goto fail;
1008 }
1009
1010 r = fd_cloexec(fileno(f), false);
1011 if (r < 0) {
f47781d8 1012 log_error_errno(r, "Failed to disable O_CLOEXEC for serialization: %m");
663996b3
MS
1013 goto fail;
1014 }
1015
1016 r = fdset_cloexec(fds, false);
1017 if (r < 0) {
f47781d8 1018 log_error_errno(r, "Failed to disable O_CLOEXEC for serialization fds: %m");
663996b3
MS
1019 goto fail;
1020 }
1021
1022 *_f = f;
1023 *_fds = fds;
1024
1025 return 0;
1026
1027fail:
1028 fdset_free(fds);
1029
1030 if (f)
1031 fclose(f);
1032
1033 return r;
1034}
1035
1036static int bump_rlimit_nofile(struct rlimit *saved_rlimit) {
1037 struct rlimit nl;
1038 int r;
1039
1040 assert(saved_rlimit);
1041
1042 /* Save the original RLIMIT_NOFILE so that we can reset it
1043 * later when transitioning from the initrd to the main
1044 * systemd or suchlike. */
f47781d8
MP
1045 if (getrlimit(RLIMIT_NOFILE, saved_rlimit) < 0)
1046 return log_error_errno(errno, "Reading RLIMIT_NOFILE failed: %m");
663996b3
MS
1047
1048 /* Make sure forked processes get the default kernel setting */
1049 if (!arg_default_rlimit[RLIMIT_NOFILE]) {
1050 struct rlimit *rl;
1051
1052 rl = newdup(struct rlimit, saved_rlimit, 1);
1053 if (!rl)
1054 return log_oom();
1055
1056 arg_default_rlimit[RLIMIT_NOFILE] = rl;
1057 }
1058
1059 /* Bump up the resource limit for ourselves substantially */
1060 nl.rlim_cur = nl.rlim_max = 64*1024;
1061 r = setrlimit_closest(RLIMIT_NOFILE, &nl);
f47781d8
MP
1062 if (r < 0)
1063 return log_error_errno(r, "Setting RLIMIT_NOFILE failed: %m");
663996b3
MS
1064
1065 return 0;
1066}
1067
663996b3 1068static void test_mtab(void) {
663996b3 1069
e842803a
MB
1070 static const char ok[] =
1071 "/proc/self/mounts\0"
1072 "/proc/mounts\0"
1073 "../proc/self/mounts\0"
1074 "../proc/mounts\0";
663996b3 1075
e842803a
MB
1076 _cleanup_free_ char *p = NULL;
1077 int r;
663996b3 1078
e842803a
MB
1079 /* Check that /etc/mtab is a symlink to the right place or
1080 * non-existing. But certainly not a file, or a symlink to
1081 * some weird place... */
663996b3 1082
e842803a
MB
1083 r = readlink_malloc("/etc/mtab", &p);
1084 if (r == -ENOENT)
1085 return;
1086 if (r >= 0 && nulstr_contains(ok, p))
1087 return;
663996b3
MS
1088
1089 log_warning("/etc/mtab is not a symlink or not pointing to /proc/self/mounts. "
1090 "This is not supported anymore. "
1091 "Please make sure to replace this file by a symlink to avoid incorrect or misleading mount(8) output.");
1092}
1093
1094static void test_usr(void) {
1095
1096 /* Check that /usr is not a separate fs */
1097
1098 if (dir_is_empty("/usr") <= 0)
1099 return;
1100
1101 log_warning("/usr appears to be on its own filesytem and is not already mounted. This is not a supported setup. "
1102 "Some things will probably break (sometimes even silently) in mysterious ways. "
1103 "Consult http://freedesktop.org/wiki/Software/systemd/separate-usr-is-broken for more information.");
1104}
1105
663996b3
MS
1106static int initialize_join_controllers(void) {
1107 /* By default, mount "cpu" + "cpuacct" together, and "net_cls"
1108 * + "net_prio". We'd like to add "cpuset" to the mix, but
1109 * "cpuset" does't really work for groups with no initialized
1110 * attributes. */
1111
1112 arg_join_controllers = new(char**, 3);
1113 if (!arg_join_controllers)
1114 return -ENOMEM;
1115
1116 arg_join_controllers[0] = strv_new("cpu", "cpuacct", NULL);
1117 arg_join_controllers[1] = strv_new("net_cls", "net_prio", NULL);
1118 arg_join_controllers[2] = NULL;
1119
1120 if (!arg_join_controllers[0] || !arg_join_controllers[1]) {
1121 free_join_controllers();
1122 return -ENOMEM;
1123 }
1124
1125 return 0;
1126}
1127
60f067b4
JS
1128static int enforce_syscall_archs(Set *archs) {
1129#ifdef HAVE_SECCOMP
1130 scmp_filter_ctx *seccomp;
1131 Iterator i;
1132 void *id;
1133 int r;
1134
1135 seccomp = seccomp_init(SCMP_ACT_ALLOW);
1136 if (!seccomp)
1137 return log_oom();
1138
1139 SET_FOREACH(id, arg_syscall_archs, i) {
1140 r = seccomp_arch_add(seccomp, PTR_TO_UINT32(id) - 1);
1141 if (r == -EEXIST)
1142 continue;
1143 if (r < 0) {
f47781d8 1144 log_error_errno(r, "Failed to add architecture to seccomp: %m");
60f067b4
JS
1145 goto finish;
1146 }
1147 }
1148
1149 r = seccomp_attr_set(seccomp, SCMP_FLTATR_CTL_NNP, 0);
1150 if (r < 0) {
f47781d8 1151 log_error_errno(r, "Failed to unset NO_NEW_PRIVS: %m");
60f067b4
JS
1152 goto finish;
1153 }
1154
1155 r = seccomp_load(seccomp);
1156 if (r < 0)
f47781d8 1157 log_error_errno(r, "Failed to add install architecture seccomp: %m");
60f067b4
JS
1158
1159finish:
1160 seccomp_release(seccomp);
1161 return r;
1162#else
1163 return 0;
1164#endif
1165}
1166
1167static int status_welcome(void) {
1168 _cleanup_free_ char *pretty_name = NULL, *ansi_color = NULL;
1169 int r;
1170
1171 r = parse_env_file("/etc/os-release", NEWLINE,
1172 "PRETTY_NAME", &pretty_name,
1173 "ANSI_COLOR", &ansi_color,
1174 NULL);
e842803a
MB
1175 if (r == -ENOENT) {
1176 r = parse_env_file("/usr/lib/os-release", NEWLINE,
1177 "PRETTY_NAME", &pretty_name,
1178 "ANSI_COLOR", &ansi_color,
1179 NULL);
1180 }
60f067b4
JS
1181
1182 if (r < 0 && r != -ENOENT)
f47781d8 1183 log_warning_errno(r, "Failed to read os-release file: %m");
60f067b4
JS
1184
1185 return status_printf(NULL, false, false,
1186 "\nWelcome to \x1B[%sm%s\x1B[0m!\n",
1187 isempty(ansi_color) ? "1" : ansi_color,
1188 isempty(pretty_name) ? "Linux" : pretty_name);
1189}
1190
1191static int write_container_id(void) {
1192 const char *c;
1193
1194 c = getenv("container");
1195 if (isempty(c))
1196 return 0;
1197
1198 return write_string_file("/run/systemd/container", c);
1199}
1200
663996b3
MS
1201int main(int argc, char *argv[]) {
1202 Manager *m = NULL;
1203 int r, retval = EXIT_FAILURE;
1204 usec_t before_startup, after_startup;
1205 char timespan[FORMAT_TIMESPAN_MAX];
1206 FDSet *fds = NULL;
1207 bool reexecute = false;
1208 const char *shutdown_verb = NULL;
1209 dual_timestamp initrd_timestamp = { 0ULL, 0ULL };
1210 dual_timestamp userspace_timestamp = { 0ULL, 0ULL };
1211 dual_timestamp kernel_timestamp = { 0ULL, 0ULL };
60f067b4
JS
1212 dual_timestamp security_start_timestamp = { 0ULL, 0ULL };
1213 dual_timestamp security_finish_timestamp = { 0ULL, 0ULL };
663996b3
MS
1214 static char systemd[] = "systemd";
1215 bool skip_setup = false;
60f067b4 1216 unsigned j;
663996b3
MS
1217 bool loaded_policy = false;
1218 bool arm_reboot_watchdog = false;
1219 bool queue_default_job = false;
e842803a 1220 bool empty_etc = false;
663996b3
MS
1221 char *switch_root_dir = NULL, *switch_root_init = NULL;
1222 static struct rlimit saved_rlimit_nofile = { 0, 0 };
f47781d8 1223 const char *error_message = NULL;
663996b3
MS
1224
1225#ifdef HAVE_SYSV_COMPAT
1226 if (getpid() != 1 && strstr(program_invocation_short_name, "init")) {
1227 /* This is compatibility support for SysV, where
1228 * calling init as a user is identical to telinit. */
1229
1230 errno = -ENOENT;
1231 execv(SYSTEMCTL_BINARY_PATH, argv);
f47781d8 1232 log_error_errno(errno, "Failed to exec " SYSTEMCTL_BINARY_PATH ": %m");
663996b3
MS
1233 return 1;
1234 }
1235#endif
1236
1237 dual_timestamp_from_monotonic(&kernel_timestamp, 0);
1238 dual_timestamp_get(&userspace_timestamp);
1239
1240 /* Determine if this is a reexecution or normal bootup. We do
1241 * the full command line parsing much later, so let's just
1242 * have a quick peek here. */
1243 if (strv_find(argv+1, "--deserialize"))
1244 skip_setup = true;
1245
1246 /* If we have switched root, do all the special setup
1247 * things */
1248 if (strv_find(argv+1, "--switched-root"))
1249 skip_setup = false;
1250
1251 /* If we get started via the /sbin/init symlink then we are
1252 called 'init'. After a subsequent reexecution we are then
1253 called 'systemd'. That is confusing, hence let's call us
1254 systemd right-away. */
1255 program_invocation_short_name = systemd;
1256 prctl(PR_SET_NAME, systemd);
1257
1258 saved_argv = argv;
1259 saved_argc = argc;
1260
1261 log_show_color(isatty(STDERR_FILENO) > 0);
5eef597e 1262 log_set_upgrade_syslog_to_journal(true);
663996b3 1263
14228c0d
MB
1264 /* Disable the umask logic */
1265 if (getpid() == 1)
1266 umask(0);
1267
663996b3 1268 if (getpid() == 1 && detect_container(NULL) <= 0) {
14228c0d 1269
663996b3
MS
1270 /* Running outside of a container as PID 1 */
1271 arg_running_as = SYSTEMD_SYSTEM;
1272 make_null_stdio();
1273 log_set_target(LOG_TARGET_KMSG);
1274 log_open();
1275
14228c0d 1276 if (in_initrd())
663996b3 1277 initrd_timestamp = userspace_timestamp;
663996b3
MS
1278
1279 if (!skip_setup) {
1280 mount_setup_early();
60f067b4 1281 dual_timestamp_get(&security_start_timestamp);
f47781d8
MP
1282 if (mac_selinux_setup(&loaded_policy) < 0) {
1283 error_message = "Failed to load SELinux policy";
663996b3 1284 goto finish;
f47781d8
MP
1285 } else if (ima_setup() < 0) {
1286 error_message = "Failed to load IMA policy";
663996b3 1287 goto finish;
f47781d8
MP
1288 } else if (mac_smack_setup(&loaded_policy) < 0) {
1289 error_message = "Failed to load SMACK policy";
663996b3 1290 goto finish;
f47781d8 1291 }
60f067b4 1292 dual_timestamp_get(&security_finish_timestamp);
663996b3
MS
1293 }
1294
f47781d8
MP
1295 if (mac_selinux_init(NULL) < 0) {
1296 error_message = "Failed to initialize SELinux policy";
663996b3 1297 goto finish;
f47781d8 1298 }
663996b3
MS
1299
1300 if (!skip_setup) {
60f067b4 1301 if (clock_is_localtime() > 0) {
663996b3
MS
1302 int min;
1303
5eef597e
MP
1304 /*
1305 * The very first call of settimeofday() also does a time warp in the kernel.
1306 *
1307 * In the rtc-in-local time mode, we set the kernel's timezone, and rely on
1308 * external tools to take care of maintaining the RTC and do all adjustments.
1309 * This matches the behavior of Windows, which leaves the RTC alone if the
1310 * registry tells that the RTC runs in UTC.
1311 */
60f067b4 1312 r = clock_set_timezone(&min);
663996b3 1313 if (r < 0)
f47781d8 1314 log_error_errno(r, "Failed to apply local time delta, ignoring: %m");
663996b3
MS
1315 else
1316 log_info("RTC configured in localtime, applying delta of %i minutes to system time.", min);
1317 } else if (!in_initrd()) {
1318 /*
5eef597e 1319 * Do a dummy very first call to seal the kernel's time warp magic.
663996b3
MS
1320 *
1321 * Do not call this this from inside the initrd. The initrd might not
1322 * carry /etc/adjtime with LOCAL, but the real system could be set up
1323 * that way. In such case, we need to delay the time-warp or the sealing
1324 * until we reach the real system.
5eef597e
MP
1325 *
1326 * Do no set the kernel's timezone. The concept of local time cannot
1327 * be supported reliably, the time will jump or be incorrect at every daylight
1328 * saving time change. All kernel local time concepts will be treated
1329 * as UTC that way.
663996b3 1330 */
5eef597e 1331 clock_reset_timewarp();
663996b3
MS
1332 }
1333 }
1334
1335 /* Set the default for later on, but don't actually
1336 * open the logs like this for now. Note that if we
1337 * are transitioning from the initrd there might still
1338 * be journal fd open, and we shouldn't attempt
1339 * opening that before we parsed /proc/cmdline which
1340 * might redirect output elsewhere. */
1341 log_set_target(LOG_TARGET_JOURNAL_OR_KMSG);
1342
1343 } else if (getpid() == 1) {
1344 /* Running inside a container, as PID 1 */
1345 arg_running_as = SYSTEMD_SYSTEM;
1346 log_set_target(LOG_TARGET_CONSOLE);
60f067b4 1347 log_close_console(); /* force reopen of /dev/console */
663996b3
MS
1348 log_open();
1349
1350 /* For the later on, see above... */
1351 log_set_target(LOG_TARGET_JOURNAL);
1352
1353 /* clear the kernel timestamp,
1354 * because we are in a container */
1355 kernel_timestamp.monotonic = 0ULL;
1356 kernel_timestamp.realtime = 0ULL;
1357
1358 } else {
1359 /* Running as user instance */
1360 arg_running_as = SYSTEMD_USER;
1361 log_set_target(LOG_TARGET_AUTO);
1362 log_open();
1363
1364 /* clear the kernel timestamp,
1365 * because we are not PID 1 */
1366 kernel_timestamp.monotonic = 0ULL;
1367 kernel_timestamp.realtime = 0ULL;
1368 }
1369
1370 /* Initialize default unit */
1371 r = set_default_unit(SPECIAL_DEFAULT_TARGET);
1372 if (r < 0) {
f47781d8
MP
1373 log_emergency_errno(r, "Failed to set default unit %s: %m", SPECIAL_DEFAULT_TARGET);
1374 error_message = "Failed to set default unit";
663996b3
MS
1375 goto finish;
1376 }
1377
1378 r = initialize_join_controllers();
f47781d8
MP
1379 if (r < 0) {
1380 error_message = "Failed to initalize cgroup controllers";
663996b3 1381 goto finish;
f47781d8 1382 }
663996b3
MS
1383
1384 /* Mount /proc, /sys and friends, so that /proc/cmdline and
1385 * /proc/$PID/fd is available. */
1386 if (getpid() == 1) {
f47781d8
MP
1387
1388 /* Load the kernel modules early, so that we kdbus.ko is loaded before kdbusfs shall be mounted */
1389 if (!skip_setup)
1390 kmod_setup();
1391
663996b3 1392 r = mount_setup(loaded_policy);
f47781d8
MP
1393 if (r < 0) {
1394 error_message = "Failed to mount API filesystems";
663996b3 1395 goto finish;
f47781d8 1396 }
663996b3
MS
1397 }
1398
1399 /* Reset all signal handlers. */
1400 assert_se(reset_all_signal_handlers() == 0);
1401
663996b3
MS
1402 ignore_signals(SIGNALS_IGNORE, -1);
1403
f47781d8
MP
1404 if (parse_config_file() < 0) {
1405 error_message = "Failed to parse config file";
663996b3 1406 goto finish;
f47781d8 1407 }
663996b3 1408
f47781d8
MP
1409 if (arg_running_as == SYSTEMD_SYSTEM) {
1410 r = parse_proc_cmdline(parse_proc_cmdline_item);
1411 if (r < 0)
1412 log_warning_errno(r, "Failed to parse kernel command line, ignoring: %m");
1413 }
663996b3 1414
5eef597e
MP
1415 /* Note that this also parses bits from the kernel command
1416 * line, including "debug". */
663996b3
MS
1417 log_parse_environment();
1418
f47781d8
MP
1419 if (parse_argv(argc, argv) < 0) {
1420 error_message = "Failed to parse commandline arguments";
663996b3 1421 goto finish;
f47781d8 1422 }
663996b3
MS
1423
1424 if (arg_action == ACTION_TEST &&
1425 geteuid() == 0) {
1426 log_error("Don't run test mode as root.");
1427 goto finish;
1428 }
1429
1430 if (arg_running_as == SYSTEMD_USER &&
1431 arg_action == ACTION_RUN &&
1432 sd_booted() <= 0) {
1433 log_error("Trying to run as user instance, but the system has not been booted with systemd.");
1434 goto finish;
1435 }
1436
1437 if (arg_running_as == SYSTEMD_SYSTEM &&
1438 arg_action == ACTION_RUN &&
1439 running_in_chroot() > 0) {
1440 log_error("Cannot be run in a chroot() environment.");
1441 goto finish;
1442 }
1443
5eef597e
MP
1444 if (arg_action == ACTION_TEST)
1445 skip_setup = true;
1446
1447 pager_open_if_enabled();
1448
663996b3
MS
1449 if (arg_action == ACTION_HELP) {
1450 retval = help();
1451 goto finish;
1452 } else if (arg_action == ACTION_VERSION) {
1453 retval = version();
1454 goto finish;
1455 } else if (arg_action == ACTION_DUMP_CONFIGURATION_ITEMS) {
1456 unit_dump_config_items(stdout);
1457 retval = EXIT_SUCCESS;
1458 goto finish;
1459 } else if (arg_action == ACTION_DONE) {
1460 retval = EXIT_SUCCESS;
1461 goto finish;
1462 }
1463
60f067b4
JS
1464 if (arg_running_as == SYSTEMD_USER &&
1465 !getenv("XDG_RUNTIME_DIR")) {
1466 log_error("Trying to run as user instance, but $XDG_RUNTIME_DIR is not set.");
1467 goto finish;
1468 }
1469
663996b3
MS
1470 assert_se(arg_action == ACTION_RUN || arg_action == ACTION_TEST);
1471
1472 /* Close logging fds, in order not to confuse fdset below */
1473 log_close();
1474
1475 /* Remember open file descriptors for later deserialization */
1476 r = fdset_new_fill(&fds);
1477 if (r < 0) {
f47781d8
MP
1478 log_emergency_errno(r, "Failed to allocate fd set: %m");
1479 error_message = "Failed to allocate fd set";
663996b3
MS
1480 goto finish;
1481 } else
1482 fdset_cloexec(fds, true);
1483
60f067b4
JS
1484 if (arg_serialization)
1485 assert_se(fdset_remove(fds, fileno(arg_serialization)) >= 0);
663996b3 1486
14228c0d 1487 if (arg_running_as == SYSTEMD_SYSTEM)
663996b3
MS
1488 /* Become a session leader if we aren't one yet. */
1489 setsid();
1490
14228c0d
MB
1491 /* Move out of the way, so that we won't block unmounts */
1492 assert_se(chdir("/") == 0);
663996b3 1493
663996b3
MS
1494 /* Reset the console, but only if this is really init and we
1495 * are freshly booted */
5eef597e
MP
1496 if (arg_running_as == SYSTEMD_SYSTEM && arg_action == ACTION_RUN) {
1497
1498 /* If we are init, we connect stdin/stdout/stderr to
1499 * /dev/null and make sure we don't have a controlling
1500 * tty. */
1501 release_terminal();
1502
1503 if (getpid() == 1 && !skip_setup)
1504 console_setup();
1505 }
663996b3
MS
1506
1507 /* Open the logging devices, if possible and necessary */
1508 log_open();
1509
60f067b4
JS
1510 if (arg_show_status == _SHOW_STATUS_UNSET)
1511 arg_show_status = SHOW_STATUS_YES;
1512
663996b3
MS
1513 /* Make sure we leave a core dump without panicing the
1514 * kernel. */
1515 if (getpid() == 1) {
1516 install_crash_handler();
1517
1518 r = mount_cgroup_controllers(arg_join_controllers);
1519 if (r < 0)
1520 goto finish;
1521 }
1522
1523 if (arg_running_as == SYSTEMD_SYSTEM) {
1524 const char *virtualization = NULL;
1525
5eef597e
MP
1526 log_info(PACKAGE_STRING " running in %ssystem mode. (" SYSTEMD_FEATURES ")",
1527 arg_action == ACTION_TEST ? "test " : "" );
663996b3
MS
1528
1529 detect_virtualization(&virtualization);
1530 if (virtualization)
1531 log_info("Detected virtualization '%s'.", virtualization);
1532
60f067b4
JS
1533 write_container_id();
1534
1535 log_info("Detected architecture '%s'.", architecture_to_string(uname_architecture()));
1536
663996b3
MS
1537 if (in_initrd())
1538 log_info("Running in initial RAM disk.");
1539
5eef597e
MP
1540 /* Let's check whether /etc is already populated. We
1541 * don't actually really check for that, but use
1542 * /etc/machine-id as flag file. This allows container
1543 * managers and installers to provision a couple of
1544 * files already. If the container manager wants to
1545 * provision the machine ID itself it should pass
1546 * $container_uuid to PID 1.*/
1547
1548 empty_etc = access("/etc/machine-id", F_OK) < 0;
e842803a
MB
1549 if (empty_etc)
1550 log_info("Running with unpopulated /etc.");
60f067b4 1551 } else {
e842803a
MB
1552 _cleanup_free_ char *t;
1553
1554 t = uid_to_name(getuid());
5eef597e
MP
1555 log_debug(PACKAGE_STRING " running in %suser mode for user "UID_FMT"/%s. (" SYSTEMD_FEATURES ")",
1556 arg_action == ACTION_TEST ? " test" : "", getuid(), t);
60f067b4 1557 }
663996b3
MS
1558
1559 if (arg_running_as == SYSTEMD_SYSTEM && !skip_setup) {
60f067b4 1560 if (arg_show_status > 0 || plymouth_running())
663996b3
MS
1561 status_welcome();
1562
663996b3 1563 hostname_setup();
e842803a 1564 machine_id_setup(NULL);
663996b3
MS
1565 loopback_setup();
1566
1567 test_mtab();
1568 test_usr();
663996b3
MS
1569 }
1570
1571 if (arg_running_as == SYSTEMD_SYSTEM && arg_runtime_watchdog > 0)
1572 watchdog_set_timeout(&arg_runtime_watchdog);
1573
5eef597e 1574 if (arg_timer_slack_nsec != NSEC_INFINITY)
663996b3 1575 if (prctl(PR_SET_TIMERSLACK, arg_timer_slack_nsec) < 0)
f47781d8 1576 log_error_errno(errno, "Failed to adjust timer slack: %m");
663996b3
MS
1577
1578 if (arg_capability_bounding_set_drop) {
14228c0d 1579 r = capability_bounding_set_drop_usermode(arg_capability_bounding_set_drop);
663996b3 1580 if (r < 0) {
f47781d8
MP
1581 log_emergency_errno(r, "Failed to drop capability bounding set of usermode helpers: %m");
1582 error_message = "Failed to drop capability bounding set of usermode helpers";
663996b3
MS
1583 goto finish;
1584 }
14228c0d 1585 r = capability_bounding_set_drop(arg_capability_bounding_set_drop, true);
663996b3 1586 if (r < 0) {
f47781d8
MP
1587 log_emergency_errno(r, "Failed to drop capability bounding set: %m");
1588 error_message = "Failed to drop capability bounding set";
663996b3
MS
1589 goto finish;
1590 }
1591 }
1592
60f067b4
JS
1593 if (arg_syscall_archs) {
1594 r = enforce_syscall_archs(arg_syscall_archs);
f47781d8
MP
1595 if (r < 0) {
1596 error_message = "Failed to set syscall architectures";
60f067b4 1597 goto finish;
f47781d8 1598 }
60f067b4
JS
1599 }
1600
663996b3
MS
1601 if (arg_running_as == SYSTEMD_USER) {
1602 /* Become reaper of our children */
1603 if (prctl(PR_SET_CHILD_SUBREAPER, 1) < 0) {
f47781d8 1604 log_warning_errno(errno, "Failed to make us a subreaper: %m");
663996b3
MS
1605 if (errno == EINVAL)
1606 log_info("Perhaps the kernel version is too old (< 3.4?)");
1607 }
1608 }
1609
e842803a 1610 if (arg_running_as == SYSTEMD_SYSTEM) {
663996b3
MS
1611 bump_rlimit_nofile(&saved_rlimit_nofile);
1612
e842803a
MB
1613 if (empty_etc) {
1614 r = unit_file_preset_all(UNIT_FILE_SYSTEM, false, NULL, UNIT_FILE_PRESET_FULL, false, NULL, 0);
1615 if (r < 0)
f47781d8 1616 log_warning_errno(r, "Failed to populate /etc with preset unit settings, ignoring: %m");
e842803a
MB
1617 else
1618 log_info("Populated /etc with preset unit settings.");
1619 }
1620 }
1621
5eef597e 1622 r = manager_new(arg_running_as, arg_action == ACTION_TEST, &m);
663996b3 1623 if (r < 0) {
f47781d8
MP
1624 log_emergency_errno(r, "Failed to allocate manager object: %m");
1625 error_message = "Failed to allocate manager object";
663996b3
MS
1626 goto finish;
1627 }
1628
1629 m->confirm_spawn = arg_confirm_spawn;
60f067b4 1630 m->default_timer_accuracy_usec = arg_default_timer_accuracy_usec;
663996b3
MS
1631 m->default_std_output = arg_default_std_output;
1632 m->default_std_error = arg_default_std_error;
60f067b4
JS
1633 m->default_restart_usec = arg_default_restart_usec;
1634 m->default_timeout_start_usec = arg_default_timeout_start_usec;
1635 m->default_timeout_stop_usec = arg_default_timeout_stop_usec;
1636 m->default_start_limit_interval = arg_default_start_limit_interval;
1637 m->default_start_limit_burst = arg_default_start_limit_burst;
1638 m->default_cpu_accounting = arg_default_cpu_accounting;
1639 m->default_blockio_accounting = arg_default_blockio_accounting;
1640 m->default_memory_accounting = arg_default_memory_accounting;
663996b3
MS
1641 m->runtime_watchdog = arg_runtime_watchdog;
1642 m->shutdown_watchdog = arg_shutdown_watchdog;
5eef597e 1643
663996b3
MS
1644 m->userspace_timestamp = userspace_timestamp;
1645 m->kernel_timestamp = kernel_timestamp;
663996b3 1646 m->initrd_timestamp = initrd_timestamp;
60f067b4
JS
1647 m->security_start_timestamp = security_start_timestamp;
1648 m->security_finish_timestamp = security_finish_timestamp;
663996b3
MS
1649
1650 manager_set_default_rlimits(m, arg_default_rlimit);
60f067b4 1651 manager_environment_add(m, NULL, arg_default_environment);
663996b3 1652 manager_set_show_status(m, arg_show_status);
5eef597e 1653 manager_set_first_boot(m, empty_etc);
663996b3
MS
1654
1655 /* Remember whether we should queue the default job */
60f067b4 1656 queue_default_job = !arg_serialization || arg_switched_root;
663996b3
MS
1657
1658 before_startup = now(CLOCK_MONOTONIC);
1659
60f067b4 1660 r = manager_startup(m, arg_serialization, fds);
663996b3 1661 if (r < 0)
f47781d8 1662 log_error_errno(r, "Failed to fully start up daemon: %m");
663996b3
MS
1663
1664 /* This will close all file descriptors that were opened, but
1665 * not claimed by any unit. */
1666 fdset_free(fds);
14228c0d 1667 fds = NULL;
663996b3 1668
60f067b4
JS
1669 if (arg_serialization) {
1670 fclose(arg_serialization);
1671 arg_serialization = NULL;
663996b3
MS
1672 }
1673
1674 if (queue_default_job) {
60f067b4 1675 _cleanup_bus_error_free_ sd_bus_error error = SD_BUS_ERROR_NULL;
663996b3
MS
1676 Unit *target = NULL;
1677 Job *default_unit_job;
1678
663996b3
MS
1679 log_debug("Activating default unit: %s", arg_default_unit);
1680
1681 r = manager_load_unit(m, arg_default_unit, NULL, &error, &target);
60f067b4
JS
1682 if (r < 0)
1683 log_error("Failed to load default target: %s", bus_error_message(&error, r));
1684 else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND)
f47781d8 1685 log_error_errno(target->load_error, "Failed to load default target: %m");
663996b3
MS
1686 else if (target->load_state == UNIT_MASKED)
1687 log_error("Default target masked.");
1688
1689 if (!target || target->load_state != UNIT_LOADED) {
1690 log_info("Trying to load rescue target...");
1691
1692 r = manager_load_unit(m, SPECIAL_RESCUE_TARGET, NULL, &error, &target);
1693 if (r < 0) {
f47781d8
MP
1694 log_emergency("Failed to load rescue target: %s", bus_error_message(&error, r));
1695 error_message = "Failed to load rescue target";
663996b3 1696 goto finish;
14228c0d 1697 } else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND) {
f47781d8
MP
1698 log_emergency_errno(target->load_error, "Failed to load rescue target: %m");
1699 error_message = "Failed to load rescue target";
663996b3
MS
1700 goto finish;
1701 } else if (target->load_state == UNIT_MASKED) {
f47781d8
MP
1702 log_emergency("Rescue target masked.");
1703 error_message = "Rescue target masked";
663996b3
MS
1704 goto finish;
1705 }
1706 }
1707
1708 assert(target->load_state == UNIT_LOADED);
1709
1710 if (arg_action == ACTION_TEST) {
1711 printf("-> By units:\n");
1712 manager_dump_units(m, stdout, "\t");
1713 }
1714
1715 r = manager_add_job(m, JOB_START, target, JOB_ISOLATE, false, &error, &default_unit_job);
1716 if (r == -EPERM) {
60f067b4 1717 log_debug("Default target could not be isolated, starting instead: %s", bus_error_message(&error, r));
663996b3
MS
1718
1719 r = manager_add_job(m, JOB_START, target, JOB_REPLACE, false, &error, &default_unit_job);
1720 if (r < 0) {
f47781d8
MP
1721 log_emergency("Failed to start default target: %s", bus_error_message(&error, r));
1722 error_message = "Failed to start default target";
663996b3
MS
1723 goto finish;
1724 }
1725 } else if (r < 0) {
f47781d8
MP
1726 log_emergency("Failed to isolate default target: %s", bus_error_message(&error, r));
1727 error_message = "Failed to isolate default target";
663996b3
MS
1728 goto finish;
1729 }
1730
1731 m->default_unit_job_id = default_unit_job->id;
1732
1733 after_startup = now(CLOCK_MONOTONIC);
1734 log_full(arg_action == ACTION_TEST ? LOG_INFO : LOG_DEBUG,
1735 "Loaded units and determined initial transaction in %s.",
5eef597e 1736 format_timespan(timespan, sizeof(timespan), after_startup - before_startup, 100 * USEC_PER_MSEC));
663996b3
MS
1737
1738 if (arg_action == ACTION_TEST) {
1739 printf("-> By jobs:\n");
1740 manager_dump_jobs(m, stdout, "\t");
1741 retval = EXIT_SUCCESS;
1742 goto finish;
1743 }
1744 }
1745
1746 for (;;) {
1747 r = manager_loop(m);
1748 if (r < 0) {
f47781d8
MP
1749 log_emergency_errno(r, "Failed to run main loop: %m");
1750 error_message = "Failed to run main loop";
663996b3
MS
1751 goto finish;
1752 }
1753
1754 switch (m->exit_code) {
1755
1756 case MANAGER_EXIT:
1757 retval = EXIT_SUCCESS;
1758 log_debug("Exit.");
1759 goto finish;
1760
1761 case MANAGER_RELOAD:
1762 log_info("Reloading.");
1763 r = manager_reload(m);
1764 if (r < 0)
f47781d8 1765 log_error_errno(r, "Failed to reload: %m");
663996b3
MS
1766 break;
1767
1768 case MANAGER_REEXECUTE:
1769
f47781d8
MP
1770 if (prepare_reexecute(m, &arg_serialization, &fds, false) < 0) {
1771 error_message = "Failed to prepare for reexection";
663996b3 1772 goto finish;
f47781d8 1773 }
663996b3
MS
1774
1775 reexecute = true;
1776 log_notice("Reexecuting.");
1777 goto finish;
1778
1779 case MANAGER_SWITCH_ROOT:
1780 /* Steal the switch root parameters */
1781 switch_root_dir = m->switch_root;
1782 switch_root_init = m->switch_root_init;
1783 m->switch_root = m->switch_root_init = NULL;
1784
1785 if (!switch_root_init)
f47781d8
MP
1786 if (prepare_reexecute(m, &arg_serialization, &fds, true) < 0) {
1787 error_message = "Failed to prepare for reexection";
663996b3 1788 goto finish;
f47781d8 1789 }
663996b3
MS
1790
1791 reexecute = true;
1792 log_notice("Switching root.");
1793 goto finish;
1794
1795 case MANAGER_REBOOT:
1796 case MANAGER_POWEROFF:
1797 case MANAGER_HALT:
1798 case MANAGER_KEXEC: {
1799 static const char * const table[_MANAGER_EXIT_CODE_MAX] = {
1800 [MANAGER_REBOOT] = "reboot",
1801 [MANAGER_POWEROFF] = "poweroff",
1802 [MANAGER_HALT] = "halt",
1803 [MANAGER_KEXEC] = "kexec"
1804 };
1805
1806 assert_se(shutdown_verb = table[m->exit_code]);
1807 arm_reboot_watchdog = m->exit_code == MANAGER_REBOOT;
1808
1809 log_notice("Shutting down.");
1810 goto finish;
1811 }
1812
1813 default:
1814 assert_not_reached("Unknown exit code.");
1815 }
1816 }
1817
1818finish:
5eef597e
MP
1819 pager_close();
1820
f47781d8 1821 m = manager_free(m);
663996b3 1822
60f067b4 1823 for (j = 0; j < ELEMENTSOF(arg_default_rlimit); j++) {
663996b3 1824 free(arg_default_rlimit[j]);
60f067b4
JS
1825 arg_default_rlimit[j] = NULL;
1826 }
663996b3
MS
1827
1828 free(arg_default_unit);
60f067b4
JS
1829 arg_default_unit = NULL;
1830
663996b3
MS
1831 free_join_controllers();
1832
60f067b4
JS
1833 strv_free(arg_default_environment);
1834 arg_default_environment = NULL;
1835
1836 set_free(arg_syscall_archs);
1837 arg_syscall_archs = NULL;
1838
5eef597e 1839 mac_selinux_finish();
663996b3
MS
1840
1841 if (reexecute) {
1842 const char **args;
1843 unsigned i, args_size;
1844
1845 /* Close and disarm the watchdog, so that the new
1846 * instance can reinitialize it, but doesn't get
1847 * rebooted while we do that */
1848 watchdog_close(true);
1849
1850 /* Reset the RLIMIT_NOFILE to the kernel default, so
1851 * that the new systemd can pass the kernel default to
1852 * its child processes */
1853 if (saved_rlimit_nofile.rlim_cur > 0)
1854 setrlimit(RLIMIT_NOFILE, &saved_rlimit_nofile);
1855
1856 if (switch_root_dir) {
1857 /* Kill all remaining processes from the
1858 * initrd, but don't wait for them, so that we
1859 * can handle the SIGCHLD for them after
1860 * deserializing. */
60f067b4 1861 broadcast_signal(SIGTERM, false, true);
663996b3 1862
5eef597e
MP
1863 /* And switch root with MS_MOVE, because we remove the old directory afterwards and detach it. */
1864 r = switch_root(switch_root_dir, "/mnt", true, MS_MOVE);
663996b3 1865 if (r < 0)
f47781d8 1866 log_error_errno(r, "Failed to switch root, trying to continue: %m");
663996b3
MS
1867 }
1868
1869 args_size = MAX(6, argc+1);
1870 args = newa(const char*, args_size);
1871
1872 if (!switch_root_init) {
1873 char sfd[16];
1874
1875 /* First try to spawn ourselves with the right
1876 * path, and with full serialization. We do
1877 * this only if the user didn't specify an
1878 * explicit init to spawn. */
1879
60f067b4 1880 assert(arg_serialization);
663996b3
MS
1881 assert(fds);
1882
60f067b4 1883 snprintf(sfd, sizeof(sfd), "%i", fileno(arg_serialization));
663996b3
MS
1884 char_array_0(sfd);
1885
1886 i = 0;
1887 args[i++] = SYSTEMD_BINARY_PATH;
1888 if (switch_root_dir)
1889 args[i++] = "--switched-root";
1890 args[i++] = arg_running_as == SYSTEMD_SYSTEM ? "--system" : "--user";
1891 args[i++] = "--deserialize";
1892 args[i++] = sfd;
1893 args[i++] = NULL;
1894
14228c0d
MB
1895 /* do not pass along the environment we inherit from the kernel or initrd */
1896 if (switch_root_dir)
1897 clearenv();
1898
663996b3
MS
1899 assert(i <= args_size);
1900 execv(args[0], (char* const*) args);
1901 }
1902
1903 /* Try the fallback, if there is any, without any
1904 * serialization. We pass the original argv[] and
1905 * envp[]. (Well, modulo the ordering changes due to
1906 * getopt() in argv[], and some cleanups in envp[],
1907 * but let's hope that doesn't matter.) */
1908
60f067b4
JS
1909 if (arg_serialization) {
1910 fclose(arg_serialization);
1911 arg_serialization = NULL;
663996b3
MS
1912 }
1913
1914 if (fds) {
1915 fdset_free(fds);
1916 fds = NULL;
1917 }
1918
1919 /* Reopen the console */
1920 make_console_stdio();
1921
60f067b4 1922 for (j = 1, i = 1; j < (unsigned) argc; j++)
663996b3
MS
1923 args[i++] = argv[j];
1924 args[i++] = NULL;
1925 assert(i <= args_size);
1926
5eef597e 1927 /* Reenable any blocked signals, especially important
e842803a
MB
1928 * if we switch from initial ramdisk to init=... */
1929 reset_all_signal_handlers();
5eef597e 1930 reset_signal_mask();
e842803a 1931
663996b3
MS
1932 if (switch_root_init) {
1933 args[0] = switch_root_init;
1934 execv(args[0], (char* const*) args);
f47781d8 1935 log_warning_errno(errno, "Failed to execute configured init, trying fallback: %m");
663996b3
MS
1936 }
1937
1938 args[0] = "/sbin/init";
1939 execv(args[0], (char* const*) args);
1940
1941 if (errno == ENOENT) {
1942 log_warning("No /sbin/init, trying fallback");
1943
1944 args[0] = "/bin/sh";
1945 args[1] = NULL;
1946 execv(args[0], (char* const*) args);
f47781d8 1947 log_error_errno(errno, "Failed to execute /bin/sh, giving up: %m");
663996b3 1948 } else
f47781d8 1949 log_warning_errno(errno, "Failed to execute /sbin/init, giving up: %m");
663996b3
MS
1950 }
1951
60f067b4
JS
1952 if (arg_serialization) {
1953 fclose(arg_serialization);
1954 arg_serialization = NULL;
1955 }
663996b3 1956
60f067b4 1957 if (fds) {
663996b3 1958 fdset_free(fds);
60f067b4
JS
1959 fds = NULL;
1960 }
1961
1962#ifdef HAVE_VALGRIND_VALGRIND_H
1963 /* If we are PID 1 and running under valgrind, then let's exit
1964 * here explicitly. valgrind will only generate nice output on
1965 * exit(), not on exec(), hence let's do the former not the
1966 * latter here. */
1967 if (getpid() == 1 && RUNNING_ON_VALGRIND)
1968 return 0;
1969#endif
663996b3
MS
1970
1971 if (shutdown_verb) {
60f067b4
JS
1972 char log_level[DECIMAL_STR_MAX(int) + 1];
1973 const char* command_line[9] = {
663996b3
MS
1974 SYSTEMD_SHUTDOWN_BINARY_PATH,
1975 shutdown_verb,
60f067b4
JS
1976 "--log-level", log_level,
1977 "--log-target",
1978 };
1979 unsigned pos = 5;
1980 _cleanup_strv_free_ char **env_block = NULL;
1981
1982 assert(command_line[pos] == NULL);
1983 env_block = strv_copy(environ);
1984
1985 snprintf(log_level, sizeof(log_level), "%d", log_get_max_level());
1986
1987 switch (log_get_target()) {
1988 case LOG_TARGET_KMSG:
1989 case LOG_TARGET_JOURNAL_OR_KMSG:
1990 case LOG_TARGET_SYSLOG_OR_KMSG:
1991 command_line[pos++] = "kmsg";
1992 break;
1993
1994 case LOG_TARGET_CONSOLE:
1995 default:
1996 command_line[pos++] = "console";
1997 break;
663996b3 1998 };
60f067b4
JS
1999
2000 if (log_get_show_color())
2001 command_line[pos++] = "--log-color";
2002
2003 if (log_get_show_location())
2004 command_line[pos++] = "--log-location";
2005
2006 assert(pos < ELEMENTSOF(command_line));
663996b3
MS
2007
2008 if (arm_reboot_watchdog && arg_shutdown_watchdog > 0) {
60f067b4 2009 char *e;
663996b3
MS
2010
2011 /* If we reboot let's set the shutdown
2012 * watchdog and tell the shutdown binary to
2013 * repeatedly ping it */
2014 watchdog_set_timeout(&arg_shutdown_watchdog);
2015 watchdog_close(false);
2016
60f067b4
JS
2017 /* Tell the binary how often to ping, ignore failure */
2018 if (asprintf(&e, "WATCHDOG_USEC="USEC_FMT, arg_shutdown_watchdog) > 0)
2019 strv_push(&env_block, e);
2020 } else
663996b3 2021 watchdog_close(true);
663996b3 2022
14228c0d
MB
2023 /* Avoid the creation of new processes forked by the
2024 * kernel; at this point, we will not listen to the
2025 * signals anyway */
2026 if (detect_container(NULL) <= 0)
2027 cg_uninstall_release_agent(SYSTEMD_CGROUP_CONTROLLER);
2028
663996b3 2029 execve(SYSTEMD_SHUTDOWN_BINARY_PATH, (char **) command_line, env_block);
f47781d8 2030 log_error_errno(errno, "Failed to execute shutdown binary, %s: %m",
60f067b4 2031 getpid() == 1 ? "freezing" : "quitting");
663996b3
MS
2032 }
2033
f47781d8
MP
2034 if (getpid() == 1) {
2035 if (error_message)
2036 manager_status_printf(NULL, STATUS_TYPE_EMERGENCY,
2037 ANSI_HIGHLIGHT_RED_ON "!!!!!!" ANSI_HIGHLIGHT_OFF,
2038 "%s, freezing.", error_message);
663996b3 2039 freeze();
f47781d8 2040 }
663996b3
MS
2041
2042 return retval;
2043}