]> git.proxmox.com Git - systemd.git/blame - src/core/main.c
Imported Upstream version 227
[systemd.git] / src / core / main.c
CommitLineData
663996b3
MS
1/*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
2
3/***
4 This file is part of systemd.
5
6 Copyright 2010 Lennart Poettering
7
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
11 (at your option) any later version.
12
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 Lesser General Public License for more details.
17
18 You should have received a copy of the GNU Lesser General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
20***/
21
663996b3 22#include <errno.h>
6300502b 23#include <fcntl.h>
663996b3
MS
24#include <getopt.h>
25#include <signal.h>
6300502b
MP
26#include <stdio.h>
27#include <string.h>
663996b3 28#include <sys/mount.h>
6300502b
MP
29#include <sys/prctl.h>
30#include <sys/reboot.h>
31#include <sys/stat.h>
32#include <unistd.h>
60f067b4
JS
33#ifdef HAVE_SECCOMP
34#include <seccomp.h>
35#endif
6300502b
MP
36#ifdef HAVE_VALGRIND_VALGRIND_H
37#include <valgrind/valgrind.h>
38#endif
60f067b4
JS
39
40#include "sd-daemon.h"
60f067b4 41#include "sd-bus.h"
6300502b 42
60f067b4 43#include "architecture.h"
6300502b
MP
44#include "build.h"
45#include "bus-error.h"
46#include "bus-util.h"
663996b3 47#include "capability.h"
60f067b4 48#include "clock-util.h"
6300502b
MP
49#include "conf-parser.h"
50#include "cpu-set-util.h"
51#include "dbus-manager.h"
52#include "def.h"
53#include "env-util.h"
54#include "fdset.h"
60f067b4 55#include "fileio.h"
86f210e9 56#include "formats-util.h"
6300502b
MP
57#include "hostname-setup.h"
58#include "ima-setup.h"
59#include "killall.h"
60#include "kmod-setup.h"
e735f4d4 61#include "load-fragment.h"
6300502b 62#include "log.h"
663996b3 63#include "loopback-setup.h"
663996b3 64#include "machine-id-setup.h"
6300502b
MP
65#include "manager.h"
66#include "missing.h"
67#include "mount-setup.h"
68#include "pager.h"
69#include "process-util.h"
663996b3 70#include "selinux-setup.h"
6300502b
MP
71#include "selinux-util.h"
72#include "signal-util.h"
663996b3 73#include "smack-setup.h"
6300502b
MP
74#include "special.h"
75#include "strv.h"
76#include "switch-root.h"
77#include "terminal-util.h"
78#include "virt.h"
79#include "watchdog.h"
663996b3
MS
80
81static enum {
82 ACTION_RUN,
83 ACTION_HELP,
84 ACTION_VERSION,
85 ACTION_TEST,
86 ACTION_DUMP_CONFIGURATION_ITEMS,
87 ACTION_DONE
88} arg_action = ACTION_RUN;
663996b3 89static char *arg_default_unit = NULL;
e3bff60a 90static ManagerRunningAs arg_running_as = _MANAGER_RUNNING_AS_INVALID;
663996b3 91static bool arg_dump_core = true;
663996b3 92static int arg_crash_chvt = -1;
6300502b
MP
93static bool arg_crash_shell = false;
94static bool arg_crash_reboot = false;
663996b3 95static bool arg_confirm_spawn = false;
60f067b4 96static ShowStatus arg_show_status = _SHOW_STATUS_UNSET;
663996b3 97static bool arg_switched_root = false;
5eef597e 98static int arg_no_pager = -1;
663996b3
MS
99static char ***arg_join_controllers = NULL;
100static ExecOutput arg_default_std_output = EXEC_OUTPUT_JOURNAL;
101static ExecOutput arg_default_std_error = EXEC_OUTPUT_INHERIT;
60f067b4
JS
102static usec_t arg_default_restart_usec = DEFAULT_RESTART_USEC;
103static usec_t arg_default_timeout_start_usec = DEFAULT_TIMEOUT_USEC;
104static usec_t arg_default_timeout_stop_usec = DEFAULT_TIMEOUT_USEC;
105static usec_t arg_default_start_limit_interval = DEFAULT_START_LIMIT_INTERVAL;
106static unsigned arg_default_start_limit_burst = DEFAULT_START_LIMIT_BURST;
663996b3
MS
107static usec_t arg_runtime_watchdog = 0;
108static usec_t arg_shutdown_watchdog = 10 * USEC_PER_MINUTE;
14228c0d 109static char **arg_default_environment = NULL;
60f067b4 110static struct rlimit *arg_default_rlimit[_RLIMIT_MAX] = {};
663996b3 111static uint64_t arg_capability_bounding_set_drop = 0;
5eef597e 112static nsec_t arg_timer_slack_nsec = NSEC_INFINITY;
60f067b4
JS
113static usec_t arg_default_timer_accuracy_usec = 1 * USEC_PER_MINUTE;
114static Set* arg_syscall_archs = NULL;
115static FILE* arg_serialization = NULL;
116static bool arg_default_cpu_accounting = false;
117static bool arg_default_blockio_accounting = false;
118static bool arg_default_memory_accounting = false;
6300502b 119static bool arg_default_tasks_accounting = false;
663996b3 120
5eef597e
MP
121static void pager_open_if_enabled(void) {
122
123 if (arg_no_pager <= 0)
124 return;
125
126 pager_open(false);
127}
128
6300502b
MP
129noreturn static void freeze_or_reboot(void) {
130
131 if (arg_crash_reboot) {
132 log_notice("Rebooting in 10s...");
133 (void) sleep(10);
134
135 log_notice("Rebooting now...");
136 (void) reboot(RB_AUTOBOOT);
137 log_emergency_errno(errno, "Failed to reboot: %m");
138 }
139
140 log_emergency("Freezing execution.");
141 freeze();
142}
143
60f067b4 144noreturn static void crash(int sig) {
6300502b
MP
145 struct sigaction sa;
146 pid_t pid;
663996b3 147
14228c0d
MB
148 if (getpid() != 1)
149 /* Pass this on immediately, if this is not PID 1 */
6300502b 150 (void) raise(sig);
14228c0d 151 else if (!arg_dump_core)
f47781d8 152 log_emergency("Caught <%s>, not dumping core.", signal_to_string(sig));
663996b3 153 else {
6300502b
MP
154 sa = (struct sigaction) {
155 .sa_handler = nop_signal_handler,
663996b3
MS
156 .sa_flags = SA_NOCLDSTOP|SA_RESTART,
157 };
663996b3
MS
158
159 /* We want to wait for the core process, hence let's enable SIGCHLD */
6300502b 160 (void) sigaction(SIGCHLD, &sa, NULL);
663996b3 161
e735f4d4 162 pid = raw_clone(SIGCHLD, NULL);
663996b3 163 if (pid < 0)
f47781d8 164 log_emergency_errno(errno, "Caught <%s>, cannot fork for core dump: %m", signal_to_string(sig));
663996b3 165 else if (pid == 0) {
6300502b
MP
166 struct rlimit rl = {
167 .rlim_cur = RLIM_INFINITY,
168 .rlim_max = RLIM_INFINITY,
169 };
663996b3
MS
170
171 /* Enable default signal handler for core dump */
6300502b
MP
172 sa = (struct sigaction) {
173 .sa_handler = SIG_DFL,
174 };
175 (void) sigaction(sig, &sa, NULL);
663996b3
MS
176
177 /* Don't limit the core dump size */
6300502b 178 (void) setrlimit(RLIMIT_CORE, &rl);
663996b3
MS
179
180 /* Just to be sure... */
e3bff60a 181 (void) chdir("/");
663996b3
MS
182
183 /* Raise the signal again */
e735f4d4 184 pid = raw_getpid();
6300502b 185 (void) kill(pid, sig); /* raise() would kill the parent */
663996b3
MS
186
187 assert_not_reached("We shouldn't be here...");
6300502b 188 _exit(EXIT_FAILURE);
663996b3
MS
189 } else {
190 siginfo_t status;
191 int r;
192
193 /* Order things nicely. */
194 r = wait_for_terminate(pid, &status);
195 if (r < 0)
f47781d8 196 log_emergency_errno(r, "Caught <%s>, waitpid() failed: %m", signal_to_string(sig));
663996b3 197 else if (status.si_code != CLD_DUMPED)
e735f4d4
MP
198 log_emergency("Caught <%s>, core dump failed (child "PID_FMT", code=%s, status=%i/%s).",
199 signal_to_string(sig),
200 pid, sigchld_code_to_string(status.si_code),
201 status.si_status,
202 strna(status.si_code == CLD_EXITED
203 ? exit_status_to_string(status.si_status, EXIT_STATUS_FULL)
204 : signal_to_string(status.si_status)));
663996b3 205 else
f47781d8 206 log_emergency("Caught <%s>, dumped core as pid "PID_FMT".", signal_to_string(sig), pid);
663996b3
MS
207 }
208 }
209
6300502b
MP
210 if (arg_crash_chvt >= 0)
211 (void) chvt(arg_crash_chvt);
663996b3 212
6300502b
MP
213 sa = (struct sigaction) {
214 .sa_handler = SIG_IGN,
215 .sa_flags = SA_NOCLDSTOP|SA_NOCLDWAIT|SA_RESTART,
216 };
663996b3 217
6300502b
MP
218 /* Let the kernel reap children for us */
219 (void) sigaction(SIGCHLD, &sa, NULL);
663996b3 220
6300502b
MP
221 if (arg_crash_shell) {
222 log_notice("Executing crash shell in 10s...");
223 (void) sleep(10);
663996b3 224
e735f4d4 225 pid = raw_clone(SIGCHLD, NULL);
663996b3 226 if (pid < 0)
f47781d8 227 log_emergency_errno(errno, "Failed to fork off crash shell: %m");
663996b3 228 else if (pid == 0) {
6300502b
MP
229 (void) setsid();
230 (void) make_console_stdio();
231 (void) execle("/bin/sh", "/bin/sh", NULL, environ);
663996b3 232
e735f4d4 233 log_emergency_errno(errno, "execle() failed: %m");
6300502b
MP
234 _exit(EXIT_FAILURE);
235 } else {
236 log_info("Spawned crash shell as PID "PID_FMT".", pid);
237 (void) wait_for_terminate(pid, NULL);
238 }
663996b3
MS
239 }
240
6300502b 241 freeze_or_reboot();
663996b3
MS
242}
243
244static void install_crash_handler(void) {
e735f4d4 245 static const struct sigaction sa = {
663996b3 246 .sa_handler = crash,
e735f4d4 247 .sa_flags = SA_NODEFER, /* So that we can raise the signal again from the signal handler */
663996b3 248 };
e735f4d4 249 int r;
663996b3 250
e735f4d4
MP
251 /* We ignore the return value here, since, we don't mind if we
252 * cannot set up a crash handler */
253 r = sigaction_many(&sa, SIGNALS_CRASH_HANDLER, -1);
254 if (r < 0)
255 log_debug_errno(r, "I had trouble setting up the crash handler, ignoring: %m");
663996b3
MS
256}
257
5eef597e
MP
258static int console_setup(void) {
259 _cleanup_close_ int tty_fd = -1;
260 int r;
663996b3
MS
261
262 tty_fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
f47781d8
MP
263 if (tty_fd < 0)
264 return log_error_errno(tty_fd, "Failed to open /dev/console: %m");
663996b3 265
5eef597e
MP
266 /* We don't want to force text mode. plymouth may be showing
267 * pictures already from initrd. */
663996b3 268 r = reset_terminal_fd(tty_fd, false);
f47781d8
MP
269 if (r < 0)
270 return log_error_errno(r, "Failed to reset /dev/console: %m");
663996b3 271
5eef597e 272 return 0;
663996b3
MS
273}
274
6300502b
MP
275static int parse_crash_chvt(const char *value) {
276 int b;
663996b3 277
6300502b
MP
278 if (safe_atoi(value, &arg_crash_chvt) >= 0)
279 return 0;
663996b3 280
6300502b
MP
281 b = parse_boolean(value);
282 if (b < 0)
283 return b;
663996b3 284
6300502b
MP
285 if (b > 0)
286 arg_crash_chvt = 0; /* switch to where kmsg goes */
287 else
288 arg_crash_chvt = -1; /* turn off switching */
663996b3
MS
289
290 return 0;
291}
292
60f067b4 293static int parse_proc_cmdline_item(const char *key, const char *value) {
663996b3
MS
294
295 static const char * const rlmap[] = {
296 "emergency", SPECIAL_EMERGENCY_TARGET,
297 "-b", SPECIAL_EMERGENCY_TARGET,
5eef597e 298 "rescue", SPECIAL_RESCUE_TARGET,
663996b3
MS
299 "single", SPECIAL_RESCUE_TARGET,
300 "-s", SPECIAL_RESCUE_TARGET,
301 "s", SPECIAL_RESCUE_TARGET,
302 "S", SPECIAL_RESCUE_TARGET,
303 "1", SPECIAL_RESCUE_TARGET,
e3bff60a
MP
304 "2", SPECIAL_MULTI_USER_TARGET,
305 "3", SPECIAL_MULTI_USER_TARGET,
306 "4", SPECIAL_MULTI_USER_TARGET,
307 "5", SPECIAL_GRAPHICAL_TARGET,
663996b3 308 };
60f067b4 309 int r;
663996b3 310
60f067b4 311 assert(key);
663996b3 312
60f067b4 313 if (streq(key, "systemd.unit") && value) {
663996b3
MS
314
315 if (!in_initrd())
6300502b 316 return free_and_strdup(&arg_default_unit, value);
663996b3 317
60f067b4 318 } else if (streq(key, "rd.systemd.unit") && value) {
663996b3 319
e842803a 320 if (in_initrd())
6300502b 321 return free_and_strdup(&arg_default_unit, value);
663996b3 322
60f067b4 323 } else if (streq(key, "systemd.dump_core") && value) {
663996b3 324
60f067b4
JS
325 r = parse_boolean(value);
326 if (r < 0)
327 log_warning("Failed to parse dump core switch %s. Ignoring.", value);
663996b3
MS
328 else
329 arg_dump_core = r;
330
6300502b
MP
331 } else if (streq(key, "systemd.crash_chvt") && value) {
332
333 if (parse_crash_chvt(value) < 0)
334 log_warning("Failed to parse crash chvt switch %s. Ignoring.", value);
335
60f067b4 336 } else if (streq(key, "systemd.crash_shell") && value) {
663996b3 337
60f067b4
JS
338 r = parse_boolean(value);
339 if (r < 0)
340 log_warning("Failed to parse crash shell switch %s. Ignoring.", value);
663996b3
MS
341 else
342 arg_crash_shell = r;
343
6300502b 344 } else if (streq(key, "systemd.crash_reboot") && value) {
663996b3 345
6300502b
MP
346 r = parse_boolean(value);
347 if (r < 0)
348 log_warning("Failed to parse crash reboot switch %s. Ignoring.", value);
663996b3 349 else
6300502b 350 arg_crash_reboot = r;
663996b3 351
60f067b4 352 } else if (streq(key, "systemd.confirm_spawn") && value) {
663996b3 353
60f067b4
JS
354 r = parse_boolean(value);
355 if (r < 0)
356 log_warning("Failed to parse confirm spawn switch %s. Ignoring.", value);
663996b3 357 else
60f067b4 358 arg_confirm_spawn = r;
663996b3 359
60f067b4 360 } else if (streq(key, "systemd.show_status") && value) {
663996b3 361
60f067b4
JS
362 r = parse_show_status(value, &arg_show_status);
363 if (r < 0)
364 log_warning("Failed to parse show status switch %s. Ignoring.", value);
365
366 } else if (streq(key, "systemd.default_standard_output") && value) {
663996b3 367
60f067b4
JS
368 r = exec_output_from_string(value);
369 if (r < 0)
370 log_warning("Failed to parse default standard output switch %s. Ignoring.", value);
663996b3
MS
371 else
372 arg_default_std_output = r;
663996b3 373
60f067b4
JS
374 } else if (streq(key, "systemd.default_standard_error") && value) {
375
376 r = exec_output_from_string(value);
377 if (r < 0)
378 log_warning("Failed to parse default standard error switch %s. Ignoring.", value);
663996b3
MS
379 else
380 arg_default_std_error = r;
663996b3 381
60f067b4 382 } else if (streq(key, "systemd.setenv") && value) {
663996b3 383
60f067b4 384 if (env_assignment_is_valid(value)) {
14228c0d
MB
385 char **env;
386
60f067b4 387 env = strv_env_set(arg_default_environment, value);
14228c0d
MB
388 if (env)
389 arg_default_environment = env;
390 else
f47781d8 391 log_warning_errno(ENOMEM, "Setting environment variable '%s' failed, ignoring: %m", value);
14228c0d 392 } else
60f067b4 393 log_warning("Environment variable name '%s' is not valid. Ignoring.", value);
663996b3 394
60f067b4 395 } else if (streq(key, "quiet") && !value) {
e842803a 396
60f067b4
JS
397 if (arg_show_status == _SHOW_STATUS_UNSET)
398 arg_show_status = SHOW_STATUS_AUTO;
399
400 } else if (streq(key, "debug") && !value) {
e842803a 401
5eef597e
MP
402 /* Note that log_parse_environment() handles 'debug'
403 * too, and sets the log level to LOG_DEBUG. */
e842803a 404
6300502b 405 if (detect_container() > 0)
60f067b4
JS
406 log_set_target(LOG_TARGET_CONSOLE);
407
408 } else if (!in_initrd() && !value) {
663996b3
MS
409 unsigned i;
410
411 /* SysV compatibility */
412 for (i = 0; i < ELEMENTSOF(rlmap); i += 2)
60f067b4 413 if (streq(key, rlmap[i]))
6300502b 414 return free_and_strdup(&arg_default_unit, rlmap[i+1]);
663996b3
MS
415 }
416
417 return 0;
418}
419
/* Generates a configuration parser callback called 'name' (same signature as the other callbacks
 * referenced from the table in parse_config_file()) that passes the right-hand side of the assignment
 * to func(). If func() returns a negative error a syntax warning mentioning 'descr' is logged. The
 * generated function always returns 0, i.e. invalid values are ignored rather than treated as fatal. */
#define DEFINE_SETTER(name, func, descr)                              \
        static int name(const char *unit,                             \
                        const char *filename,                         \
                        unsigned line,                                \
                        const char *section,                          \
                        unsigned section_line,                        \
                        const char *lvalue,                           \
                        int ltype,                                    \
                        const char *rvalue,                           \
                        void *data,                                   \
                        void *userdata) {                             \
                                                                      \
                int r;                                                \
                                                                      \
                assert(filename);                                     \
                assert(lvalue);                                       \
                assert(rvalue);                                       \
                                                                      \
                r = func(rvalue);                                     \
                if (r < 0)                                            \
                        /* Note the blank between the description */  \
                        /* and the quoted value. */                   \
                        log_syntax(unit, LOG_ERR, filename, line, r,  \
                                   "Invalid " descr " '%s': %m",      \
                                   rvalue);                           \
                                                                      \
                return 0;                                             \
        }

DEFINE_SETTER(config_parse_level2, log_set_max_level_from_string, "log level")
DEFINE_SETTER(config_parse_target, log_set_target_from_string, "target")
DEFINE_SETTER(config_parse_color, log_show_color_from_string, "color" )
DEFINE_SETTER(config_parse_location, log_show_location_from_string, "location")
451
60f067b4
JS
452static int config_parse_cpu_affinity2(
453 const char *unit,
454 const char *filename,
455 unsigned line,
456 const char *section,
457 unsigned section_line,
458 const char *lvalue,
459 int ltype,
460 const char *rvalue,
461 void *data,
462 void *userdata) {
663996b3 463
d9dfd233 464 _cleanup_cpu_free_ cpu_set_t *c = NULL;
6300502b 465 int ncpus;
663996b3 466
6300502b
MP
467 ncpus = parse_cpu_set_and_warn(rvalue, &c, unit, filename, line, lvalue);
468 if (ncpus < 0)
469 return ncpus;
663996b3 470
6300502b
MP
471 if (sched_setaffinity(0, CPU_ALLOC_SIZE(ncpus), c) < 0)
472 log_warning("Failed to set CPU affinity: %m");
663996b3 473
663996b3
MS
474 return 0;
475}
476
60f067b4
JS
477static int config_parse_show_status(
478 const char* unit,
479 const char *filename,
480 unsigned line,
481 const char *section,
482 unsigned section_line,
483 const char *lvalue,
484 int ltype,
485 const char *rvalue,
486 void *data,
487 void *userdata) {
488
489 int k;
490 ShowStatus *b = data;
491
492 assert(filename);
493 assert(lvalue);
494 assert(rvalue);
495 assert(data);
496
497 k = parse_show_status(rvalue, b);
498 if (k < 0) {
6300502b 499 log_syntax(unit, LOG_ERR, filename, line, k, "Failed to parse show status setting, ignoring: %s", rvalue);
60f067b4
JS
500 return 0;
501 }
502
503 return 0;
504}
505
6300502b
MP
/* Configuration parser callback for CrashChangeVT= (and the legacy CrashChVT=): feeds 'rvalue' to
 * parse_crash_chvt(), which updates arg_crash_chvt. An unparsable value is reported as syntax error and
 * otherwise ignored, hence the function always returns 0. */
static int config_parse_crash_chvt(
                const char* unit,
                const char *filename,
                unsigned line,
                const char *section,
                unsigned section_line,
                const char *lvalue,
                int ltype,
                const char *rvalue,
                void *data,
                void *userdata) {

        int k;

        assert(filename);
        assert(lvalue);
        assert(rvalue);

        k = parse_crash_chvt(rvalue);
        if (k < 0)
                log_syntax(unit, LOG_ERR, filename, line, k, "Failed to parse CrashChangeVT= setting, ignoring: %s", rvalue);

        return 0;
}
532
533static int config_parse_join_controllers(const char *unit,
534 const char *filename,
535 unsigned line,
536 const char *section,
60f067b4 537 unsigned section_line,
663996b3
MS
538 const char *lvalue,
539 int ltype,
540 const char *rvalue,
541 void *data,
542 void *userdata) {
543
d9dfd233 544 const char *whole_rvalue = rvalue;
663996b3 545 unsigned n = 0;
663996b3
MS
546
547 assert(filename);
548 assert(lvalue);
549 assert(rvalue);
550
6300502b 551 arg_join_controllers = strv_free_free(arg_join_controllers);
663996b3 552
d9dfd233
MP
553 for (;;) {
554 _cleanup_free_ char *word = NULL;
555 char **l;
556 int r;
663996b3 557
d9dfd233
MP
558 r = extract_first_word(&rvalue, &word, WHITESPACE, EXTRACT_QUOTES);
559 if (r < 0) {
560 log_syntax(unit, LOG_ERR, filename, line, r, "Invalid value for %s: %s", lvalue, whole_rvalue);
561 return r;
562 }
563 if (r == 0)
564 break;
663996b3 565
d9dfd233
MP
566 l = strv_split(word, ",");
567 if (!l)
6300502b 568 return log_oom();
663996b3
MS
569 strv_uniq(l);
570
571 if (strv_length(l) <= 1) {
572 strv_free(l);
573 continue;
574 }
575
576 if (!arg_join_controllers) {
577 arg_join_controllers = new(char**, 2);
578 if (!arg_join_controllers) {
579 strv_free(l);
580 return log_oom();
581 }
582
583 arg_join_controllers[0] = l;
584 arg_join_controllers[1] = NULL;
585
586 n = 1;
587 } else {
588 char ***a;
589 char ***t;
590
591 t = new0(char**, n+2);
592 if (!t) {
593 strv_free(l);
594 return log_oom();
595 }
596
597 n = 0;
598
599 for (a = arg_join_controllers; *a; a++) {
600
601 if (strv_overlap(*a, l)) {
6300502b 602 if (strv_extend_strv(&l, *a, false) < 0) {
663996b3
MS
603 strv_free(l);
604 strv_free_free(t);
605 return log_oom();
606 }
607
663996b3
MS
608 } else {
609 char **c;
610
611 c = strv_copy(*a);
612 if (!c) {
613 strv_free(l);
614 strv_free_free(t);
615 return log_oom();
616 }
617
618 t[n++] = c;
619 }
620 }
621
622 t[n++] = strv_uniq(l);
623
624 strv_free_free(arg_join_controllers);
625 arg_join_controllers = t;
626 }
627 }
d9dfd233 628 if (!isempty(rvalue))
6300502b 629 log_syntax(unit, LOG_ERR, filename, line, 0, "Trailing garbage, ignoring.");
663996b3
MS
630
631 return 0;
632}
633
634static int parse_config_file(void) {
635
636 const ConfigTableItem items[] = {
60f067b4
JS
637 { "Manager", "LogLevel", config_parse_level2, 0, NULL },
638 { "Manager", "LogTarget", config_parse_target, 0, NULL },
639 { "Manager", "LogColor", config_parse_color, 0, NULL },
640 { "Manager", "LogLocation", config_parse_location, 0, NULL },
641 { "Manager", "DumpCore", config_parse_bool, 0, &arg_dump_core },
6300502b
MP
642 { "Manager", "CrashChVT", /* legacy */ config_parse_crash_chvt, 0, NULL },
643 { "Manager", "CrashChangeVT", config_parse_crash_chvt, 0, NULL },
60f067b4 644 { "Manager", "CrashShell", config_parse_bool, 0, &arg_crash_shell },
6300502b 645 { "Manager", "CrashReboot", config_parse_bool, 0, &arg_crash_reboot },
60f067b4 646 { "Manager", "ShowStatus", config_parse_show_status, 0, &arg_show_status },
60f067b4
JS
647 { "Manager", "CPUAffinity", config_parse_cpu_affinity2, 0, NULL },
648 { "Manager", "JoinControllers", config_parse_join_controllers, 0, &arg_join_controllers },
649 { "Manager", "RuntimeWatchdogSec", config_parse_sec, 0, &arg_runtime_watchdog },
650 { "Manager", "ShutdownWatchdogSec", config_parse_sec, 0, &arg_shutdown_watchdog },
651 { "Manager", "CapabilityBoundingSet", config_parse_bounding_set, 0, &arg_capability_bounding_set_drop },
652#ifdef HAVE_SECCOMP
653 { "Manager", "SystemCallArchitectures", config_parse_syscall_archs, 0, &arg_syscall_archs },
654#endif
655 { "Manager", "TimerSlackNSec", config_parse_nsec, 0, &arg_timer_slack_nsec },
656 { "Manager", "DefaultTimerAccuracySec", config_parse_sec, 0, &arg_default_timer_accuracy_usec },
657 { "Manager", "DefaultStandardOutput", config_parse_output, 0, &arg_default_std_output },
658 { "Manager", "DefaultStandardError", config_parse_output, 0, &arg_default_std_error },
659 { "Manager", "DefaultTimeoutStartSec", config_parse_sec, 0, &arg_default_timeout_start_usec },
660 { "Manager", "DefaultTimeoutStopSec", config_parse_sec, 0, &arg_default_timeout_stop_usec },
661 { "Manager", "DefaultRestartSec", config_parse_sec, 0, &arg_default_restart_usec },
662 { "Manager", "DefaultStartLimitInterval", config_parse_sec, 0, &arg_default_start_limit_interval },
663 { "Manager", "DefaultStartLimitBurst", config_parse_unsigned, 0, &arg_default_start_limit_burst },
664 { "Manager", "DefaultEnvironment", config_parse_environ, 0, &arg_default_environment },
665 { "Manager", "DefaultLimitCPU", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CPU] },
666 { "Manager", "DefaultLimitFSIZE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_FSIZE] },
667 { "Manager", "DefaultLimitDATA", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_DATA] },
668 { "Manager", "DefaultLimitSTACK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_STACK] },
669 { "Manager", "DefaultLimitCORE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CORE] },
670 { "Manager", "DefaultLimitRSS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RSS] },
671 { "Manager", "DefaultLimitNOFILE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NOFILE] },
672 { "Manager", "DefaultLimitAS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_AS] },
673 { "Manager", "DefaultLimitNPROC", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NPROC] },
674 { "Manager", "DefaultLimitMEMLOCK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MEMLOCK] },
675 { "Manager", "DefaultLimitLOCKS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_LOCKS] },
676 { "Manager", "DefaultLimitSIGPENDING", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_SIGPENDING] },
677 { "Manager", "DefaultLimitMSGQUEUE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MSGQUEUE] },
678 { "Manager", "DefaultLimitNICE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NICE] },
679 { "Manager", "DefaultLimitRTPRIO", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTPRIO] },
680 { "Manager", "DefaultLimitRTTIME", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTTIME] },
681 { "Manager", "DefaultCPUAccounting", config_parse_bool, 0, &arg_default_cpu_accounting },
682 { "Manager", "DefaultBlockIOAccounting", config_parse_bool, 0, &arg_default_blockio_accounting },
683 { "Manager", "DefaultMemoryAccounting", config_parse_bool, 0, &arg_default_memory_accounting },
6300502b 684 { "Manager", "DefaultTasksAccounting", config_parse_bool, 0, &arg_default_tasks_accounting },
60f067b4 685 {}
663996b3
MS
686 };
687
f47781d8 688 const char *fn, *conf_dirs_nulstr;
663996b3 689
e3bff60a
MP
690 fn = arg_running_as == MANAGER_SYSTEM ? PKGSYSCONFDIR "/system.conf" : PKGSYSCONFDIR "/user.conf";
691 conf_dirs_nulstr = arg_running_as == MANAGER_SYSTEM ? CONF_DIRS_NULSTR("systemd/system.conf") : CONF_DIRS_NULSTR("systemd/user.conf");
f47781d8
MP
692 config_parse_many(fn, conf_dirs_nulstr, "Manager\0",
693 config_item_table_lookup, items, false, NULL);
663996b3
MS
694
695 return 0;
696}
697
7035cd9e
MP
698static void manager_set_defaults(Manager *m) {
699
700 assert(m);
701
702 m->default_timer_accuracy_usec = arg_default_timer_accuracy_usec;
703 m->default_std_output = arg_default_std_output;
704 m->default_std_error = arg_default_std_error;
705 m->default_timeout_start_usec = arg_default_timeout_start_usec;
706 m->default_timeout_stop_usec = arg_default_timeout_stop_usec;
707 m->default_restart_usec = arg_default_restart_usec;
708 m->default_start_limit_interval = arg_default_start_limit_interval;
709 m->default_start_limit_burst = arg_default_start_limit_burst;
710 m->default_cpu_accounting = arg_default_cpu_accounting;
711 m->default_blockio_accounting = arg_default_blockio_accounting;
712 m->default_memory_accounting = arg_default_memory_accounting;
6300502b 713 m->default_tasks_accounting = arg_default_tasks_accounting;
7035cd9e
MP
714
715 manager_set_default_rlimits(m, arg_default_rlimit);
716 manager_environment_add(m, NULL, arg_default_environment);
717}
718
663996b3
MS
719static int parse_argv(int argc, char *argv[]) {
720
721 enum {
722 ARG_LOG_LEVEL = 0x100,
723 ARG_LOG_TARGET,
724 ARG_LOG_COLOR,
725 ARG_LOG_LOCATION,
726 ARG_UNIT,
727 ARG_SYSTEM,
728 ARG_USER,
729 ARG_TEST,
5eef597e 730 ARG_NO_PAGER,
663996b3
MS
731 ARG_VERSION,
732 ARG_DUMP_CONFIGURATION_ITEMS,
733 ARG_DUMP_CORE,
6300502b 734 ARG_CRASH_CHVT,
663996b3 735 ARG_CRASH_SHELL,
6300502b 736 ARG_CRASH_REBOOT,
663996b3
MS
737 ARG_CONFIRM_SPAWN,
738 ARG_SHOW_STATUS,
739 ARG_DESERIALIZE,
740 ARG_SWITCHED_ROOT,
663996b3
MS
741 ARG_DEFAULT_STD_OUTPUT,
742 ARG_DEFAULT_STD_ERROR
743 };
744
745 static const struct option options[] = {
746 { "log-level", required_argument, NULL, ARG_LOG_LEVEL },
747 { "log-target", required_argument, NULL, ARG_LOG_TARGET },
748 { "log-color", optional_argument, NULL, ARG_LOG_COLOR },
749 { "log-location", optional_argument, NULL, ARG_LOG_LOCATION },
750 { "unit", required_argument, NULL, ARG_UNIT },
751 { "system", no_argument, NULL, ARG_SYSTEM },
752 { "user", no_argument, NULL, ARG_USER },
753 { "test", no_argument, NULL, ARG_TEST },
5eef597e 754 { "no-pager", no_argument, NULL, ARG_NO_PAGER },
663996b3
MS
755 { "help", no_argument, NULL, 'h' },
756 { "version", no_argument, NULL, ARG_VERSION },
757 { "dump-configuration-items", no_argument, NULL, ARG_DUMP_CONFIGURATION_ITEMS },
758 { "dump-core", optional_argument, NULL, ARG_DUMP_CORE },
6300502b 759 { "crash-chvt", required_argument, NULL, ARG_CRASH_CHVT },
663996b3 760 { "crash-shell", optional_argument, NULL, ARG_CRASH_SHELL },
6300502b 761 { "crash-reboot", optional_argument, NULL, ARG_CRASH_REBOOT },
663996b3
MS
762 { "confirm-spawn", optional_argument, NULL, ARG_CONFIRM_SPAWN },
763 { "show-status", optional_argument, NULL, ARG_SHOW_STATUS },
764 { "deserialize", required_argument, NULL, ARG_DESERIALIZE },
765 { "switched-root", no_argument, NULL, ARG_SWITCHED_ROOT },
663996b3
MS
766 { "default-standard-output", required_argument, NULL, ARG_DEFAULT_STD_OUTPUT, },
767 { "default-standard-error", required_argument, NULL, ARG_DEFAULT_STD_ERROR, },
60f067b4 768 {}
663996b3
MS
769 };
770
771 int c, r;
772
773 assert(argc >= 1);
774 assert(argv);
775
776 if (getpid() == 1)
777 opterr = 0;
778
779 while ((c = getopt_long(argc, argv, "hDbsz:", options, NULL)) >= 0)
780
781 switch (c) {
782
783 case ARG_LOG_LEVEL:
60f067b4
JS
784 r = log_set_max_level_from_string(optarg);
785 if (r < 0) {
663996b3
MS
786 log_error("Failed to parse log level %s.", optarg);
787 return r;
788 }
789
790 break;
791
792 case ARG_LOG_TARGET:
60f067b4
JS
793 r = log_set_target_from_string(optarg);
794 if (r < 0) {
663996b3
MS
795 log_error("Failed to parse log target %s.", optarg);
796 return r;
797 }
798
799 break;
800
801 case ARG_LOG_COLOR:
802
803 if (optarg) {
60f067b4
JS
804 r = log_show_color_from_string(optarg);
805 if (r < 0) {
663996b3
MS
806 log_error("Failed to parse log color setting %s.", optarg);
807 return r;
808 }
809 } else
810 log_show_color(true);
811
812 break;
813
814 case ARG_LOG_LOCATION:
663996b3 815 if (optarg) {
60f067b4
JS
816 r = log_show_location_from_string(optarg);
817 if (r < 0) {
663996b3
MS
818 log_error("Failed to parse log location setting %s.", optarg);
819 return r;
820 }
821 } else
822 log_show_location(true);
823
824 break;
825
826 case ARG_DEFAULT_STD_OUTPUT:
60f067b4
JS
827 r = exec_output_from_string(optarg);
828 if (r < 0) {
663996b3
MS
829 log_error("Failed to parse default standard output setting %s.", optarg);
830 return r;
831 } else
832 arg_default_std_output = r;
833 break;
834
835 case ARG_DEFAULT_STD_ERROR:
60f067b4
JS
836 r = exec_output_from_string(optarg);
837 if (r < 0) {
663996b3
MS
838 log_error("Failed to parse default standard error output setting %s.", optarg);
839 return r;
840 } else
841 arg_default_std_error = r;
842 break;
843
844 case ARG_UNIT:
845
6300502b 846 r = free_and_strdup(&arg_default_unit, optarg);
f47781d8
MP
847 if (r < 0)
848 return log_error_errno(r, "Failed to set default unit %s: %m", optarg);
663996b3
MS
849
850 break;
851
852 case ARG_SYSTEM:
e3bff60a 853 arg_running_as = MANAGER_SYSTEM;
663996b3
MS
854 break;
855
856 case ARG_USER:
e3bff60a 857 arg_running_as = MANAGER_USER;
663996b3
MS
858 break;
859
860 case ARG_TEST:
861 arg_action = ACTION_TEST;
5eef597e
MP
862 if (arg_no_pager < 0)
863 arg_no_pager = true;
864 break;
865
866 case ARG_NO_PAGER:
867 arg_no_pager = true;
663996b3
MS
868 break;
869
870 case ARG_VERSION:
871 arg_action = ACTION_VERSION;
872 break;
873
874 case ARG_DUMP_CONFIGURATION_ITEMS:
875 arg_action = ACTION_DUMP_CONFIGURATION_ITEMS;
876 break;
877
878 case ARG_DUMP_CORE:
6300502b
MP
879 if (!optarg)
880 arg_dump_core = true;
881 else {
882 r = parse_boolean(optarg);
883 if (r < 0)
884 return log_error_errno(r, "Failed to parse dump core boolean: %s", optarg);
885 arg_dump_core = r;
663996b3 886 }
6300502b
MP
887 break;
888
889 case ARG_CRASH_CHVT:
890 r = parse_crash_chvt(optarg);
891 if (r < 0)
892 return log_error_errno(r, "Failed to parse crash virtual terminal index: %s", optarg);
663996b3
MS
893 break;
894
895 case ARG_CRASH_SHELL:
6300502b
MP
896 if (!optarg)
897 arg_crash_shell = true;
898 else {
899 r = parse_boolean(optarg);
900 if (r < 0)
901 return log_error_errno(r, "Failed to parse crash shell boolean: %s", optarg);
902 arg_crash_shell = r;
903 }
904 break;
905
906 case ARG_CRASH_REBOOT:
907 if (!optarg)
908 arg_crash_reboot = true;
909 else {
910 r = parse_boolean(optarg);
911 if (r < 0)
912 return log_error_errno(r, "Failed to parse crash shell boolean: %s", optarg);
913 arg_crash_reboot = r;
663996b3 914 }
663996b3
MS
915 break;
916
917 case ARG_CONFIRM_SPAWN:
918 r = optarg ? parse_boolean(optarg) : 1;
919 if (r < 0) {
920 log_error("Failed to parse confirm spawn boolean %s.", optarg);
921 return r;
922 }
923 arg_confirm_spawn = r;
924 break;
925
926 case ARG_SHOW_STATUS:
60f067b4
JS
927 if (optarg) {
928 r = parse_show_status(optarg, &arg_show_status);
929 if (r < 0) {
930 log_error("Failed to parse show status boolean %s.", optarg);
931 return r;
932 }
933 } else
934 arg_show_status = SHOW_STATUS_YES;
663996b3
MS
935 break;
936
937 case ARG_DESERIALIZE: {
938 int fd;
939 FILE *f;
940
941 r = safe_atoi(optarg, &fd);
942 if (r < 0 || fd < 0) {
943 log_error("Failed to parse deserialize option %s.", optarg);
6300502b 944 return -EINVAL;
663996b3
MS
945 }
946
6300502b 947 (void) fd_cloexec(fd, true);
663996b3
MS
948
949 f = fdopen(fd, "r");
f47781d8
MP
950 if (!f)
951 return log_error_errno(errno, "Failed to open serialization fd: %m");
663996b3 952
6300502b 953 safe_fclose(arg_serialization);
60f067b4 954 arg_serialization = f;
663996b3
MS
955
956 break;
957 }
958
959 case ARG_SWITCHED_ROOT:
960 arg_switched_root = true;
961 break;
962
663996b3
MS
963 case 'h':
964 arg_action = ACTION_HELP;
5eef597e
MP
965 if (arg_no_pager < 0)
966 arg_no_pager = true;
663996b3
MS
967 break;
968
969 case 'D':
970 log_set_max_level(LOG_DEBUG);
971 break;
972
973 case 'b':
974 case 's':
975 case 'z':
976 /* Just to eat away the sysvinit kernel
977 * cmdline args without getopt() error
978 * messages that we'll parse in
979 * parse_proc_cmdline_word() or ignore. */
980
981 case '?':
5eef597e 982 if (getpid() != 1)
663996b3 983 return -EINVAL;
5eef597e
MP
984 else
985 return 0;
663996b3 986
5eef597e
MP
987 default:
988 assert_not_reached("Unhandled option code.");
663996b3
MS
989 }
990
991 if (optind < argc && getpid() != 1) {
992 /* Hmm, when we aren't run as init system
993 * let's complain about excess arguments */
994
995 log_error("Excess arguments.");
996 return -EINVAL;
997 }
998
663996b3
MS
999 return 0;
1000}
1001
1002static int help(void) {
1003
1004 printf("%s [OPTIONS...]\n\n"
1005 "Starts up and maintains the system or user services.\n\n"
1006 " -h --help Show this help\n"
1007 " --test Determine startup sequence, dump it and exit\n"
5eef597e 1008 " --no-pager Do not pipe output into a pager\n"
663996b3 1009 " --dump-configuration-items Dump understood unit configuration items\n"
663996b3
MS
1010 " --unit=UNIT Set default unit\n"
1011 " --system Run a system instance, even if PID != 1\n"
1012 " --user Run a user instance\n"
6300502b
MP
1013 " --dump-core[=BOOL] Dump core on crash\n"
1014 " --crash-vt=NR Change to specified VT on crash\n"
1015 " --crash-reboot[=BOOL] Reboot on crash\n"
1016 " --crash-shell[=BOOL] Run shell on crash\n"
1017 " --confirm-spawn[=BOOL] Ask for confirmation when spawning processes\n"
1018 " --show-status[=BOOL] Show status updates on the console during bootup\n"
5eef597e 1019 " --log-target=TARGET Set log target (console, journal, kmsg, journal-or-kmsg, null)\n"
663996b3 1020 " --log-level=LEVEL Set log level (debug, info, notice, warning, err, crit, alert, emerg)\n"
6300502b
MP
1021 " --log-color[=BOOL] Highlight important log messages\n"
1022 " --log-location[=BOOL] Include code location in log messages\n"
663996b3
MS
1023 " --default-standard-output= Set default standard output for services\n"
1024 " --default-standard-error= Set default standard error output for services\n",
1025 program_invocation_short_name);
1026
1027 return 0;
1028}
1029
663996b3 1030static int prepare_reexecute(Manager *m, FILE **_f, FDSet **_fds, bool switching_root) {
6300502b
MP
1031 _cleanup_fdset_free_ FDSet *fds = NULL;
1032 _cleanup_fclose_ FILE *f = NULL;
663996b3
MS
1033 int r;
1034
1035 assert(m);
1036 assert(_f);
1037 assert(_fds);
1038
663996b3 1039 r = manager_open_serialization(m, &f);
6300502b
MP
1040 if (r < 0)
1041 return log_error_errno(r, "Failed to create serialization file: %m");
663996b3 1042
14228c0d
MB
1043 /* Make sure nothing is really destructed when we shut down */
1044 m->n_reloading ++;
60f067b4 1045 bus_manager_send_reloading(m, true);
14228c0d 1046
663996b3 1047 fds = fdset_new();
6300502b
MP
1048 if (!fds)
1049 return log_oom();
663996b3
MS
1050
1051 r = manager_serialize(m, f, fds, switching_root);
6300502b
MP
1052 if (r < 0)
1053 return log_error_errno(r, "Failed to serialize state: %m");
663996b3 1054
6300502b
MP
1055 if (fseeko(f, 0, SEEK_SET) == (off_t) -1)
1056 return log_error_errno(errno, "Failed to rewind serialization fd: %m");
663996b3
MS
1057
1058 r = fd_cloexec(fileno(f), false);
6300502b
MP
1059 if (r < 0)
1060 return log_error_errno(r, "Failed to disable O_CLOEXEC for serialization: %m");
663996b3
MS
1061
1062 r = fdset_cloexec(fds, false);
6300502b
MP
1063 if (r < 0)
1064 return log_error_errno(r, "Failed to disable O_CLOEXEC for serialization fds: %m");
663996b3
MS
1065
1066 *_f = f;
1067 *_fds = fds;
1068
6300502b
MP
1069 f = NULL;
1070 fds = NULL;
663996b3 1071
6300502b 1072 return 0;
663996b3
MS
1073}
1074
1075static int bump_rlimit_nofile(struct rlimit *saved_rlimit) {
1076 struct rlimit nl;
1077 int r;
1078
1079 assert(saved_rlimit);
1080
1081 /* Save the original RLIMIT_NOFILE so that we can reset it
1082 * later when transitioning from the initrd to the main
1083 * systemd or suchlike. */
f47781d8
MP
1084 if (getrlimit(RLIMIT_NOFILE, saved_rlimit) < 0)
1085 return log_error_errno(errno, "Reading RLIMIT_NOFILE failed: %m");
663996b3
MS
1086
1087 /* Make sure forked processes get the default kernel setting */
1088 if (!arg_default_rlimit[RLIMIT_NOFILE]) {
1089 struct rlimit *rl;
1090
1091 rl = newdup(struct rlimit, saved_rlimit, 1);
1092 if (!rl)
1093 return log_oom();
1094
1095 arg_default_rlimit[RLIMIT_NOFILE] = rl;
1096 }
1097
1098 /* Bump up the resource limit for ourselves substantially */
1099 nl.rlim_cur = nl.rlim_max = 64*1024;
1100 r = setrlimit_closest(RLIMIT_NOFILE, &nl);
f47781d8
MP
1101 if (r < 0)
1102 return log_error_errno(r, "Setting RLIMIT_NOFILE failed: %m");
663996b3
MS
1103
1104 return 0;
1105}
1106
663996b3 1107static void test_mtab(void) {
663996b3 1108
e842803a
MB
1109 static const char ok[] =
1110 "/proc/self/mounts\0"
1111 "/proc/mounts\0"
1112 "../proc/self/mounts\0"
1113 "../proc/mounts\0";
663996b3 1114
e842803a
MB
1115 _cleanup_free_ char *p = NULL;
1116 int r;
663996b3 1117
e842803a
MB
1118 /* Check that /etc/mtab is a symlink to the right place or
1119 * non-existing. But certainly not a file, or a symlink to
1120 * some weird place... */
663996b3 1121
e842803a
MB
1122 r = readlink_malloc("/etc/mtab", &p);
1123 if (r == -ENOENT)
1124 return;
1125 if (r >= 0 && nulstr_contains(ok, p))
1126 return;
663996b3 1127
6300502b
MP
1128 log_error("/etc/mtab is not a symlink or not pointing to /proc/self/mounts. "
1129 "This is not supported anymore. "
1130 "Please replace /etc/mtab with a symlink to /proc/self/mounts.");
1131 freeze_or_reboot();
663996b3
MS
1132}
1133
/* Warns if /usr looks like a separate file system that is not mounted yet.
 *
 * The heuristic is simply whether dir_is_empty("/usr") reports a positive
 * result; a zero or negative (error) result is silently accepted. */
static void test_usr(void) {

        /* Check that /usr is not a separate fs */

        if (dir_is_empty("/usr") > 0)
                log_warning("/usr appears to be on its own filesystem and is not already mounted. This is not a supported setup. "
                            "Some things will probably break (sometimes even silently) in mysterious ways. "
                            "Consult http://freedesktop.org/wiki/Software/systemd/separate-usr-is-broken for more information.");
}
1145
663996b3
MS
1146static int initialize_join_controllers(void) {
1147 /* By default, mount "cpu" + "cpuacct" together, and "net_cls"
1148 * + "net_prio". We'd like to add "cpuset" to the mix, but
e735f4d4 1149 * "cpuset" doesn't really work for groups with no initialized
663996b3
MS
1150 * attributes. */
1151
1152 arg_join_controllers = new(char**, 3);
1153 if (!arg_join_controllers)
1154 return -ENOMEM;
1155
1156 arg_join_controllers[0] = strv_new("cpu", "cpuacct", NULL);
6300502b
MP
1157 if (!arg_join_controllers[0])
1158 goto oom;
663996b3 1159
6300502b
MP
1160 arg_join_controllers[1] = strv_new("net_cls", "net_prio", NULL);
1161 if (!arg_join_controllers[1])
1162 goto oom;
663996b3 1163
6300502b 1164 arg_join_controllers[2] = NULL;
663996b3 1165 return 0;
6300502b
MP
1166
1167oom:
1168 arg_join_controllers = strv_free_free(arg_join_controllers);
1169 return -ENOMEM;
663996b3
MS
1170}
1171
60f067b4
JS
1172static int enforce_syscall_archs(Set *archs) {
1173#ifdef HAVE_SECCOMP
1174 scmp_filter_ctx *seccomp;
1175 Iterator i;
1176 void *id;
1177 int r;
1178
1179 seccomp = seccomp_init(SCMP_ACT_ALLOW);
1180 if (!seccomp)
1181 return log_oom();
1182
1183 SET_FOREACH(id, arg_syscall_archs, i) {
1184 r = seccomp_arch_add(seccomp, PTR_TO_UINT32(id) - 1);
1185 if (r == -EEXIST)
1186 continue;
1187 if (r < 0) {
f47781d8 1188 log_error_errno(r, "Failed to add architecture to seccomp: %m");
60f067b4
JS
1189 goto finish;
1190 }
1191 }
1192
1193 r = seccomp_attr_set(seccomp, SCMP_FLTATR_CTL_NNP, 0);
1194 if (r < 0) {
f47781d8 1195 log_error_errno(r, "Failed to unset NO_NEW_PRIVS: %m");
60f067b4
JS
1196 goto finish;
1197 }
1198
1199 r = seccomp_load(seccomp);
1200 if (r < 0)
f47781d8 1201 log_error_errno(r, "Failed to add install architecture seccomp: %m");
60f067b4
JS
1202
1203finish:
1204 seccomp_release(seccomp);
1205 return r;
1206#else
1207 return 0;
1208#endif
1209}
1210
1211static int status_welcome(void) {
1212 _cleanup_free_ char *pretty_name = NULL, *ansi_color = NULL;
1213 int r;
1214
1215 r = parse_env_file("/etc/os-release", NEWLINE,
1216 "PRETTY_NAME", &pretty_name,
1217 "ANSI_COLOR", &ansi_color,
1218 NULL);
6300502b 1219 if (r == -ENOENT)
e842803a
MB
1220 r = parse_env_file("/usr/lib/os-release", NEWLINE,
1221 "PRETTY_NAME", &pretty_name,
1222 "ANSI_COLOR", &ansi_color,
1223 NULL);
60f067b4
JS
1224
1225 if (r < 0 && r != -ENOENT)
f47781d8 1226 log_warning_errno(r, "Failed to read os-release file: %m");
60f067b4
JS
1227
1228 return status_printf(NULL, false, false,
1229 "\nWelcome to \x1B[%sm%s\x1B[0m!\n",
1230 isempty(ansi_color) ? "1" : ansi_color,
1231 isempty(pretty_name) ? "Linux" : pretty_name);
1232}
1233
1234static int write_container_id(void) {
1235 const char *c;
1236
1237 c = getenv("container");
1238 if (isempty(c))
1239 return 0;
1240
7035cd9e 1241 return write_string_file("/run/systemd/container", c, WRITE_STRING_FILE_CREATE);
60f067b4
JS
1242}
1243
663996b3
MS
1244int main(int argc, char *argv[]) {
1245 Manager *m = NULL;
1246 int r, retval = EXIT_FAILURE;
1247 usec_t before_startup, after_startup;
1248 char timespan[FORMAT_TIMESPAN_MAX];
1249 FDSet *fds = NULL;
1250 bool reexecute = false;
1251 const char *shutdown_verb = NULL;
e735f4d4
MP
1252 dual_timestamp initrd_timestamp = DUAL_TIMESTAMP_NULL;
1253 dual_timestamp userspace_timestamp = DUAL_TIMESTAMP_NULL;
1254 dual_timestamp kernel_timestamp = DUAL_TIMESTAMP_NULL;
1255 dual_timestamp security_start_timestamp = DUAL_TIMESTAMP_NULL;
1256 dual_timestamp security_finish_timestamp = DUAL_TIMESTAMP_NULL;
663996b3
MS
1257 static char systemd[] = "systemd";
1258 bool skip_setup = false;
60f067b4 1259 unsigned j;
663996b3
MS
1260 bool loaded_policy = false;
1261 bool arm_reboot_watchdog = false;
1262 bool queue_default_job = false;
e842803a 1263 bool empty_etc = false;
663996b3 1264 char *switch_root_dir = NULL, *switch_root_init = NULL;
e735f4d4 1265 struct rlimit saved_rlimit_nofile = RLIMIT_MAKE_CONST(0);
f47781d8 1266 const char *error_message = NULL;
663996b3
MS
1267
1268#ifdef HAVE_SYSV_COMPAT
1269 if (getpid() != 1 && strstr(program_invocation_short_name, "init")) {
1270 /* This is compatibility support for SysV, where
1271 * calling init as a user is identical to telinit. */
1272
1273 errno = -ENOENT;
1274 execv(SYSTEMCTL_BINARY_PATH, argv);
f47781d8 1275 log_error_errno(errno, "Failed to exec " SYSTEMCTL_BINARY_PATH ": %m");
663996b3
MS
1276 return 1;
1277 }
1278#endif
1279
1280 dual_timestamp_from_monotonic(&kernel_timestamp, 0);
1281 dual_timestamp_get(&userspace_timestamp);
1282
1283 /* Determine if this is a reexecution or normal bootup. We do
1284 * the full command line parsing much later, so let's just
1285 * have a quick peek here. */
1286 if (strv_find(argv+1, "--deserialize"))
1287 skip_setup = true;
1288
1289 /* If we have switched root, do all the special setup
1290 * things */
1291 if (strv_find(argv+1, "--switched-root"))
1292 skip_setup = false;
1293
1294 /* If we get started via the /sbin/init symlink then we are
1295 called 'init'. After a subsequent reexecution we are then
1296 called 'systemd'. That is confusing, hence let's call us
1297 systemd right-away. */
1298 program_invocation_short_name = systemd;
1299 prctl(PR_SET_NAME, systemd);
1300
1301 saved_argv = argv;
1302 saved_argc = argc;
1303
1304 log_show_color(isatty(STDERR_FILENO) > 0);
5eef597e 1305 log_set_upgrade_syslog_to_journal(true);
663996b3 1306
14228c0d
MB
1307 /* Disable the umask logic */
1308 if (getpid() == 1)
1309 umask(0);
1310
6300502b 1311 if (getpid() == 1 && detect_container() <= 0) {
14228c0d 1312
663996b3 1313 /* Running outside of a container as PID 1 */
e3bff60a 1314 arg_running_as = MANAGER_SYSTEM;
663996b3
MS
1315 make_null_stdio();
1316 log_set_target(LOG_TARGET_KMSG);
1317 log_open();
1318
14228c0d 1319 if (in_initrd())
663996b3 1320 initrd_timestamp = userspace_timestamp;
663996b3
MS
1321
1322 if (!skip_setup) {
1323 mount_setup_early();
60f067b4 1324 dual_timestamp_get(&security_start_timestamp);
f47781d8
MP
1325 if (mac_selinux_setup(&loaded_policy) < 0) {
1326 error_message = "Failed to load SELinux policy";
663996b3 1327 goto finish;
f47781d8
MP
1328 } else if (ima_setup() < 0) {
1329 error_message = "Failed to load IMA policy";
663996b3 1330 goto finish;
f47781d8
MP
1331 } else if (mac_smack_setup(&loaded_policy) < 0) {
1332 error_message = "Failed to load SMACK policy";
663996b3 1333 goto finish;
f47781d8 1334 }
60f067b4 1335 dual_timestamp_get(&security_finish_timestamp);
663996b3
MS
1336 }
1337
f47781d8
MP
1338 if (mac_selinux_init(NULL) < 0) {
1339 error_message = "Failed to initialize SELinux policy";
663996b3 1340 goto finish;
f47781d8 1341 }
663996b3
MS
1342
1343 if (!skip_setup) {
60f067b4 1344 if (clock_is_localtime() > 0) {
663996b3
MS
1345 int min;
1346
5eef597e
MP
1347 /*
1348 * The very first call of settimeofday() also does a time warp in the kernel.
1349 *
1350 * In the rtc-in-local time mode, we set the kernel's timezone, and rely on
1351 * external tools to take care of maintaining the RTC and do all adjustments.
1352 * This matches the behavior of Windows, which leaves the RTC alone if the
1353 * registry tells that the RTC runs in UTC.
1354 */
60f067b4 1355 r = clock_set_timezone(&min);
663996b3 1356 if (r < 0)
f47781d8 1357 log_error_errno(r, "Failed to apply local time delta, ignoring: %m");
663996b3
MS
1358 else
1359 log_info("RTC configured in localtime, applying delta of %i minutes to system time.", min);
1360 } else if (!in_initrd()) {
1361 /*
5eef597e 1362 * Do a dummy very first call to seal the kernel's time warp magic.
663996b3
MS
1363 *
1364 * Do not call this from inside the initrd. The initrd might not
1365 * carry /etc/adjtime with LOCAL, but the real system could be set up
1366 * that way. In such case, we need to delay the time-warp or the sealing
1367 * until we reach the real system.
5eef597e
MP
1368 *
1369 * Do not set the kernel's timezone. The concept of local time cannot
1370 * be supported reliably, the time will jump or be incorrect at every daylight
1371 * saving time change. All kernel local time concepts will be treated
1372 * as UTC that way.
663996b3 1373 */
5eef597e 1374 clock_reset_timewarp();
663996b3
MS
1375 }
1376 }
1377
1378 /* Set the default for later on, but don't actually
1379 * open the logs like this for now. Note that if we
1380 * are transitioning from the initrd there might still
1381 * be journal fd open, and we shouldn't attempt
1382 * opening that before we parsed /proc/cmdline which
1383 * might redirect output elsewhere. */
1384 log_set_target(LOG_TARGET_JOURNAL_OR_KMSG);
1385
1386 } else if (getpid() == 1) {
1387 /* Running inside a container, as PID 1 */
e3bff60a 1388 arg_running_as = MANAGER_SYSTEM;
663996b3 1389 log_set_target(LOG_TARGET_CONSOLE);
60f067b4 1390 log_close_console(); /* force reopen of /dev/console */
663996b3
MS
1391 log_open();
1392
1393 /* For the later on, see above... */
1394 log_set_target(LOG_TARGET_JOURNAL);
1395
1396 /* clear the kernel timestamp,
1397 * because we are in a container */
1398 kernel_timestamp.monotonic = 0ULL;
1399 kernel_timestamp.realtime = 0ULL;
1400
1401 } else {
1402 /* Running as user instance */
e3bff60a 1403 arg_running_as = MANAGER_USER;
663996b3
MS
1404 log_set_target(LOG_TARGET_AUTO);
1405 log_open();
1406
1407 /* clear the kernel timestamp,
1408 * because we are not PID 1 */
d9dfd233 1409 kernel_timestamp = DUAL_TIMESTAMP_NULL;
663996b3
MS
1410 }
1411
1412 /* Initialize default unit */
6300502b 1413 r = free_and_strdup(&arg_default_unit, SPECIAL_DEFAULT_TARGET);
663996b3 1414 if (r < 0) {
f47781d8
MP
1415 log_emergency_errno(r, "Failed to set default unit %s: %m", SPECIAL_DEFAULT_TARGET);
1416 error_message = "Failed to set default unit";
663996b3
MS
1417 goto finish;
1418 }
1419
1420 r = initialize_join_controllers();
f47781d8 1421 if (r < 0) {
e3bff60a 1422 error_message = "Failed to initialize cgroup controllers";
663996b3 1423 goto finish;
f47781d8 1424 }
663996b3
MS
1425
1426 /* Mount /proc, /sys and friends, so that /proc/cmdline and
1427 * /proc/$PID/fd is available. */
1428 if (getpid() == 1) {
f47781d8
MP
1429
1430 /* Load the kernel modules early, so that kdbus.ko is loaded before kdbusfs is mounted */
1431 if (!skip_setup)
1432 kmod_setup();
1433
663996b3 1434 r = mount_setup(loaded_policy);
f47781d8
MP
1435 if (r < 0) {
1436 error_message = "Failed to mount API filesystems";
663996b3 1437 goto finish;
f47781d8 1438 }
663996b3
MS
1439 }
1440
1441 /* Reset all signal handlers. */
86f210e9
MP
1442 (void) reset_all_signal_handlers();
1443 (void) ignore_signals(SIGNALS_IGNORE, -1);
663996b3 1444
f47781d8
MP
1445 if (parse_config_file() < 0) {
1446 error_message = "Failed to parse config file";
663996b3 1447 goto finish;
f47781d8 1448 }
663996b3 1449
e3bff60a 1450 if (arg_running_as == MANAGER_SYSTEM) {
f47781d8
MP
1451 r = parse_proc_cmdline(parse_proc_cmdline_item);
1452 if (r < 0)
1453 log_warning_errno(r, "Failed to parse kernel command line, ignoring: %m");
1454 }
663996b3 1455
5eef597e
MP
1456 /* Note that this also parses bits from the kernel command
1457 * line, including "debug". */
663996b3
MS
1458 log_parse_environment();
1459
f47781d8
MP
1460 if (parse_argv(argc, argv) < 0) {
1461 error_message = "Failed to parse commandline arguments";
663996b3 1462 goto finish;
f47781d8 1463 }
663996b3
MS
1464
1465 if (arg_action == ACTION_TEST &&
1466 geteuid() == 0) {
1467 log_error("Don't run test mode as root.");
1468 goto finish;
1469 }
1470
e3bff60a 1471 if (arg_running_as == MANAGER_USER &&
663996b3
MS
1472 arg_action == ACTION_RUN &&
1473 sd_booted() <= 0) {
1474 log_error("Trying to run as user instance, but the system has not been booted with systemd.");
1475 goto finish;
1476 }
1477
e3bff60a 1478 if (arg_running_as == MANAGER_SYSTEM &&
663996b3
MS
1479 arg_action == ACTION_RUN &&
1480 running_in_chroot() > 0) {
1481 log_error("Cannot be run in a chroot() environment.");
1482 goto finish;
1483 }
1484
5eef597e
MP
1485 if (arg_action == ACTION_TEST)
1486 skip_setup = true;
1487
1488 pager_open_if_enabled();
1489
663996b3
MS
1490 if (arg_action == ACTION_HELP) {
1491 retval = help();
1492 goto finish;
1493 } else if (arg_action == ACTION_VERSION) {
1494 retval = version();
1495 goto finish;
1496 } else if (arg_action == ACTION_DUMP_CONFIGURATION_ITEMS) {
1497 unit_dump_config_items(stdout);
1498 retval = EXIT_SUCCESS;
1499 goto finish;
1500 } else if (arg_action == ACTION_DONE) {
1501 retval = EXIT_SUCCESS;
1502 goto finish;
1503 }
1504
e3bff60a 1505 if (arg_running_as == MANAGER_USER &&
60f067b4
JS
1506 !getenv("XDG_RUNTIME_DIR")) {
1507 log_error("Trying to run as user instance, but $XDG_RUNTIME_DIR is not set.");
1508 goto finish;
1509 }
1510
663996b3
MS
1511 assert_se(arg_action == ACTION_RUN || arg_action == ACTION_TEST);
1512
1513 /* Close logging fds, in order not to confuse fdset below */
1514 log_close();
1515
1516 /* Remember open file descriptors for later deserialization */
1517 r = fdset_new_fill(&fds);
1518 if (r < 0) {
f47781d8
MP
1519 log_emergency_errno(r, "Failed to allocate fd set: %m");
1520 error_message = "Failed to allocate fd set";
663996b3
MS
1521 goto finish;
1522 } else
1523 fdset_cloexec(fds, true);
1524
60f067b4
JS
1525 if (arg_serialization)
1526 assert_se(fdset_remove(fds, fileno(arg_serialization)) >= 0);
663996b3 1527
e3bff60a 1528 if (arg_running_as == MANAGER_SYSTEM)
663996b3
MS
1529 /* Become a session leader if we aren't one yet. */
1530 setsid();
1531
14228c0d 1532 /* Move out of the way, so that we won't block unmounts */
86f210e9 1533 assert_se(chdir("/") == 0);
663996b3 1534
663996b3
MS
1535 /* Reset the console, but only if this is really init and we
1536 * are freshly booted */
e3bff60a 1537 if (arg_running_as == MANAGER_SYSTEM && arg_action == ACTION_RUN) {
5eef597e
MP
1538
1539 /* If we are init, we connect stdin/stdout/stderr to
1540 * /dev/null and make sure we don't have a controlling
1541 * tty. */
1542 release_terminal();
1543
1544 if (getpid() == 1 && !skip_setup)
1545 console_setup();
1546 }
663996b3
MS
1547
1548 /* Open the logging devices, if possible and necessary */
1549 log_open();
1550
60f067b4
JS
1551 if (arg_show_status == _SHOW_STATUS_UNSET)
1552 arg_show_status = SHOW_STATUS_YES;
1553
663996b3
MS
1554 /* Make sure we leave a core dump without panicking the
1555 * kernel. */
1556 if (getpid() == 1) {
1557 install_crash_handler();
1558
1559 r = mount_cgroup_controllers(arg_join_controllers);
1560 if (r < 0)
1561 goto finish;
1562 }
1563
e3bff60a 1564 if (arg_running_as == MANAGER_SYSTEM) {
6300502b 1565 int v;
663996b3 1566
5eef597e
MP
1567 log_info(PACKAGE_STRING " running in %ssystem mode. (" SYSTEMD_FEATURES ")",
1568 arg_action == ACTION_TEST ? "test " : "" );
663996b3 1569
6300502b
MP
1570 v = detect_virtualization();
1571 if (v > 0)
1572 log_info("Detected virtualization %s.", virtualization_to_string(v));
663996b3 1573
60f067b4
JS
1574 write_container_id();
1575
e3bff60a 1576 log_info("Detected architecture %s.", architecture_to_string(uname_architecture()));
60f067b4 1577
663996b3
MS
1578 if (in_initrd())
1579 log_info("Running in initial RAM disk.");
1580
5eef597e
MP
1581 /* Let's check whether /etc is already populated. We
1582 * don't actually really check for that, but use
1583 * /etc/machine-id as flag file. This allows container
1584 * managers and installers to provision a couple of
1585 * files already. If the container manager wants to
1586 * provision the machine ID itself it should pass
e735f4d4 1587 * $container_uuid to PID 1. */
5eef597e
MP
1588
1589 empty_etc = access("/etc/machine-id", F_OK) < 0;
e842803a
MB
1590 if (empty_etc)
1591 log_info("Running with unpopulated /etc.");
60f067b4 1592 } else {
e842803a
MB
1593 _cleanup_free_ char *t;
1594
1595 t = uid_to_name(getuid());
5eef597e
MP
1596 log_debug(PACKAGE_STRING " running in %suser mode for user "UID_FMT"/%s. (" SYSTEMD_FEATURES ")",
1597 arg_action == ACTION_TEST ? " test" : "", getuid(), t);
60f067b4 1598 }
663996b3 1599
e3bff60a
MP
1600 if (arg_running_as == MANAGER_SYSTEM && !skip_setup) {
1601 if (arg_show_status > 0)
663996b3
MS
1602 status_welcome();
1603
663996b3 1604 hostname_setup();
e842803a 1605 machine_id_setup(NULL);
663996b3
MS
1606 loopback_setup();
1607
1608 test_mtab();
1609 test_usr();
663996b3
MS
1610 }
1611
e3bff60a 1612 if (arg_running_as == MANAGER_SYSTEM && arg_runtime_watchdog > 0)
663996b3
MS
1613 watchdog_set_timeout(&arg_runtime_watchdog);
1614
5eef597e 1615 if (arg_timer_slack_nsec != NSEC_INFINITY)
663996b3 1616 if (prctl(PR_SET_TIMERSLACK, arg_timer_slack_nsec) < 0)
f47781d8 1617 log_error_errno(errno, "Failed to adjust timer slack: %m");
663996b3
MS
1618
1619 if (arg_capability_bounding_set_drop) {
14228c0d 1620 r = capability_bounding_set_drop_usermode(arg_capability_bounding_set_drop);
663996b3 1621 if (r < 0) {
f47781d8
MP
1622 log_emergency_errno(r, "Failed to drop capability bounding set of usermode helpers: %m");
1623 error_message = "Failed to drop capability bounding set of usermode helpers";
663996b3
MS
1624 goto finish;
1625 }
14228c0d 1626 r = capability_bounding_set_drop(arg_capability_bounding_set_drop, true);
663996b3 1627 if (r < 0) {
f47781d8
MP
1628 log_emergency_errno(r, "Failed to drop capability bounding set: %m");
1629 error_message = "Failed to drop capability bounding set";
663996b3
MS
1630 goto finish;
1631 }
1632 }
1633
60f067b4
JS
1634 if (arg_syscall_archs) {
1635 r = enforce_syscall_archs(arg_syscall_archs);
f47781d8
MP
1636 if (r < 0) {
1637 error_message = "Failed to set syscall architectures";
60f067b4 1638 goto finish;
f47781d8 1639 }
60f067b4
JS
1640 }
1641
86f210e9 1642 if (arg_running_as == MANAGER_USER)
663996b3 1643 /* Become reaper of our children */
86f210e9 1644 if (prctl(PR_SET_CHILD_SUBREAPER, 1) < 0)
f47781d8 1645 log_warning_errno(errno, "Failed to make us a subreaper: %m");
663996b3 1646
e3bff60a 1647 if (arg_running_as == MANAGER_SYSTEM) {
663996b3
MS
1648 bump_rlimit_nofile(&saved_rlimit_nofile);
1649
e842803a 1650 if (empty_etc) {
e3bff60a 1651 r = unit_file_preset_all(UNIT_FILE_SYSTEM, false, NULL, UNIT_FILE_PRESET_ENABLE_ONLY, false, NULL, 0);
e842803a 1652 if (r < 0)
f47781d8 1653 log_warning_errno(r, "Failed to populate /etc with preset unit settings, ignoring: %m");
e842803a
MB
1654 else
1655 log_info("Populated /etc with preset unit settings.");
1656 }
1657 }
1658
5eef597e 1659 r = manager_new(arg_running_as, arg_action == ACTION_TEST, &m);
663996b3 1660 if (r < 0) {
f47781d8
MP
1661 log_emergency_errno(r, "Failed to allocate manager object: %m");
1662 error_message = "Failed to allocate manager object";
663996b3
MS
1663 goto finish;
1664 }
1665
1666 m->confirm_spawn = arg_confirm_spawn;
663996b3
MS
1667 m->runtime_watchdog = arg_runtime_watchdog;
1668 m->shutdown_watchdog = arg_shutdown_watchdog;
1669 m->userspace_timestamp = userspace_timestamp;
1670 m->kernel_timestamp = kernel_timestamp;
663996b3 1671 m->initrd_timestamp = initrd_timestamp;
60f067b4
JS
1672 m->security_start_timestamp = security_start_timestamp;
1673 m->security_finish_timestamp = security_finish_timestamp;
663996b3 1674
7035cd9e 1675 manager_set_defaults(m);
663996b3 1676 manager_set_show_status(m, arg_show_status);
5eef597e 1677 manager_set_first_boot(m, empty_etc);
663996b3
MS
1678
1679 /* Remember whether we should queue the default job */
60f067b4 1680 queue_default_job = !arg_serialization || arg_switched_root;
663996b3
MS
1681
1682 before_startup = now(CLOCK_MONOTONIC);
1683
60f067b4 1684 r = manager_startup(m, arg_serialization, fds);
663996b3 1685 if (r < 0)
f47781d8 1686 log_error_errno(r, "Failed to fully start up daemon: %m");
663996b3
MS
1687
1688 /* This will close all file descriptors that were opened, but
1689 * not claimed by any unit. */
6300502b 1690 fds = fdset_free(fds);
663996b3 1691
6300502b 1692 arg_serialization = safe_fclose(arg_serialization);
663996b3
MS
1693
1694 if (queue_default_job) {
60f067b4 1695 _cleanup_bus_error_free_ sd_bus_error error = SD_BUS_ERROR_NULL;
663996b3
MS
1696 Unit *target = NULL;
1697 Job *default_unit_job;
1698
663996b3
MS
1699 log_debug("Activating default unit: %s", arg_default_unit);
1700
1701 r = manager_load_unit(m, arg_default_unit, NULL, &error, &target);
60f067b4
JS
1702 if (r < 0)
1703 log_error("Failed to load default target: %s", bus_error_message(&error, r));
1704 else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND)
f47781d8 1705 log_error_errno(target->load_error, "Failed to load default target: %m");
663996b3
MS
1706 else if (target->load_state == UNIT_MASKED)
1707 log_error("Default target masked.");
1708
1709 if (!target || target->load_state != UNIT_LOADED) {
1710 log_info("Trying to load rescue target...");
1711
1712 r = manager_load_unit(m, SPECIAL_RESCUE_TARGET, NULL, &error, &target);
1713 if (r < 0) {
f47781d8
MP
1714 log_emergency("Failed to load rescue target: %s", bus_error_message(&error, r));
1715 error_message = "Failed to load rescue target";
663996b3 1716 goto finish;
14228c0d 1717 } else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND) {
f47781d8
MP
1718 log_emergency_errno(target->load_error, "Failed to load rescue target: %m");
1719 error_message = "Failed to load rescue target";
663996b3
MS
1720 goto finish;
1721 } else if (target->load_state == UNIT_MASKED) {
f47781d8
MP
1722 log_emergency("Rescue target masked.");
1723 error_message = "Rescue target masked";
663996b3
MS
1724 goto finish;
1725 }
1726 }
1727
1728 assert(target->load_state == UNIT_LOADED);
1729
1730 if (arg_action == ACTION_TEST) {
1731 printf("-> By units:\n");
1732 manager_dump_units(m, stdout, "\t");
1733 }
1734
1735 r = manager_add_job(m, JOB_START, target, JOB_ISOLATE, false, &error, &default_unit_job);
1736 if (r == -EPERM) {
60f067b4 1737 log_debug("Default target could not be isolated, starting instead: %s", bus_error_message(&error, r));
663996b3
MS
1738
1739 r = manager_add_job(m, JOB_START, target, JOB_REPLACE, false, &error, &default_unit_job);
1740 if (r < 0) {
f47781d8
MP
1741 log_emergency("Failed to start default target: %s", bus_error_message(&error, r));
1742 error_message = "Failed to start default target";
663996b3
MS
1743 goto finish;
1744 }
1745 } else if (r < 0) {
f47781d8
MP
1746 log_emergency("Failed to isolate default target: %s", bus_error_message(&error, r));
1747 error_message = "Failed to isolate default target";
663996b3
MS
1748 goto finish;
1749 }
1750
1751 m->default_unit_job_id = default_unit_job->id;
1752
1753 after_startup = now(CLOCK_MONOTONIC);
1754 log_full(arg_action == ACTION_TEST ? LOG_INFO : LOG_DEBUG,
1755 "Loaded units and determined initial transaction in %s.",
5eef597e 1756 format_timespan(timespan, sizeof(timespan), after_startup - before_startup, 100 * USEC_PER_MSEC));
663996b3
MS
1757
1758 if (arg_action == ACTION_TEST) {
1759 printf("-> By jobs:\n");
1760 manager_dump_jobs(m, stdout, "\t");
1761 retval = EXIT_SUCCESS;
1762 goto finish;
1763 }
1764 }
1765
1766 for (;;) {
1767 r = manager_loop(m);
1768 if (r < 0) {
f47781d8
MP
1769 log_emergency_errno(r, "Failed to run main loop: %m");
1770 error_message = "Failed to run main loop";
663996b3
MS
1771 goto finish;
1772 }
1773
1774 switch (m->exit_code) {
1775
663996b3
MS
1776 case MANAGER_RELOAD:
1777 log_info("Reloading.");
7035cd9e
MP
1778
1779 r = parse_config_file();
1780 if (r < 0)
1781 log_error("Failed to parse config file.");
1782
1783 manager_set_defaults(m);
1784
663996b3
MS
1785 r = manager_reload(m);
1786 if (r < 0)
f47781d8 1787 log_error_errno(r, "Failed to reload: %m");
663996b3
MS
1788 break;
1789
1790 case MANAGER_REEXECUTE:
1791
f47781d8 1792 if (prepare_reexecute(m, &arg_serialization, &fds, false) < 0) {
13d276d0 1793 error_message = "Failed to prepare for reexecution";
663996b3 1794 goto finish;
f47781d8 1795 }
663996b3
MS
1796
1797 reexecute = true;
1798 log_notice("Reexecuting.");
1799 goto finish;
1800
1801 case MANAGER_SWITCH_ROOT:
1802 /* Steal the switch root parameters */
1803 switch_root_dir = m->switch_root;
1804 switch_root_init = m->switch_root_init;
1805 m->switch_root = m->switch_root_init = NULL;
1806
1807 if (!switch_root_init)
f47781d8 1808 if (prepare_reexecute(m, &arg_serialization, &fds, true) < 0) {
13d276d0 1809 error_message = "Failed to prepare for reexecution";
663996b3 1810 goto finish;
f47781d8 1811 }
663996b3
MS
1812
1813 reexecute = true;
1814 log_notice("Switching root.");
1815 goto finish;
1816
6300502b
MP
1817 case MANAGER_EXIT:
1818 retval = m->return_value;
1819
1820 if (m->running_as == MANAGER_USER) {
1821 log_debug("Exit.");
1822 goto finish;
1823 }
1824
1825 /* fallthrough */
663996b3
MS
1826 case MANAGER_REBOOT:
1827 case MANAGER_POWEROFF:
1828 case MANAGER_HALT:
1829 case MANAGER_KEXEC: {
1830 static const char * const table[_MANAGER_EXIT_CODE_MAX] = {
6300502b 1831 [MANAGER_EXIT] = "exit",
663996b3
MS
1832 [MANAGER_REBOOT] = "reboot",
1833 [MANAGER_POWEROFF] = "poweroff",
1834 [MANAGER_HALT] = "halt",
1835 [MANAGER_KEXEC] = "kexec"
1836 };
1837
1838 assert_se(shutdown_verb = table[m->exit_code]);
1839 arm_reboot_watchdog = m->exit_code == MANAGER_REBOOT;
1840
1841 log_notice("Shutting down.");
1842 goto finish;
1843 }
1844
1845 default:
1846 assert_not_reached("Unknown exit code.");
1847 }
1848 }
1849
1850finish:
5eef597e
MP
1851 pager_close();
1852
e735f4d4
MP
1853 if (m)
1854 arg_shutdown_watchdog = m->shutdown_watchdog;
6300502b 1855
f47781d8 1856 m = manager_free(m);
663996b3 1857
6300502b
MP
1858 for (j = 0; j < ELEMENTSOF(arg_default_rlimit); j++)
1859 arg_default_rlimit[j] = mfree(arg_default_rlimit[j]);
663996b3 1860
13d276d0 1861 arg_default_unit = mfree(arg_default_unit);
6300502b 1862 arg_join_controllers = strv_free_free(arg_join_controllers);
13d276d0 1863 arg_default_environment = strv_free(arg_default_environment);
6300502b 1864 arg_syscall_archs = set_free(arg_syscall_archs);
60f067b4 1865
5eef597e 1866 mac_selinux_finish();
663996b3
MS
1867
1868 if (reexecute) {
1869 const char **args;
1870 unsigned i, args_size;
1871
1872 /* Close and disarm the watchdog, so that the new
1873 * instance can reinitialize it, but doesn't get
1874 * rebooted while we do that */
1875 watchdog_close(true);
1876
1877 /* Reset the RLIMIT_NOFILE to the kernel default, so
1878 * that the new systemd can pass the kernel default to
1879 * its child processes */
1880 if (saved_rlimit_nofile.rlim_cur > 0)
6300502b 1881 (void) setrlimit(RLIMIT_NOFILE, &saved_rlimit_nofile);
663996b3
MS
1882
1883 if (switch_root_dir) {
1884 /* Kill all remaining processes from the
1885 * initrd, but don't wait for them, so that we
1886 * can handle the SIGCHLD for them after
1887 * deserializing. */
60f067b4 1888 broadcast_signal(SIGTERM, false, true);
663996b3 1889
5eef597e
MP
1890 /* And switch root with MS_MOVE, because we remove the old directory afterwards and detach it. */
1891 r = switch_root(switch_root_dir, "/mnt", true, MS_MOVE);
663996b3 1892 if (r < 0)
f47781d8 1893 log_error_errno(r, "Failed to switch root, trying to continue: %m");
663996b3
MS
1894 }
1895
1896 args_size = MAX(6, argc+1);
1897 args = newa(const char*, args_size);
1898
1899 if (!switch_root_init) {
e735f4d4 1900 char sfd[DECIMAL_STR_MAX(int) + 1];
663996b3
MS
1901
1902 /* First try to spawn ourselves with the right
1903 * path, and with full serialization. We do
1904 * this only if the user didn't specify an
1905 * explicit init to spawn. */
1906
60f067b4 1907 assert(arg_serialization);
663996b3
MS
1908 assert(fds);
1909
e735f4d4 1910 xsprintf(sfd, "%i", fileno(arg_serialization));
663996b3
MS
1911
1912 i = 0;
1913 args[i++] = SYSTEMD_BINARY_PATH;
1914 if (switch_root_dir)
1915 args[i++] = "--switched-root";
e3bff60a 1916 args[i++] = arg_running_as == MANAGER_SYSTEM ? "--system" : "--user";
663996b3
MS
1917 args[i++] = "--deserialize";
1918 args[i++] = sfd;
1919 args[i++] = NULL;
1920
14228c0d
MB
1921 /* do not pass along the environment we inherit from the kernel or initrd */
1922 if (switch_root_dir)
6300502b 1923 (void) clearenv();
14228c0d 1924
663996b3 1925 assert(i <= args_size);
6300502b 1926 (void) execv(args[0], (char* const*) args);
663996b3
MS
1927 }
1928
1929 /* Try the fallback, if there is any, without any
1930 * serialization. We pass the original argv[] and
1931 * envp[]. (Well, modulo the ordering changes due to
1932 * getopt() in argv[], and some cleanups in envp[],
1933 * but let's hope that doesn't matter.) */
1934
6300502b
MP
1935 arg_serialization = safe_fclose(arg_serialization);
1936 fds = fdset_free(fds);
663996b3
MS
1937
1938 /* Reopen the console */
6300502b 1939 (void) make_console_stdio();
663996b3 1940
60f067b4 1941 for (j = 1, i = 1; j < (unsigned) argc; j++)
663996b3
MS
1942 args[i++] = argv[j];
1943 args[i++] = NULL;
1944 assert(i <= args_size);
1945
5eef597e 1946 /* Reenable any blocked signals, especially important
e842803a 1947 * if we switch from initial ramdisk to init=... */
86f210e9
MP
1948 (void) reset_all_signal_handlers();
1949 (void) reset_signal_mask();
e842803a 1950
663996b3
MS
1951 if (switch_root_init) {
1952 args[0] = switch_root_init;
6300502b 1953 (void) execv(args[0], (char* const*) args);
f47781d8 1954 log_warning_errno(errno, "Failed to execute configured init, trying fallback: %m");
663996b3
MS
1955 }
1956
1957 args[0] = "/sbin/init";
6300502b 1958 (void) execv(args[0], (char* const*) args);
663996b3
MS
1959
1960 if (errno == ENOENT) {
1961 log_warning("No /sbin/init, trying fallback");
1962
1963 args[0] = "/bin/sh";
1964 args[1] = NULL;
6300502b 1965 (void) execv(args[0], (char* const*) args);
f47781d8 1966 log_error_errno(errno, "Failed to execute /bin/sh, giving up: %m");
663996b3 1967 } else
f47781d8 1968 log_warning_errno(errno, "Failed to execute /sbin/init, giving up: %m");
663996b3
MS
1969 }
1970
6300502b
MP
1971 arg_serialization = safe_fclose(arg_serialization);
1972 fds = fdset_free(fds);
60f067b4
JS
1973
1974#ifdef HAVE_VALGRIND_VALGRIND_H
1975 /* If we are PID 1 and running under valgrind, then let's exit
1976 * here explicitly. valgrind will only generate nice output on
1977 * exit(), not on exec(), hence let's do the former not the
1978 * latter here. */
1979 if (getpid() == 1 && RUNNING_ON_VALGRIND)
1980 return 0;
1981#endif
663996b3
MS
1982
1983 if (shutdown_verb) {
60f067b4 1984 char log_level[DECIMAL_STR_MAX(int) + 1];
6300502b
MP
1985 char exit_code[DECIMAL_STR_MAX(uint8_t) + 1];
1986 const char* command_line[11] = {
663996b3
MS
1987 SYSTEMD_SHUTDOWN_BINARY_PATH,
1988 shutdown_verb,
60f067b4
JS
1989 "--log-level", log_level,
1990 "--log-target",
1991 };
1992 unsigned pos = 5;
1993 _cleanup_strv_free_ char **env_block = NULL;
1994
1995 assert(command_line[pos] == NULL);
1996 env_block = strv_copy(environ);
1997
e735f4d4 1998 xsprintf(log_level, "%d", log_get_max_level());
60f067b4
JS
1999
2000 switch (log_get_target()) {
6300502b 2001
60f067b4
JS
2002 case LOG_TARGET_KMSG:
2003 case LOG_TARGET_JOURNAL_OR_KMSG:
2004 case LOG_TARGET_SYSLOG_OR_KMSG:
2005 command_line[pos++] = "kmsg";
2006 break;
2007
fb183854
MP
2008 case LOG_TARGET_NULL:
2009 command_line[pos++] = "null";
2010 break;
2011
60f067b4
JS
2012 case LOG_TARGET_CONSOLE:
2013 default:
2014 command_line[pos++] = "console";
2015 break;
663996b3 2016 };
60f067b4
JS
2017
2018 if (log_get_show_color())
2019 command_line[pos++] = "--log-color";
2020
2021 if (log_get_show_location())
2022 command_line[pos++] = "--log-location";
2023
6300502b
MP
2024 if (streq(shutdown_verb, "exit")) {
2025 command_line[pos++] = "--exit-code";
2026 command_line[pos++] = exit_code;
2027 xsprintf(exit_code, "%d", retval);
2028 }
2029
60f067b4 2030 assert(pos < ELEMENTSOF(command_line));
663996b3
MS
2031
2032 if (arm_reboot_watchdog && arg_shutdown_watchdog > 0) {
60f067b4 2033 char *e;
663996b3
MS
2034
2035 /* If we reboot let's set the shutdown
2036 * watchdog and tell the shutdown binary to
2037 * repeatedly ping it */
e735f4d4
MP
2038 r = watchdog_set_timeout(&arg_shutdown_watchdog);
2039 watchdog_close(r < 0);
663996b3 2040
60f067b4
JS
2041 /* Tell the binary how often to ping, ignore failure */
2042 if (asprintf(&e, "WATCHDOG_USEC="USEC_FMT, arg_shutdown_watchdog) > 0)
6300502b 2043 (void) strv_push(&env_block, e);
60f067b4 2044 } else
663996b3 2045 watchdog_close(true);
663996b3 2046
14228c0d
MB
2047 /* Avoid the creation of new processes forked by the
2048 * kernel; at this point, we will not listen to the
2049 * signals anyway */
6300502b 2050 if (detect_container() <= 0)
d9dfd233 2051 (void) cg_uninstall_release_agent(SYSTEMD_CGROUP_CONTROLLER);
14228c0d 2052
663996b3 2053 execve(SYSTEMD_SHUTDOWN_BINARY_PATH, (char **) command_line, env_block);
f47781d8 2054 log_error_errno(errno, "Failed to execute shutdown binary, %s: %m",
60f067b4 2055 getpid() == 1 ? "freezing" : "quitting");
663996b3
MS
2056 }
2057
f47781d8
MP
2058 if (getpid() == 1) {
2059 if (error_message)
2060 manager_status_printf(NULL, STATUS_TYPE_EMERGENCY,
6300502b 2061 ANSI_HIGHLIGHT_RED "!!!!!!" ANSI_NORMAL,
f47781d8 2062 "%s, freezing.", error_message);
6300502b 2063 freeze_or_reboot();
f47781d8 2064 }
663996b3
MS
2065
2066 return retval;
2067}