]> git.ipfire.org Git - thirdparty/systemd.git/blame - src/core/main.c
tree-wide: port more code to use send_one_fd() and receive_one_fd()
[thirdparty/systemd.git] / src / core / main.c
CommitLineData
d6c9574f 1/*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
60918275 2
a7334b09
LP
3/***
4 This file is part of systemd.
5
6 Copyright 2010 Lennart Poettering
7
8 systemd is free software; you can redistribute it and/or modify it
5430f7f2
LP
9 under the terms of the GNU Lesser General Public License as published by
10 the Free Software Foundation; either version 2.1 of the License, or
a7334b09
LP
11 (at your option) any later version.
12
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
5430f7f2 16 Lesser General Public License for more details.
a7334b09 17
5430f7f2 18 You should have received a copy of the GNU Lesser General Public License
a7334b09
LP
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
20***/
21
60918275
LP
22#include <stdio.h>
23#include <errno.h>
24#include <string.h>
16354eff 25#include <unistd.h>
4ade7963 26#include <sys/stat.h>
f170852a 27#include <getopt.h>
97c4f35c 28#include <signal.h>
80876c20 29#include <fcntl.h>
f3b6a3ed 30#include <sys/prctl.h>
664f88a7 31#include <sys/mount.h>
60918275 32
54b434b1
LP
33#ifdef HAVE_VALGRIND_VALGRIND_H
34#include <valgrind/valgrind.h>
35#endif
b64a3d86
LP
36#ifdef HAVE_SECCOMP
37#include <seccomp.h>
38#endif
54b434b1 39
718db961 40#include "sd-daemon.h"
718db961 41#include "sd-bus.h"
16354eff 42#include "log.h"
a16e1123 43#include "fdset.h"
514f4ef5 44#include "special.h"
487393e9 45#include "conf-parser.h"
ad780f19 46#include "missing.h"
b87c2aa6 47#include "pager.h"
302e27c8 48#include "build.h"
06d4c99a 49#include "strv.h"
f6a6225e 50#include "def.h"
b52aae1d 51#include "virt.h"
d9d93745 52#include "architecture.h"
e96d6be7 53#include "watchdog.h"
41669317 54#include "switch-root.h"
ec8927ca 55#include "capability.h"
bd3fa1d2 56#include "killall.h"
0c4025d1 57#include "env-util.h"
24efb112 58#include "clock-util.h"
718db961 59#include "fileio.h"
718db961
LP
60#include "bus-error.h"
61#include "bus-util.h"
d7b8eec7 62#include "selinux-util.h"
24882e06
LP
63#include "formats-util.h"
64#include "process-util.h"
65#include "terminal-util.h"
66#include "signal-util.h"
d7b8eec7
LP
67#include "manager.h"
68#include "dbus-manager.h"
69#include "load-fragment.h"
60918275 70
b6e66135
LP
71#include "mount-setup.h"
72#include "loopback-setup.h"
b6e66135
LP
73#include "hostname-setup.h"
74#include "machine-id-setup.h"
b6e66135
LP
75#include "selinux-setup.h"
76#include "ima-setup.h"
ffbd2c4d 77#include "smack-setup.h"
718db961 78#include "kmod-setup.h"
b6e66135 79
f170852a
LP
80static enum {
81 ACTION_RUN,
e965d56d 82 ACTION_HELP,
9ba0bc4e 83 ACTION_VERSION,
e537352b 84 ACTION_TEST,
4288f619
LP
85 ACTION_DUMP_CONFIGURATION_ITEMS,
86 ACTION_DONE
fa0f4d8a 87} arg_action = ACTION_RUN;
fa0f4d8a 88static char *arg_default_unit = NULL;
b2c23da8 89static ManagerRunningAs arg_running_as = _MANAGER_RUNNING_AS_INVALID;
fa0f4d8a
LP
90static bool arg_dump_core = true;
91static bool arg_crash_shell = false;
92static int arg_crash_chvt = -1;
93static bool arg_confirm_spawn = false;
b6e2f329 94static ShowStatus arg_show_status = _SHOW_STATUS_UNSET;
bf4df7c3 95static bool arg_switched_root = false;
b87c2aa6 96static int arg_no_pager = -1;
0c85a4f3 97static char ***arg_join_controllers = NULL;
706343f4 98static ExecOutput arg_default_std_output = EXEC_OUTPUT_JOURNAL;
0a494f1f 99static ExecOutput arg_default_std_error = EXEC_OUTPUT_INHERIT;
1f19a534
OS
100static usec_t arg_default_restart_usec = DEFAULT_RESTART_USEC;
101static usec_t arg_default_timeout_start_usec = DEFAULT_TIMEOUT_USEC;
102static usec_t arg_default_timeout_stop_usec = DEFAULT_TIMEOUT_USEC;
3f41e1e5
LN
103static usec_t arg_default_start_limit_interval = DEFAULT_START_LIMIT_INTERVAL;
104static unsigned arg_default_start_limit_burst = DEFAULT_START_LIMIT_BURST;
e96d6be7
LP
105static usec_t arg_runtime_watchdog = 0;
106static usec_t arg_shutdown_watchdog = 10 * USEC_PER_MINUTE;
97d0e5f8 107static char **arg_default_environment = NULL;
517d56b1 108static struct rlimit *arg_default_rlimit[_RLIMIT_MAX] = {};
ec8927ca 109static uint64_t arg_capability_bounding_set_drop = 0;
3a43da28 110static nsec_t arg_timer_slack_nsec = NSEC_INFINITY;
bd8f585b 111static usec_t arg_default_timer_accuracy_usec = 1 * USEC_PER_MINUTE;
d3b1c508
LP
112static Set* arg_syscall_archs = NULL;
113static FILE* arg_serialization = NULL;
085afe36
LP
114static bool arg_default_cpu_accounting = false;
115static bool arg_default_blockio_accounting = false;
116static bool arg_default_memory_accounting = false;
03a7b521 117static bool arg_default_tasks_accounting = false;
4fc935ca 118
/* Signal handler that intentionally does nothing. crash() installs it
 * for SIGCHLD before cloning the core-dump child. */
static void nop_handler(int sig) {
}
6f5e3f35 120
b87c2aa6
ZJS
121static void pager_open_if_enabled(void) {
122
123 if (arg_no_pager <= 0)
124 return;
125
126 pager_open(false);
127}
128
919ce0b7 129noreturn static void crash(int sig) {
97c4f35c 130
abb26902
LP
131 if (getpid() != 1)
132 /* Pass this on immediately, if this is not PID 1 */
133 raise(sig);
134 else if (!arg_dump_core)
4104970e 135 log_emergency("Caught <%s>, not dumping core.", signal_to_string(sig));
97c4f35c 136 else {
b92bea5d
ZJS
137 struct sigaction sa = {
138 .sa_handler = nop_handler,
139 .sa_flags = SA_NOCLDSTOP|SA_RESTART,
140 };
97c4f35c
LP
141 pid_t pid;
142
6f5e3f35 143 /* We want to wait for the core process, hence let's enable SIGCHLD */
abb26902 144 sigaction(SIGCHLD, &sa, NULL);
6f5e3f35 145
ee05e779 146 pid = raw_clone(SIGCHLD, NULL);
e62d8c39 147 if (pid < 0)
56f64d95 148 log_emergency_errno(errno, "Caught <%s>, cannot fork for core dump: %m", signal_to_string(sig));
97c4f35c
LP
149
150 else if (pid == 0) {
b92bea5d 151 struct rlimit rl = {};
97c4f35c
LP
152
153 /* Enable default signal handler for core dump */
154 zero(sa);
155 sa.sa_handler = SIG_DFL;
abb26902 156 sigaction(sig, &sa, NULL);
97c4f35c
LP
157
158 /* Don't limit the core dump size */
97c4f35c
LP
159 rl.rlim_cur = RLIM_INFINITY;
160 rl.rlim_max = RLIM_INFINITY;
161 setrlimit(RLIMIT_CORE, &rl);
162
163 /* Just to be sure... */
e62d9b81 164 (void) chdir("/");
97c4f35c
LP
165
166 /* Raise the signal again */
ee05e779
ZJS
167 pid = raw_getpid();
168 kill(pid, sig); /* raise() would kill the parent */
97c4f35c
LP
169
170 assert_not_reached("We shouldn't be here...");
171 _exit(1);
4fc935ca 172 } else {
8e12a6ae
LP
173 siginfo_t status;
174 int r;
4fc935ca
LP
175
176 /* Order things nicely. */
e62d8c39
ZJS
177 r = wait_for_terminate(pid, &status);
178 if (r < 0)
da927ba9 179 log_emergency_errno(r, "Caught <%s>, waitpid() failed: %m", signal_to_string(sig));
8e12a6ae 180 else if (status.si_code != CLD_DUMPED)
ee05e779
ZJS
181 log_emergency("Caught <%s>, core dump failed (child "PID_FMT", code=%s, status=%i/%s).",
182 signal_to_string(sig),
183 pid, sigchld_code_to_string(status.si_code),
184 status.si_status,
185 strna(status.si_code == CLD_EXITED
186 ? exit_status_to_string(status.si_status, EXIT_STATUS_FULL)
187 : signal_to_string(status.si_status)));
4fc935ca 188 else
4104970e 189 log_emergency("Caught <%s>, dumped core as pid "PID_FMT".", signal_to_string(sig), pid);
97c4f35c
LP
190 }
191 }
192
fa0f4d8a
LP
193 if (arg_crash_chvt)
194 chvt(arg_crash_chvt);
601f6a1e 195
fa0f4d8a 196 if (arg_crash_shell) {
b92bea5d
ZJS
197 struct sigaction sa = {
198 .sa_handler = SIG_IGN,
199 .sa_flags = SA_NOCLDSTOP|SA_NOCLDWAIT|SA_RESTART,
200 };
6f5e3f35 201 pid_t pid;
8c43883a 202
4fc935ca
LP
203 log_info("Executing crash shell in 10s...");
204 sleep(10);
205
6f5e3f35 206 /* Let the kernel reap children for us */
6f5e3f35 207 assert_se(sigaction(SIGCHLD, &sa, NULL) == 0);
8c43883a 208
ee05e779 209 pid = raw_clone(SIGCHLD, NULL);
cd3bd60a 210 if (pid < 0)
56f64d95 211 log_emergency_errno(errno, "Failed to fork off crash shell: %m");
6f5e3f35 212 else if (pid == 0) {
cd3bd60a 213 make_console_stdio();
ee05e779 214 execle("/bin/sh", "/bin/sh", NULL, environ);
6f5e3f35 215
ee05e779 216 log_emergency_errno(errno, "execle() failed: %m");
6f5e3f35 217 _exit(1);
ee05e779
ZJS
218 } else
219 log_info("Successfully spawned crash shell as PID "PID_FMT".", pid);
4fc935ca
LP
220 }
221
4104970e 222 log_emergency("Freezing execution.");
97c4f35c
LP
223 freeze();
224}
225
226static void install_crash_handler(void) {
297d563d 227 static const struct sigaction sa = {
b92bea5d 228 .sa_handler = crash,
297d563d 229 .sa_flags = SA_NODEFER, /* So that we can raise the signal again from the signal handler */
b92bea5d 230 };
297d563d 231 int r;
97c4f35c 232
297d563d
LP
233 /* We ignore the return value here, since, we don't mind if we
234 * cannot set up a crash handler */
235 r = sigaction_many(&sa, SIGNALS_CRASH_HANDLER, -1);
236 if (r < 0)
237 log_debug_errno(r, "I had trouble setting up the crash handler, ignoring: %m");
97c4f35c 238}
f170852a 239
56d96fc0
LP
240static int console_setup(void) {
241 _cleanup_close_ int tty_fd = -1;
242 int r;
80876c20 243
512947d4 244 tty_fd = open_terminal("/dev/console", O_WRONLY|O_NOCTTY|O_CLOEXEC);
23bbb0de
MS
245 if (tty_fd < 0)
246 return log_error_errno(tty_fd, "Failed to open /dev/console: %m");
80876c20 247
56d96fc0
LP
248 /* We don't want to force text mode. plymouth may be showing
249 * pictures already from initrd. */
512947d4 250 r = reset_terminal_fd(tty_fd, false);
23bbb0de
MS
251 if (r < 0)
252 return log_error_errno(r, "Failed to reset /dev/console: %m");
843d2643 253
56d96fc0 254 return 0;
80876c20
LP
255}
256
f170852a
LP
257static int set_default_unit(const char *u) {
258 char *c;
259
260 assert(u);
261
bf4df7c3
LP
262 c = strdup(u);
263 if (!c)
f170852a
LP
264 return -ENOMEM;
265
fa0f4d8a
LP
266 free(arg_default_unit);
267 arg_default_unit = c;
bf4df7c3 268
f170852a
LP
269 return 0;
270}
271
059cb385 272static int parse_proc_cmdline_item(const char *key, const char *value) {
f170852a
LP
273
274 static const char * const rlmap[] = {
ed370f5d 275 "emergency", SPECIAL_EMERGENCY_TARGET,
099663ff 276 "-b", SPECIAL_EMERGENCY_TARGET,
5329ab10 277 "rescue", SPECIAL_RESCUE_TARGET,
ed370f5d
LP
278 "single", SPECIAL_RESCUE_TARGET,
279 "-s", SPECIAL_RESCUE_TARGET,
280 "s", SPECIAL_RESCUE_TARGET,
281 "S", SPECIAL_RESCUE_TARGET,
282 "1", SPECIAL_RESCUE_TARGET,
d5d8429a
LP
283 "2", SPECIAL_MULTI_USER_TARGET,
284 "3", SPECIAL_MULTI_USER_TARGET,
285 "4", SPECIAL_MULTI_USER_TARGET,
286 "5", SPECIAL_GRAPHICAL_TARGET,
f170852a 287 };
059cb385 288 int r;
f170852a 289
059cb385 290 assert(key);
5192bd19 291
059cb385 292 if (streq(key, "systemd.unit") && value) {
bf4df7c3
LP
293
294 if (!in_initrd())
059cb385 295 return set_default_unit(value);
bf4df7c3 296
059cb385 297 } else if (streq(key, "rd.systemd.unit") && value) {
bf4df7c3 298
ca05941b
LP
299 if (in_initrd())
300 return set_default_unit(value);
f170852a 301
059cb385 302 } else if (streq(key, "systemd.dump_core") && value) {
4fc935ca 303
059cb385 304 r = parse_boolean(value);
fb472900 305 if (r < 0)
059cb385 306 log_warning("Failed to parse dump core switch %s. Ignoring.", value);
4fc935ca 307 else
fa0f4d8a 308 arg_dump_core = r;
4fc935ca 309
059cb385 310 } else if (streq(key, "systemd.crash_shell") && value) {
4fc935ca 311
059cb385 312 r = parse_boolean(value);
fb472900 313 if (r < 0)
059cb385 314 log_warning("Failed to parse crash shell switch %s. Ignoring.", value);
4fc935ca 315 else
fa0f4d8a 316 arg_crash_shell = r;
5e7ee61c 317
059cb385 318 } else if (streq(key, "systemd.crash_chvt") && value) {
5e7ee61c 319
059cb385
LP
320 if (safe_atoi(value, &r) < 0)
321 log_warning("Failed to parse crash chvt switch %s. Ignoring.", value);
5e7ee61c 322 else
059cb385 323 arg_crash_chvt = r;
5e7ee61c 324
059cb385 325 } else if (streq(key, "systemd.confirm_spawn") && value) {
601f6a1e 326
059cb385
LP
327 r = parse_boolean(value);
328 if (r < 0)
329 log_warning("Failed to parse confirm spawn switch %s. Ignoring.", value);
601f6a1e 330 else
059cb385 331 arg_confirm_spawn = r;
601f6a1e 332
059cb385 333 } else if (streq(key, "systemd.show_status") && value) {
9e58ff9c 334
059cb385 335 r = parse_show_status(value, &arg_show_status);
d450b6f2 336 if (r < 0)
059cb385
LP
337 log_warning("Failed to parse show status switch %s. Ignoring.", value);
338
339 } else if (streq(key, "systemd.default_standard_output") && value) {
0a494f1f 340
059cb385 341 r = exec_output_from_string(value);
fb472900 342 if (r < 0)
059cb385 343 log_warning("Failed to parse default standard output switch %s. Ignoring.", value);
0a494f1f
LP
344 else
345 arg_default_std_output = r;
0a494f1f 346
059cb385
LP
347 } else if (streq(key, "systemd.default_standard_error") && value) {
348
349 r = exec_output_from_string(value);
fb472900 350 if (r < 0)
059cb385 351 log_warning("Failed to parse default standard error switch %s. Ignoring.", value);
0a494f1f
LP
352 else
353 arg_default_std_error = r;
9e7c5357 354
059cb385
LP
355 } else if (streq(key, "systemd.setenv") && value) {
356
357 if (env_assignment_is_valid(value)) {
e21fea24
KS
358 char **env;
359
059cb385 360 env = strv_env_set(arg_default_environment, value);
e21fea24
KS
361 if (env)
362 arg_default_environment = env;
363 else
279d3c9c 364 log_warning_errno(ENOMEM, "Setting environment variable '%s' failed, ignoring: %m", value);
e21fea24 365 } else
059cb385 366 log_warning("Environment variable name '%s' is not valid. Ignoring.", value);
9e58ff9c 367
059cb385 368 } else if (streq(key, "quiet") && !value) {
d7b15e0a 369
b6e2f329 370 if (arg_show_status == _SHOW_STATUS_UNSET)
d450b6f2 371 arg_show_status = SHOW_STATUS_AUTO;
059cb385
LP
372
373 } else if (streq(key, "debug") && !value) {
d7b15e0a 374
1de1c9c3
LP
375 /* Note that log_parse_environment() handles 'debug'
376 * too, and sets the log level to LOG_DEBUG. */
d7b15e0a 377
75f86906 378 if (detect_container() > 0)
b2103dcc 379 log_set_target(LOG_TARGET_CONSOLE);
059cb385
LP
380
381 } else if (!in_initrd() && !value) {
f170852a
LP
382 unsigned i;
383
384 /* SysV compatibility */
f170852a 385 for (i = 0; i < ELEMENTSOF(rlmap); i += 2)
059cb385 386 if (streq(key, rlmap[i]))
f170852a
LP
387 return set_default_unit(rlmap[i+1]);
388 }
389
390 return 0;
391}
392
e8e581bf
ZJS
393#define DEFINE_SETTER(name, func, descr) \
394 static int name(const char *unit, \
395 const char *filename, \
396 unsigned line, \
397 const char *section, \
71a61510 398 unsigned section_line, \
e8e581bf
ZJS
399 const char *lvalue, \
400 int ltype, \
401 const char *rvalue, \
402 void *data, \
403 void *userdata) { \
404 \
405 int r; \
406 \
407 assert(filename); \
408 assert(lvalue); \
409 assert(rvalue); \
410 \
411 r = func(rvalue); \
412 if (r < 0) \
413 log_syntax(unit, LOG_ERR, filename, line, -r, \
414 "Invalid " descr "'%s': %s", \
415 rvalue, strerror(-r)); \
416 \
417 return 0; \
418 }
487393e9 419
e8e581bf
ZJS
420DEFINE_SETTER(config_parse_level2, log_set_max_level_from_string, "log level")
421DEFINE_SETTER(config_parse_target, log_set_target_from_string, "target")
422DEFINE_SETTER(config_parse_color, log_show_color_from_string, "color" )
423DEFINE_SETTER(config_parse_location, log_show_location_from_string, "location")
487393e9 424
4d7213b2
LP
425static int config_parse_cpu_affinity2(
426 const char *unit,
427 const char *filename,
428 unsigned line,
429 const char *section,
430 unsigned section_line,
431 const char *lvalue,
432 int ltype,
433 const char *rvalue,
434 void *data,
435 void *userdata) {
487393e9 436
4b40bc38 437 _cleanup_cpu_free_ cpu_set_t *c = NULL;
f5c72b73 438 int ncpus;
487393e9 439
f5c72b73 440 ncpus = parse_cpu_set(rvalue, &c, unit, filename, line, lvalue);
487393e9 441
f5c72b73
FB
442 if (ncpus < 0)
443 return ncpus;
487393e9 444
f5c72b73
FB
445 if (sched_setaffinity(0, CPU_ALLOC_SIZE(ncpus), c) < 0)
446 log_warning("Failed to set CPU affinity: %m");
487393e9 447
487393e9
LP
448 return 0;
449}
450
4d7213b2
LP
451static int config_parse_show_status(
452 const char* unit,
453 const char *filename,
454 unsigned line,
455 const char *section,
456 unsigned section_line,
457 const char *lvalue,
458 int ltype,
459 const char *rvalue,
460 void *data,
461 void *userdata) {
462
463 int k;
464 ShowStatus *b = data;
465
466 assert(filename);
467 assert(lvalue);
468 assert(rvalue);
469 assert(data);
470
471 k = parse_show_status(rvalue, b);
472 if (k < 0) {
473 log_syntax(unit, LOG_ERR, filename, line, -k,
474 "Failed to parse show status setting, ignoring: %s", rvalue);
475 return 0;
476 }
477
478 return 0;
479}
480
0c85a4f3
LP
/* Free a NULL-terminated array of string vectors: each element is
 * released with strv_free(), then the array itself. NULL is accepted
 * and ignored. */
static void strv_free_free(char ***l) {
        size_t idx;

        if (l == NULL)
                return;

        for (idx = 0; l[idx] != NULL; idx++)
                strv_free(l[idx]);

        free(l);
}
492
493static void free_join_controllers(void) {
0c85a4f3
LP
494 strv_free_free(arg_join_controllers);
495 arg_join_controllers = NULL;
496}
497
e8e581bf
ZJS
498static int config_parse_join_controllers(const char *unit,
499 const char *filename,
500 unsigned line,
501 const char *section,
71a61510 502 unsigned section_line,
e8e581bf
ZJS
503 const char *lvalue,
504 int ltype,
505 const char *rvalue,
506 void *data,
507 void *userdata) {
0c85a4f3 508
3875c85b 509 const char *whole_rvalue = rvalue;
0c85a4f3 510 unsigned n = 0;
0c85a4f3
LP
511
512 assert(filename);
513 assert(lvalue);
514 assert(rvalue);
515
516 free_join_controllers();
517
d4ebeb4f
FB
518 for (;;) {
519 _cleanup_free_ char *word = NULL;
520 char **l;
521 int r;
0c85a4f3 522
d4ebeb4f 523 r = extract_first_word(&rvalue, &word, WHITESPACE, EXTRACT_QUOTES);
3875c85b
FB
524 if (r < 0) {
525 log_syntax(unit, LOG_ERR, filename, line, r, "Invalid value for %s: %s", lvalue, whole_rvalue);
d4ebeb4f 526 return r;
3875c85b 527 }
d4ebeb4f
FB
528 if (r == 0)
529 break;
0c85a4f3 530
d4ebeb4f 531 l = strv_split(word, ",");
1592ec21
FB
532 if (!l)
533 log_oom();
0c85a4f3
LP
534 strv_uniq(l);
535
536 if (strv_length(l) <= 1) {
537 strv_free(l);
538 continue;
539 }
540
541 if (!arg_join_controllers) {
542 arg_join_controllers = new(char**, 2);
543 if (!arg_join_controllers) {
544 strv_free(l);
14212119 545 return log_oom();
0c85a4f3
LP
546 }
547
548 arg_join_controllers[0] = l;
549 arg_join_controllers[1] = NULL;
550
551 n = 1;
552 } else {
553 char ***a;
554 char ***t;
555
556 t = new0(char**, n+2);
557 if (!t) {
558 strv_free(l);
14212119 559 return log_oom();
0c85a4f3
LP
560 }
561
562 n = 0;
563
564 for (a = arg_join_controllers; *a; a++) {
565
566 if (strv_overlap(*a, l)) {
e3e45d4f 567 if (strv_extend_strv(&l, *a) < 0) {
0c85a4f3
LP
568 strv_free(l);
569 strv_free_free(t);
14212119 570 return log_oom();
0c85a4f3
LP
571 }
572
0c85a4f3
LP
573 } else {
574 char **c;
575
576 c = strv_copy(*a);
577 if (!c) {
578 strv_free(l);
579 strv_free_free(t);
14212119 580 return log_oom();
0c85a4f3
LP
581 }
582
583 t[n++] = c;
584 }
585 }
586
587 t[n++] = strv_uniq(l);
588
589 strv_free_free(arg_join_controllers);
590 arg_join_controllers = t;
591 }
592 }
d4ebeb4f 593 if (!isempty(rvalue))
b2fadec6
ZJS
594 log_syntax(unit, LOG_ERR, filename, line, EINVAL,
595 "Trailing garbage, ignoring.");
0c85a4f3
LP
596
597 return 0;
598}
599
487393e9
LP
600static int parse_config_file(void) {
601
f975e971 602 const ConfigTableItem items[] = {
d3b1c508
LP
603 { "Manager", "LogLevel", config_parse_level2, 0, NULL },
604 { "Manager", "LogTarget", config_parse_target, 0, NULL },
605 { "Manager", "LogColor", config_parse_color, 0, NULL },
606 { "Manager", "LogLocation", config_parse_location, 0, NULL },
607 { "Manager", "DumpCore", config_parse_bool, 0, &arg_dump_core },
608 { "Manager", "CrashShell", config_parse_bool, 0, &arg_crash_shell },
609 { "Manager", "ShowStatus", config_parse_show_status, 0, &arg_show_status },
610 { "Manager", "CrashChVT", config_parse_int, 0, &arg_crash_chvt },
611 { "Manager", "CPUAffinity", config_parse_cpu_affinity2, 0, NULL },
612 { "Manager", "JoinControllers", config_parse_join_controllers, 0, &arg_join_controllers },
613 { "Manager", "RuntimeWatchdogSec", config_parse_sec, 0, &arg_runtime_watchdog },
614 { "Manager", "ShutdownWatchdogSec", config_parse_sec, 0, &arg_shutdown_watchdog },
615 { "Manager", "CapabilityBoundingSet", config_parse_bounding_set, 0, &arg_capability_bounding_set_drop },
89fffa27 616#ifdef HAVE_SECCOMP
d3b1c508 617 { "Manager", "SystemCallArchitectures", config_parse_syscall_archs, 0, &arg_syscall_archs },
89fffa27 618#endif
d3b1c508 619 { "Manager", "TimerSlackNSec", config_parse_nsec, 0, &arg_timer_slack_nsec },
bd8f585b 620 { "Manager", "DefaultTimerAccuracySec", config_parse_sec, 0, &arg_default_timer_accuracy_usec },
d3b1c508
LP
621 { "Manager", "DefaultStandardOutput", config_parse_output, 0, &arg_default_std_output },
622 { "Manager", "DefaultStandardError", config_parse_output, 0, &arg_default_std_error },
623 { "Manager", "DefaultTimeoutStartSec", config_parse_sec, 0, &arg_default_timeout_start_usec },
624 { "Manager", "DefaultTimeoutStopSec", config_parse_sec, 0, &arg_default_timeout_stop_usec },
625 { "Manager", "DefaultRestartSec", config_parse_sec, 0, &arg_default_restart_usec },
626 { "Manager", "DefaultStartLimitInterval", config_parse_sec, 0, &arg_default_start_limit_interval },
627 { "Manager", "DefaultStartLimitBurst", config_parse_unsigned, 0, &arg_default_start_limit_burst },
628 { "Manager", "DefaultEnvironment", config_parse_environ, 0, &arg_default_environment },
629 { "Manager", "DefaultLimitCPU", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CPU] },
630 { "Manager", "DefaultLimitFSIZE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_FSIZE] },
631 { "Manager", "DefaultLimitDATA", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_DATA] },
632 { "Manager", "DefaultLimitSTACK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_STACK] },
633 { "Manager", "DefaultLimitCORE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_CORE] },
634 { "Manager", "DefaultLimitRSS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RSS] },
635 { "Manager", "DefaultLimitNOFILE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NOFILE] },
636 { "Manager", "DefaultLimitAS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_AS] },
637 { "Manager", "DefaultLimitNPROC", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NPROC] },
638 { "Manager", "DefaultLimitMEMLOCK", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MEMLOCK] },
639 { "Manager", "DefaultLimitLOCKS", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_LOCKS] },
640 { "Manager", "DefaultLimitSIGPENDING", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_SIGPENDING] },
641 { "Manager", "DefaultLimitMSGQUEUE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_MSGQUEUE] },
642 { "Manager", "DefaultLimitNICE", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_NICE] },
643 { "Manager", "DefaultLimitRTPRIO", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTPRIO] },
644 { "Manager", "DefaultLimitRTTIME", config_parse_limit, 0, &arg_default_rlimit[RLIMIT_RTTIME] },
085afe36
LP
645 { "Manager", "DefaultCPUAccounting", config_parse_bool, 0, &arg_default_cpu_accounting },
646 { "Manager", "DefaultBlockIOAccounting", config_parse_bool, 0, &arg_default_blockio_accounting },
647 { "Manager", "DefaultMemoryAccounting", config_parse_bool, 0, &arg_default_memory_accounting },
03a7b521 648 { "Manager", "DefaultTasksAccounting", config_parse_bool, 0, &arg_default_tasks_accounting },
d3b1c508 649 {}
487393e9
LP
650 };
651
1b907b5c 652 const char *fn, *conf_dirs_nulstr;
487393e9 653
b2c23da8
LP
654 fn = arg_running_as == MANAGER_SYSTEM ? PKGSYSCONFDIR "/system.conf" : PKGSYSCONFDIR "/user.conf";
655 conf_dirs_nulstr = arg_running_as == MANAGER_SYSTEM ? CONF_DIRS_NULSTR("systemd/system.conf") : CONF_DIRS_NULSTR("systemd/user.conf");
1b907b5c
JT
656 config_parse_many(fn, conf_dirs_nulstr, "Manager\0",
657 config_item_table_lookup, items, false, NULL);
487393e9 658
487393e9
LP
659 return 0;
660}
661
06af2a04
TB
662static void manager_set_defaults(Manager *m) {
663
664 assert(m);
665
666 m->default_timer_accuracy_usec = arg_default_timer_accuracy_usec;
667 m->default_std_output = arg_default_std_output;
668 m->default_std_error = arg_default_std_error;
669 m->default_timeout_start_usec = arg_default_timeout_start_usec;
670 m->default_timeout_stop_usec = arg_default_timeout_stop_usec;
671 m->default_restart_usec = arg_default_restart_usec;
672 m->default_start_limit_interval = arg_default_start_limit_interval;
673 m->default_start_limit_burst = arg_default_start_limit_burst;
674 m->default_cpu_accounting = arg_default_cpu_accounting;
675 m->default_blockio_accounting = arg_default_blockio_accounting;
676 m->default_memory_accounting = arg_default_memory_accounting;
03a7b521 677 m->default_tasks_accounting = arg_default_tasks_accounting;
06af2a04
TB
678
679 manager_set_default_rlimits(m, arg_default_rlimit);
680 manager_environment_add(m, NULL, arg_default_environment);
681}
682
f170852a
LP
683static int parse_argv(int argc, char *argv[]) {
684
685 enum {
686 ARG_LOG_LEVEL = 0x100,
687 ARG_LOG_TARGET,
bbe63281
LP
688 ARG_LOG_COLOR,
689 ARG_LOG_LOCATION,
2f198e2f 690 ARG_UNIT,
edb9aaa8 691 ARG_SYSTEM,
af2d49f7 692 ARG_USER,
e537352b 693 ARG_TEST,
b87c2aa6 694 ARG_NO_PAGER,
9ba0bc4e 695 ARG_VERSION,
80876c20 696 ARG_DUMP_CONFIGURATION_ITEMS,
9e58ff9c
LP
697 ARG_DUMP_CORE,
698 ARG_CRASH_SHELL,
a16e1123 699 ARG_CONFIRM_SPAWN,
9e58ff9c 700 ARG_SHOW_STATUS,
4288f619 701 ARG_DESERIALIZE,
2660882b 702 ARG_SWITCHED_ROOT,
0a494f1f
LP
703 ARG_DEFAULT_STD_OUTPUT,
704 ARG_DEFAULT_STD_ERROR
f170852a
LP
705 };
706
707 static const struct option options[] = {
a16e1123
LP
708 { "log-level", required_argument, NULL, ARG_LOG_LEVEL },
709 { "log-target", required_argument, NULL, ARG_LOG_TARGET },
bbe63281
LP
710 { "log-color", optional_argument, NULL, ARG_LOG_COLOR },
711 { "log-location", optional_argument, NULL, ARG_LOG_LOCATION },
2f198e2f 712 { "unit", required_argument, NULL, ARG_UNIT },
edb9aaa8 713 { "system", no_argument, NULL, ARG_SYSTEM },
af2d49f7 714 { "user", no_argument, NULL, ARG_USER },
a16e1123 715 { "test", no_argument, NULL, ARG_TEST },
b87c2aa6 716 { "no-pager", no_argument, NULL, ARG_NO_PAGER },
a16e1123 717 { "help", no_argument, NULL, 'h' },
9ba0bc4e 718 { "version", no_argument, NULL, ARG_VERSION },
a16e1123 719 { "dump-configuration-items", no_argument, NULL, ARG_DUMP_CONFIGURATION_ITEMS },
a5d87bf0
LP
720 { "dump-core", optional_argument, NULL, ARG_DUMP_CORE },
721 { "crash-shell", optional_argument, NULL, ARG_CRASH_SHELL },
722 { "confirm-spawn", optional_argument, NULL, ARG_CONFIRM_SPAWN },
6e98720f 723 { "show-status", optional_argument, NULL, ARG_SHOW_STATUS },
a16e1123 724 { "deserialize", required_argument, NULL, ARG_DESERIALIZE },
2660882b 725 { "switched-root", no_argument, NULL, ARG_SWITCHED_ROOT },
0a494f1f
LP
726 { "default-standard-output", required_argument, NULL, ARG_DEFAULT_STD_OUTPUT, },
727 { "default-standard-error", required_argument, NULL, ARG_DEFAULT_STD_ERROR, },
fb472900 728 {}
f170852a
LP
729 };
730
731 int c, r;
732
733 assert(argc >= 1);
734 assert(argv);
735
b770165a
LP
736 if (getpid() == 1)
737 opterr = 0;
738
099663ff 739 while ((c = getopt_long(argc, argv, "hDbsz:", options, NULL)) >= 0)
f170852a
LP
740
741 switch (c) {
742
743 case ARG_LOG_LEVEL:
fb472900
ZJS
744 r = log_set_max_level_from_string(optarg);
745 if (r < 0) {
f170852a
LP
746 log_error("Failed to parse log level %s.", optarg);
747 return r;
748 }
749
750 break;
751
752 case ARG_LOG_TARGET:
fb472900
ZJS
753 r = log_set_target_from_string(optarg);
754 if (r < 0) {
f170852a
LP
755 log_error("Failed to parse log target %s.", optarg);
756 return r;
757 }
758
759 break;
760
bbe63281
LP
761 case ARG_LOG_COLOR:
762
d0b170c8 763 if (optarg) {
fb472900
ZJS
764 r = log_show_color_from_string(optarg);
765 if (r < 0) {
d0b170c8
LP
766 log_error("Failed to parse log color setting %s.", optarg);
767 return r;
768 }
769 } else
770 log_show_color(true);
bbe63281
LP
771
772 break;
773
774 case ARG_LOG_LOCATION:
d0b170c8 775 if (optarg) {
fb472900
ZJS
776 r = log_show_location_from_string(optarg);
777 if (r < 0) {
d0b170c8
LP
778 log_error("Failed to parse log location setting %s.", optarg);
779 return r;
780 }
781 } else
782 log_show_location(true);
bbe63281
LP
783
784 break;
785
0a494f1f 786 case ARG_DEFAULT_STD_OUTPUT:
fb472900
ZJS
787 r = exec_output_from_string(optarg);
788 if (r < 0) {
0a494f1f
LP
789 log_error("Failed to parse default standard output setting %s.", optarg);
790 return r;
791 } else
792 arg_default_std_output = r;
793 break;
794
795 case ARG_DEFAULT_STD_ERROR:
fb472900
ZJS
796 r = exec_output_from_string(optarg);
797 if (r < 0) {
0a494f1f
LP
798 log_error("Failed to parse default standard error output setting %s.", optarg);
799 return r;
800 } else
801 arg_default_std_error = r;
802 break;
803
2f198e2f 804 case ARG_UNIT:
f170852a 805
fb472900 806 r = set_default_unit(optarg);
23bbb0de
MS
807 if (r < 0)
808 return log_error_errno(r, "Failed to set default unit %s: %m", optarg);
f170852a
LP
809
810 break;
811
edb9aaa8 812 case ARG_SYSTEM:
b2c23da8 813 arg_running_as = MANAGER_SYSTEM;
edb9aaa8 814 break;
a5dab5ce 815
af2d49f7 816 case ARG_USER:
b2c23da8 817 arg_running_as = MANAGER_USER;
a5dab5ce 818 break;
a5dab5ce 819
e965d56d 820 case ARG_TEST:
fa0f4d8a 821 arg_action = ACTION_TEST;
b87c2aa6
ZJS
822 if (arg_no_pager < 0)
823 arg_no_pager = true;
824 break;
825
826 case ARG_NO_PAGER:
827 arg_no_pager = true;
e965d56d
LP
828 break;
829
9ba0bc4e
ZJS
830 case ARG_VERSION:
831 arg_action = ACTION_VERSION;
832 break;
833
e537352b 834 case ARG_DUMP_CONFIGURATION_ITEMS:
fa0f4d8a 835 arg_action = ACTION_DUMP_CONFIGURATION_ITEMS;
e537352b
LP
836 break;
837
9e58ff9c 838 case ARG_DUMP_CORE:
a5d87bf0
LP
839 r = optarg ? parse_boolean(optarg) : 1;
840 if (r < 0) {
841 log_error("Failed to parse dump core boolean %s.", optarg);
842 return r;
843 }
844 arg_dump_core = r;
9e58ff9c
LP
845 break;
846
847 case ARG_CRASH_SHELL:
a5d87bf0
LP
848 r = optarg ? parse_boolean(optarg) : 1;
849 if (r < 0) {
850 log_error("Failed to parse crash shell boolean %s.", optarg);
851 return r;
852 }
853 arg_crash_shell = r;
9e58ff9c
LP
854 break;
855
80876c20 856 case ARG_CONFIRM_SPAWN:
a5d87bf0
LP
857 r = optarg ? parse_boolean(optarg) : 1;
858 if (r < 0) {
859 log_error("Failed to parse confirm spawn boolean %s.", optarg);
860 return r;
861 }
862 arg_confirm_spawn = r;
80876c20
LP
863 break;
864
9e58ff9c 865 case ARG_SHOW_STATUS:
d450b6f2
ZJS
866 if (optarg) {
867 r = parse_show_status(optarg, &arg_show_status);
868 if (r < 0) {
869 log_error("Failed to parse show status boolean %s.", optarg);
870 return r;
871 }
872 } else
873 arg_show_status = SHOW_STATUS_YES;
6e98720f 874 break;
a5d87bf0 875
a16e1123
LP
876 case ARG_DESERIALIZE: {
877 int fd;
878 FILE *f;
879
01e10de3
LP
880 r = safe_atoi(optarg, &fd);
881 if (r < 0 || fd < 0) {
a16e1123 882 log_error("Failed to parse deserialize option %s.", optarg);
01e10de3 883 return r < 0 ? r : -EINVAL;
a16e1123
LP
884 }
885
01e10de3
LP
886 fd_cloexec(fd, true);
887
888 f = fdopen(fd, "r");
4a62c710
MS
889 if (!f)
890 return log_error_errno(errno, "Failed to open serialization fd: %m");
a16e1123 891
74ca738f 892 safe_fclose(arg_serialization);
a16e1123 893
d3b1c508 894 arg_serialization = f;
a16e1123
LP
895
896 break;
897 }
898
2660882b 899 case ARG_SWITCHED_ROOT:
bf4df7c3 900 arg_switched_root = true;
d03bc1b8
HH
901 break;
902
f170852a 903 case 'h':
fa0f4d8a 904 arg_action = ACTION_HELP;
b87c2aa6
ZJS
905 if (arg_no_pager < 0)
906 arg_no_pager = true;
f170852a
LP
907 break;
908
1d2e23ab
LP
909 case 'D':
910 log_set_max_level(LOG_DEBUG);
911 break;
912
099663ff
LP
913 case 'b':
914 case 's':
915 case 'z':
916 /* Just to eat away the sysvinit kernel
917 * cmdline args without getopt() error
918 * messages that we'll parse in
919 * parse_proc_cmdline_word() or ignore. */
f170852a 920
099663ff 921 case '?':
601185b4 922 if (getpid() != 1)
099663ff 923 return -EINVAL;
601185b4
ZJS
924 else
925 return 0;
099663ff 926
601185b4
ZJS
927 default:
928 assert_not_reached("Unhandled option code.");
f170852a
LP
929 }
930
d821e6d6
LP
931 if (optind < argc && getpid() != 1) {
932 /* Hmm, when we aren't run as init system
933 * let's complain about excess arguments */
934
935 log_error("Excess arguments.");
936 return -EINVAL;
937 }
938
f170852a
LP
939 return 0;
940}
941
942static int help(void) {
943
2e33c433 944 printf("%s [OPTIONS...]\n\n"
af2d49f7 945 "Starts up and maintains the system or user services.\n\n"
e537352b 946 " -h --help Show this help\n"
e537352b 947 " --test Determine startup sequence, dump it and exit\n"
b87c2aa6 948 " --no-pager Do not pipe output into a pager\n"
80876c20 949 " --dump-configuration-items Dump understood unit configuration items\n"
9e58ff9c 950 " --unit=UNIT Set default unit\n"
edb9aaa8 951 " --system Run a system instance, even if PID != 1\n"
af2d49f7 952 " --user Run a user instance\n"
a5d87bf0
LP
953 " --dump-core[=0|1] Dump core on crash\n"
954 " --crash-shell[=0|1] Run shell on crash\n"
955 " --confirm-spawn[=0|1] Ask for confirmation when spawning processes\n"
6e98720f 956 " --show-status[=0|1] Show status updates on the console during bootup\n"
c1dc6153 957 " --log-target=TARGET Set log target (console, journal, kmsg, journal-or-kmsg, null)\n"
9e58ff9c 958 " --log-level=LEVEL Set log level (debug, info, notice, warning, err, crit, alert, emerg)\n"
2218198b 959 " --log-color[=0|1] Highlight important log messages\n"
0a494f1f
LP
960 " --log-location[=0|1] Include code location in log messages\n"
961 " --default-standard-output= Set default standard output for services\n"
962 " --default-standard-error= Set default standard error output for services\n",
5b6319dc 963 program_invocation_short_name);
f170852a
LP
964
965 return 0;
966}
967
9ba0bc4e
ZJS
968static int version(void) {
969 puts(PACKAGE_STRING);
9ba0bc4e
ZJS
970 puts(SYSTEMD_FEATURES);
971
972 return 0;
973}
974
b3680f49 975static int prepare_reexecute(Manager *m, FILE **_f, FDSet **_fds, bool switching_root) {
a16e1123
LP
976 FILE *f = NULL;
977 FDSet *fds = NULL;
978 int r;
979
980 assert(m);
981 assert(_f);
982 assert(_fds);
983
6b78f9b4
LP
984 r = manager_open_serialization(m, &f);
985 if (r < 0) {
da927ba9 986 log_error_errno(r, "Failed to create serialization file: %m");
a16e1123
LP
987 goto fail;
988 }
989
71445ae7
LP
990 /* Make sure nothing is really destructed when we shut down */
991 m->n_reloading ++;
718db961 992 bus_manager_send_reloading(m, true);
71445ae7 993
6b78f9b4
LP
994 fds = fdset_new();
995 if (!fds) {
a16e1123 996 r = -ENOMEM;
da927ba9 997 log_error_errno(r, "Failed to allocate fd set: %m");
a16e1123
LP
998 goto fail;
999 }
1000
b3680f49 1001 r = manager_serialize(m, f, fds, switching_root);
6b78f9b4 1002 if (r < 0) {
da927ba9 1003 log_error_errno(r, "Failed to serialize state: %m");
a16e1123
LP
1004 goto fail;
1005 }
1006
1007 if (fseeko(f, 0, SEEK_SET) < 0) {
56f64d95 1008 log_error_errno(errno, "Failed to rewind serialization fd: %m");
a16e1123
LP
1009 goto fail;
1010 }
1011
6b78f9b4
LP
1012 r = fd_cloexec(fileno(f), false);
1013 if (r < 0) {
da927ba9 1014 log_error_errno(r, "Failed to disable O_CLOEXEC for serialization: %m");
a16e1123
LP
1015 goto fail;
1016 }
1017
6b78f9b4
LP
1018 r = fdset_cloexec(fds, false);
1019 if (r < 0) {
da927ba9 1020 log_error_errno(r, "Failed to disable O_CLOEXEC for serialization fds: %m");
a16e1123
LP
1021 goto fail;
1022 }
1023
1024 *_f = f;
1025 *_fds = fds;
1026
1027 return 0;
1028
1029fail:
1030 fdset_free(fds);
1031
74ca738f 1032 safe_fclose(f);
a16e1123
LP
1033
1034 return r;
1035}
1036
4096d6f5
LP
1037static int bump_rlimit_nofile(struct rlimit *saved_rlimit) {
1038 struct rlimit nl;
1039 int r;
1040
1041 assert(saved_rlimit);
1042
1043 /* Save the original RLIMIT_NOFILE so that we can reset it
1044 * later when transitioning from the initrd to the main
1045 * systemd or suchlike. */
4a62c710
MS
1046 if (getrlimit(RLIMIT_NOFILE, saved_rlimit) < 0)
1047 return log_error_errno(errno, "Reading RLIMIT_NOFILE failed: %m");
4096d6f5
LP
1048
1049 /* Make sure forked processes get the default kernel setting */
1050 if (!arg_default_rlimit[RLIMIT_NOFILE]) {
1051 struct rlimit *rl;
1052
1053 rl = newdup(struct rlimit, saved_rlimit, 1);
1054 if (!rl)
1055 return log_oom();
1056
1057 arg_default_rlimit[RLIMIT_NOFILE] = rl;
1058 }
1059
1060 /* Bump up the resource limit for ourselves substantially */
1061 nl.rlim_cur = nl.rlim_max = 64*1024;
1062 r = setrlimit_closest(RLIMIT_NOFILE, &nl);
23bbb0de
MS
1063 if (r < 0)
1064 return log_error_errno(r, "Setting RLIMIT_NOFILE failed: %m");
4096d6f5
LP
1065
1066 return 0;
1067}
1068
6ee5bbf8 1069static void test_mtab(void) {
6ee5bbf8 1070
5b4c0131
LP
1071 static const char ok[] =
1072 "/proc/self/mounts\0"
1073 "/proc/mounts\0"
1074 "../proc/self/mounts\0"
1075 "../proc/mounts\0";
80758717 1076
5b4c0131
LP
1077 _cleanup_free_ char *p = NULL;
1078 int r;
6ee5bbf8 1079
5b4c0131
LP
1080 /* Check that /etc/mtab is a symlink to the right place or
1081 * non-existing. But certainly not a file, or a symlink to
1082 * some weird place... */
6ee5bbf8 1083
5b4c0131
LP
1084 r = readlink_malloc("/etc/mtab", &p);
1085 if (r == -ENOENT)
1086 return;
1087 if (r >= 0 && nulstr_contains(ok, p))
1088 return;
6ee5bbf8 1089
bcce7187
DM
1090 log_error("/etc/mtab is not a symlink or not pointing to /proc/self/mounts. "
1091 "This is not supported anymore. "
1092 "Please make sure to replace this file by a symlink to avoid incorrect or misleading mount(8) output.");
1093 freeze();
80758717
LP
1094}
1095
/* Logs a warning if /usr looks like an unmounted separate file system,
 * which is detected by dir_is_empty() reporting a positive result for
 * it. Errors and a populated directory are silently accepted. */
static void test_usr(void) {

        if (dir_is_empty("/usr") > 0)
                log_warning("/usr appears to be on its own filesystem and is not already mounted. This is not a supported setup. "
                            "Some things will probably break (sometimes even silently) in mysterious ways. "
                            "Consult http://freedesktop.org/wiki/Software/systemd/separate-usr-is-broken for more information.");
}
1107
a07fdfa3
LP
1108static int initialize_join_controllers(void) {
1109 /* By default, mount "cpu" + "cpuacct" together, and "net_cls"
1110 * + "net_prio". We'd like to add "cpuset" to the mix, but
f131770b 1111 * "cpuset" doesn't really work for groups with no initialized
a07fdfa3
LP
1112 * attributes. */
1113
1114 arg_join_controllers = new(char**, 3);
1115 if (!arg_join_controllers)
1116 return -ENOMEM;
1117
1118 arg_join_controllers[0] = strv_new("cpu", "cpuacct", NULL);
a07fdfa3 1119 arg_join_controllers[1] = strv_new("net_cls", "net_prio", NULL);
a6b26d90
ZJS
1120 arg_join_controllers[2] = NULL;
1121
1122 if (!arg_join_controllers[0] || !arg_join_controllers[1]) {
1123 free_join_controllers();
a07fdfa3 1124 return -ENOMEM;
a6b26d90 1125 }
a07fdfa3 1126
a07fdfa3
LP
1127 return 0;
1128}
1129
d3b1c508
LP
1130static int enforce_syscall_archs(Set *archs) {
1131#ifdef HAVE_SECCOMP
1132 scmp_filter_ctx *seccomp;
1133 Iterator i;
1134 void *id;
1135 int r;
1136
1137 seccomp = seccomp_init(SCMP_ACT_ALLOW);
1138 if (!seccomp)
1139 return log_oom();
1140
1141 SET_FOREACH(id, arg_syscall_archs, i) {
1142 r = seccomp_arch_add(seccomp, PTR_TO_UINT32(id) - 1);
1143 if (r == -EEXIST)
1144 continue;
1145 if (r < 0) {
da927ba9 1146 log_error_errno(r, "Failed to add architecture to seccomp: %m");
d3b1c508
LP
1147 goto finish;
1148 }
1149 }
1150
8a8bf3c0
LP
1151 r = seccomp_attr_set(seccomp, SCMP_FLTATR_CTL_NNP, 0);
1152 if (r < 0) {
da927ba9 1153 log_error_errno(r, "Failed to unset NO_NEW_PRIVS: %m");
8a8bf3c0
LP
1154 goto finish;
1155 }
1156
d3b1c508
LP
1157 r = seccomp_load(seccomp);
1158 if (r < 0)
da927ba9 1159 log_error_errno(r, "Failed to add install architecture seccomp: %m");
d3b1c508
LP
1160
1161finish:
1162 seccomp_release(seccomp);
1163 return r;
1164#else
1165 return 0;
1166#endif
1167}
1168
b6e2f329
LP
1169static int status_welcome(void) {
1170 _cleanup_free_ char *pretty_name = NULL, *ansi_color = NULL;
1171 int r;
1172
1173 r = parse_env_file("/etc/os-release", NEWLINE,
1174 "PRETTY_NAME", &pretty_name,
1175 "ANSI_COLOR", &ansi_color,
1176 NULL);
ece174c5 1177 if (r == -ENOENT)
5ae4d543
LP
1178 r = parse_env_file("/usr/lib/os-release", NEWLINE,
1179 "PRETTY_NAME", &pretty_name,
1180 "ANSI_COLOR", &ansi_color,
1181 NULL);
b6e2f329
LP
1182
1183 if (r < 0 && r != -ENOENT)
da927ba9 1184 log_warning_errno(r, "Failed to read os-release file: %m");
b6e2f329
LP
1185
1186 return status_printf(NULL, false, false,
1187 "\nWelcome to \x1B[%sm%s\x1B[0m!\n",
1188 isempty(ansi_color) ? "1" : ansi_color,
1189 isempty(pretty_name) ? "Linux" : pretty_name);
1190}
1191
fdd25311
LP
1192static int write_container_id(void) {
1193 const char *c;
1194
1195 c = getenv("container");
1196 if (isempty(c))
1197 return 0;
1198
4c1fc3e4 1199 return write_string_file("/run/systemd/container", c, WRITE_STRING_FILE_CREATE);
fdd25311
LP
1200}
1201
60918275
LP
1202int main(int argc, char *argv[]) {
1203 Manager *m = NULL;
22f4096c 1204 int r, retval = EXIT_FAILURE;
9d76d730
LP
1205 usec_t before_startup, after_startup;
1206 char timespan[FORMAT_TIMESPAN_MAX];
a16e1123
LP
1207 FDSet *fds = NULL;
1208 bool reexecute = false;
b9080b03 1209 const char *shutdown_verb = NULL;
86caf095
LP
1210 dual_timestamp initrd_timestamp = DUAL_TIMESTAMP_NULL;
1211 dual_timestamp userspace_timestamp = DUAL_TIMESTAMP_NULL;
1212 dual_timestamp kernel_timestamp = DUAL_TIMESTAMP_NULL;
1213 dual_timestamp security_start_timestamp = DUAL_TIMESTAMP_NULL;
1214 dual_timestamp security_finish_timestamp = DUAL_TIMESTAMP_NULL;
5d6b1584 1215 static char systemd[] = "systemd";
2660882b 1216 bool skip_setup = false;
d3b1c508 1217 unsigned j;
0b3325e7 1218 bool loaded_policy = false;
e96d6be7 1219 bool arm_reboot_watchdog = false;
bf4df7c3 1220 bool queue_default_job = false;
5f5c2f38 1221 bool empty_etc = false;
41669317 1222 char *switch_root_dir = NULL, *switch_root_init = NULL;
86caf095 1223 struct rlimit saved_rlimit_nofile = RLIMIT_MAKE_CONST(0);
cb6531be 1224 const char *error_message = NULL;
287419c1 1225 uint8_t shutdown_exit_code = 0;
27b14a22 1226
058dc6f3 1227#ifdef HAVE_SYSV_COMPAT
2cb1a60d 1228 if (getpid() != 1 && strstr(program_invocation_short_name, "init")) {
35b8ca3a 1229 /* This is compatibility support for SysV, where
2cb1a60d
LP
1230 * calling init as a user is identical to telinit. */
1231
1232 errno = -ENOENT;
1233 execv(SYSTEMCTL_BINARY_PATH, argv);
56f64d95 1234 log_error_errno(errno, "Failed to exec " SYSTEMCTL_BINARY_PATH ": %m");
2cb1a60d
LP
1235 return 1;
1236 }
058dc6f3 1237#endif
2cb1a60d 1238
c3a170f3
HH
1239 dual_timestamp_from_monotonic(&kernel_timestamp, 0);
1240 dual_timestamp_get(&userspace_timestamp);
1241
0b3325e7
LP
1242 /* Determine if this is a reexecution or normal bootup. We do
1243 * the full command line parsing much later, so let's just
1244 * have a quick peek here. */
db813c2a
LP
1245 if (strv_find(argv+1, "--deserialize"))
1246 skip_setup = true;
0b3325e7 1247
2660882b
LP
1248 /* If we have switched root, do all the special setup
1249 * things */
db813c2a
LP
1250 if (strv_find(argv+1, "--switched-root"))
1251 skip_setup = false;
d03bc1b8 1252
f3b6a3ed
LP
1253 /* If we get started via the /sbin/init symlink then we are
1254 called 'init'. After a subsequent reexecution we are then
1255 called 'systemd'. That is confusing, hence let's call us
1256 systemd right-away. */
f3b6a3ed
LP
1257 program_invocation_short_name = systemd;
1258 prctl(PR_SET_NAME, systemd);
5d6b1584 1259
9a0e6896
LP
1260 saved_argv = argv;
1261 saved_argc = argc;
f3b6a3ed 1262
2cc59dbf 1263 log_show_color(isatty(STDERR_FILENO) > 0);
c1dc6153 1264 log_set_upgrade_syslog_to_journal(true);
bbe63281 1265
90dc8c2e
MG
1266 /* Disable the umask logic */
1267 if (getpid() == 1)
1268 umask(0);
1269
75f86906 1270 if (getpid() == 1 && detect_container() <= 0) {
4f8d551f 1271
a866073d 1272 /* Running outside of a container as PID 1 */
b2c23da8 1273 arg_running_as = MANAGER_SYSTEM;
a866073d
LP
1274 make_null_stdio();
1275 log_set_target(LOG_TARGET_KMSG);
1276 log_open();
1277
21bf2ab0 1278 if (in_initrd())
c3a170f3 1279 initrd_timestamp = userspace_timestamp;
c3ba6250 1280
2660882b 1281 if (!skip_setup) {
8f838d8a 1282 mount_setup_early();
c2e0d600 1283 dual_timestamp_get(&security_start_timestamp);
cb6531be
ZJS
1284 if (mac_selinux_setup(&loaded_policy) < 0) {
1285 error_message = "Failed to load SELinux policy";
0b3325e7 1286 goto finish;
cb6531be
ZJS
1287 } else if (ima_setup() < 0) {
1288 error_message = "Failed to load IMA policy";
81611586 1289 goto finish;
cb6531be
ZJS
1290 } else if (mac_smack_setup(&loaded_policy) < 0) {
1291 error_message = "Failed to load SMACK policy";
ffbd2c4d 1292 goto finish;
cb6531be 1293 }
c2e0d600 1294 dual_timestamp_get(&security_finish_timestamp);
81611586 1295 }
0b3325e7 1296
cb6531be
ZJS
1297 if (mac_selinux_init(NULL) < 0) {
1298 error_message = "Failed to initialize SELinux policy";
0ff4cdd9 1299 goto finish;
cb6531be 1300 }
7948c4df 1301
72edcff5 1302 if (!skip_setup) {
24efb112 1303 if (clock_is_localtime() > 0) {
0b3325e7 1304 int min;
7948c4df 1305
c264aeab
KS
1306 /*
1307 * The very first call of settimeofday() also does a time warp in the kernel.
1308 *
1309 * In the rtc-in-local time mode, we set the kernel's timezone, and rely on
1310 * external tools to take care of maintaining the RTC and do all adjustments.
1311 * This matches the behavior of Windows, which leaves the RTC alone if the
1312 * registry tells that the RTC runs in UTC.
1313 */
24efb112 1314 r = clock_set_timezone(&min);
0b3325e7 1315 if (r < 0)
da927ba9 1316 log_error_errno(r, "Failed to apply local time delta, ignoring: %m");
0b3325e7
LP
1317 else
1318 log_info("RTC configured in localtime, applying delta of %i minutes to system time.", min);
19e65613
KS
1319 } else if (!in_initrd()) {
1320 /*
c264aeab 1321 * Do a dummy very first call to seal the kernel's time warp magic.
19e65613
KS
1322 *
1323 * Do not call this this from inside the initrd. The initrd might not
1324 * carry /etc/adjtime with LOCAL, but the real system could be set up
1325 * that way. In such case, we need to delay the time-warp or the sealing
1326 * until we reach the real system.
c264aeab
KS
1327 *
1328 * Do no set the kernel's timezone. The concept of local time cannot
1329 * be supported reliably, the time will jump or be incorrect at every daylight
1330 * saving time change. All kernel local time concepts will be treated
1331 * as UTC that way.
19e65613 1332 */
c264aeab 1333 clock_reset_timewarp();
72edcff5
KS
1334 }
1335 }
a866073d
LP
1336
1337 /* Set the default for later on, but don't actually
1338 * open the logs like this for now. Note that if we
1339 * are transitioning from the initrd there might still
1340 * be journal fd open, and we shouldn't attempt
1341 * opening that before we parsed /proc/cmdline which
1342 * might redirect output elsewhere. */
1343 log_set_target(LOG_TARGET_JOURNAL_OR_KMSG);
1344
1345 } else if (getpid() == 1) {
a866073d 1346 /* Running inside a container, as PID 1 */
b2c23da8 1347 arg_running_as = MANAGER_SYSTEM;
a866073d 1348 log_set_target(LOG_TARGET_CONSOLE);
99f09825 1349 log_close_console(); /* force reopen of /dev/console */
a866073d
LP
1350 log_open();
1351
1352 /* For the later on, see above... */
1353 log_set_target(LOG_TARGET_JOURNAL);
1354
c3a170f3
HH
1355 /* clear the kernel timestamp,
1356 * because we are in a container */
1357 kernel_timestamp.monotonic = 0ULL;
1358 kernel_timestamp.realtime = 0ULL;
a866073d 1359
c3a170f3 1360 } else {
a866073d 1361 /* Running as user instance */
b2c23da8 1362 arg_running_as = MANAGER_USER;
eeecf6e6 1363 log_set_target(LOG_TARGET_AUTO);
871e5809 1364 log_open();
c3a170f3
HH
1365
1366 /* clear the kernel timestamp,
1367 * because we are not PID 1 */
6513d561 1368 kernel_timestamp = DUAL_TIMESTAMP_NULL;
bbe63281 1369 }
a5dab5ce 1370
0c85a4f3 1371 /* Initialize default unit */
6afa301b
LP
1372 r = set_default_unit(SPECIAL_DEFAULT_TARGET);
1373 if (r < 0) {
da927ba9 1374 log_emergency_errno(r, "Failed to set default unit %s: %m", SPECIAL_DEFAULT_TARGET);
cb6531be 1375 error_message = "Failed to set default unit";
f170852a 1376 goto finish;
14212119 1377 }
60918275 1378
a07fdfa3 1379 r = initialize_join_controllers();
cb6531be 1380 if (r < 0) {
ff9b60f3 1381 error_message = "Failed to initialize cgroup controllers";
0c85a4f3 1382 goto finish;
cb6531be 1383 }
0c85a4f3 1384
f170852a
LP
1385 /* Mount /proc, /sys and friends, so that /proc/cmdline and
1386 * /proc/$PID/fd is available. */
c1dae1b3 1387 if (getpid() == 1) {
f84f9974
LP
1388
1389 /* Load the kernel modules early, so that we kdbus.ko is loaded before kdbusfs shall be mounted */
2e75e2a8
DM
1390 if (!skip_setup)
1391 kmod_setup();
2e75e2a8 1392
0c85a4f3 1393 r = mount_setup(loaded_policy);
cb6531be
ZJS
1394 if (r < 0) {
1395 error_message = "Failed to mount API filesystems";
8efe3c01 1396 goto finish;
cb6531be 1397 }
0c85a4f3 1398 }
4ade7963
LP
1399
1400 /* Reset all signal handlers. */
ce30c8dc
LP
1401 (void) reset_all_signal_handlers();
1402 (void) ignore_signals(SIGNALS_IGNORE, -1);
078e4539 1403
cb6531be
ZJS
1404 if (parse_config_file() < 0) {
1405 error_message = "Failed to parse config file";
487393e9 1406 goto finish;
cb6531be 1407 }
487393e9 1408
b2c23da8 1409 if (arg_running_as == MANAGER_SYSTEM) {
b5884878
LP
1410 r = parse_proc_cmdline(parse_proc_cmdline_item);
1411 if (r < 0)
da927ba9 1412 log_warning_errno(r, "Failed to parse kernel command line, ignoring: %m");
b5884878 1413 }
f170852a 1414
1de1c9c3
LP
1415 /* Note that this also parses bits from the kernel command
1416 * line, including "debug". */
f170852a
LP
1417 log_parse_environment();
1418
cb6531be
ZJS
1419 if (parse_argv(argc, argv) < 0) {
1420 error_message = "Failed to parse commandline arguments";
f170852a 1421 goto finish;
cb6531be 1422 }
f170852a 1423
6bae23a0
TB
1424 if (arg_action == ACTION_TEST &&
1425 geteuid() == 0) {
b5c6cf87
LP
1426 log_error("Don't run test mode as root.");
1427 goto finish;
1428 }
1429
b2c23da8 1430 if (arg_running_as == MANAGER_USER &&
6bae23a0
TB
1431 arg_action == ACTION_RUN &&
1432 sd_booted() <= 0) {
1433 log_error("Trying to run as user instance, but the system has not been booted with systemd.");
1434 goto finish;
1435 }
1436
b2c23da8 1437 if (arg_running_as == MANAGER_SYSTEM &&
fe783b03
LP
1438 arg_action == ACTION_RUN &&
1439 running_in_chroot() > 0) {
1440 log_error("Cannot be run in a chroot() environment.");
1441 goto finish;
1442 }
1443
0d8c31ff
ZJS
1444 if (arg_action == ACTION_TEST)
1445 skip_setup = true;
1446
b87c2aa6
ZJS
1447 pager_open_if_enabled();
1448
fa0f4d8a 1449 if (arg_action == ACTION_HELP) {
f170852a
LP
1450 retval = help();
1451 goto finish;
9ba0bc4e
ZJS
1452 } else if (arg_action == ACTION_VERSION) {
1453 retval = version();
1454 goto finish;
fa0f4d8a 1455 } else if (arg_action == ACTION_DUMP_CONFIGURATION_ITEMS) {
e537352b 1456 unit_dump_config_items(stdout);
22f4096c 1457 retval = EXIT_SUCCESS;
e537352b 1458 goto finish;
fa0f4d8a 1459 } else if (arg_action == ACTION_DONE) {
22f4096c 1460 retval = EXIT_SUCCESS;
4288f619 1461 goto finish;
f170852a
LP
1462 }
1463
b2c23da8 1464 if (arg_running_as == MANAGER_USER &&
8be28fb1
KS
1465 !getenv("XDG_RUNTIME_DIR")) {
1466 log_error("Trying to run as user instance, but $XDG_RUNTIME_DIR is not set.");
1467 goto finish;
1468 }
1469
fa0f4d8a 1470 assert_se(arg_action == ACTION_RUN || arg_action == ACTION_TEST);
f170852a 1471
871e5809
LP
1472 /* Close logging fds, in order not to confuse fdset below */
1473 log_close();
1474
a16e1123 1475 /* Remember open file descriptors for later deserialization */
01e10de3
LP
1476 r = fdset_new_fill(&fds);
1477 if (r < 0) {
da927ba9 1478 log_emergency_errno(r, "Failed to allocate fd set: %m");
cb6531be 1479 error_message = "Failed to allocate fd set";
01e10de3
LP
1480 goto finish;
1481 } else
1482 fdset_cloexec(fds, true);
a16e1123 1483
d3b1c508
LP
1484 if (arg_serialization)
1485 assert_se(fdset_remove(fds, fileno(arg_serialization)) >= 0);
a16e1123 1486
b2c23da8 1487 if (arg_running_as == MANAGER_SYSTEM)
80876c20
LP
1488 /* Become a session leader if we aren't one yet. */
1489 setsid();
4ade7963 1490
befb5b6a 1491 /* Move out of the way, so that we won't block unmounts */
d250afe7 1492 assert_se(chdir("/") == 0);
befb5b6a 1493
2146621b
LP
1494 /* Reset the console, but only if this is really init and we
1495 * are freshly booted */
b2c23da8 1496 if (arg_running_as == MANAGER_SYSTEM && arg_action == ACTION_RUN) {
56d96fc0
LP
1497
1498 /* If we are init, we connect stdin/stdout/stderr to
1499 * /dev/null and make sure we don't have a controlling
1500 * tty. */
1501 release_terminal();
1502
1503 if (getpid() == 1 && !skip_setup)
1504 console_setup();
1505 }
4ade7963 1506
18149b9f 1507 /* Open the logging devices, if possible and necessary */
843d2643 1508 log_open();
4ade7963 1509
b6e2f329
LP
1510 if (arg_show_status == _SHOW_STATUS_UNSET)
1511 arg_show_status = SHOW_STATUS_YES;
1512
5373d602
LP
1513 /* Make sure we leave a core dump without panicing the
1514 * kernel. */
ab422445 1515 if (getpid() == 1) {
4fc935ca 1516 install_crash_handler();
97c4f35c 1517
0c85a4f3
LP
1518 r = mount_cgroup_controllers(arg_join_controllers);
1519 if (r < 0)
1520 goto finish;
1521 }
1522
b2c23da8 1523 if (arg_running_as == MANAGER_SYSTEM) {
75f86906 1524 int v;
c20f5ac7 1525
0d8c31ff
ZJS
1526 log_info(PACKAGE_STRING " running in %ssystem mode. (" SYSTEMD_FEATURES ")",
1527 arg_action == ACTION_TEST ? "test " : "" );
c20f5ac7 1528
75f86906
LP
1529 v = detect_virtualization();
1530 if (v > 0)
1531 log_info("Detected virtualization %s.", virtualization_to_string(v));
c20f5ac7 1532
fdd25311
LP
1533 write_container_id();
1534
d3f86679 1535 log_info("Detected architecture %s.", architecture_to_string(uname_architecture()));
d9d93745 1536
26a1efdf
LP
1537 if (in_initrd())
1538 log_info("Running in initial RAM disk.");
1539
3408ba01
LP
1540 /* Let's check whether /etc is already populated. We
1541 * don't actually really check for that, but use
1542 * /etc/machine-id as flag file. This allows container
1543 * managers and installers to provision a couple of
1544 * files already. If the container manager wants to
1545 * provision the machine ID itself it should pass
ee33e53a 1546 * $container_uuid to PID 1. */
3408ba01 1547
baa1bdf7 1548 empty_etc = access("/etc/machine-id", F_OK) < 0;
5f5c2f38
LP
1549 if (empty_etc)
1550 log_info("Running with unpopulated /etc.");
d8160f21 1551 } else {
1f97091d
LP
1552 _cleanup_free_ char *t;
1553
1554 t = uid_to_name(getuid());
0d8c31ff
ZJS
1555 log_debug(PACKAGE_STRING " running in %suser mode for user "UID_FMT"/%s. (" SYSTEMD_FEATURES ")",
1556 arg_action == ACTION_TEST ? " test" : "", getuid(), t);
d8160f21 1557 }
a5dab5ce 1558
b2c23da8 1559 if (arg_running_as == MANAGER_SYSTEM && !skip_setup) {
031886ed 1560 if (arg_show_status > 0)
888c6216
LP
1561 status_welcome();
1562
888c6216 1563 hostname_setup();
489388fb 1564 machine_id_setup(NULL);
888c6216 1565 loopback_setup();
490aed58 1566
6ee5bbf8 1567 test_mtab();
80758717 1568 test_usr();
af5bc85d 1569 }
302e8c4c 1570
b2c23da8 1571 if (arg_running_as == MANAGER_SYSTEM && arg_runtime_watchdog > 0)
e96d6be7
LP
1572 watchdog_set_timeout(&arg_runtime_watchdog);
1573
3a43da28 1574 if (arg_timer_slack_nsec != NSEC_INFINITY)
aa0f64ac 1575 if (prctl(PR_SET_TIMERSLACK, arg_timer_slack_nsec) < 0)
56f64d95 1576 log_error_errno(errno, "Failed to adjust timer slack: %m");
aa0f64ac 1577
ec8927ca 1578 if (arg_capability_bounding_set_drop) {
31c885e9 1579 r = capability_bounding_set_drop_usermode(arg_capability_bounding_set_drop);
ec8927ca 1580 if (r < 0) {
da927ba9 1581 log_emergency_errno(r, "Failed to drop capability bounding set of usermode helpers: %m");
cb6531be 1582 error_message = "Failed to drop capability bounding set of usermode helpers";
ec8927ca
LP
1583 goto finish;
1584 }
31c885e9 1585 r = capability_bounding_set_drop(arg_capability_bounding_set_drop, true);
939b8f14 1586 if (r < 0) {
da927ba9 1587 log_emergency_errno(r, "Failed to drop capability bounding set: %m");
cb6531be 1588 error_message = "Failed to drop capability bounding set";
939b8f14
LP
1589 goto finish;
1590 }
ec8927ca
LP
1591 }
1592
d3b1c508
LP
1593 if (arg_syscall_archs) {
1594 r = enforce_syscall_archs(arg_syscall_archs);
cb6531be
ZJS
1595 if (r < 0) {
1596 error_message = "Failed to set syscall architectures";
d3b1c508 1597 goto finish;
cb6531be 1598 }
d3b1c508
LP
1599 }
1600
61b9b203 1601 if (arg_running_as == MANAGER_USER)
d4447f4d 1602 /* Become reaper of our children */
61b9b203 1603 if (prctl(PR_SET_CHILD_SUBREAPER, 1) < 0)
56f64d95 1604 log_warning_errno(errno, "Failed to make us a subreaper: %m");
d4447f4d 1605
b2c23da8 1606 if (arg_running_as == MANAGER_SYSTEM) {
4096d6f5
LP
1607 bump_rlimit_nofile(&saved_rlimit_nofile);
1608
5f5c2f38 1609 if (empty_etc) {
304b3079 1610 r = unit_file_preset_all(UNIT_FILE_SYSTEM, false, NULL, UNIT_FILE_PRESET_ENABLE_ONLY, false, NULL, 0);
5f5c2f38 1611 if (r < 0)
da927ba9 1612 log_warning_errno(r, "Failed to populate /etc with preset unit settings, ignoring: %m");
5f5c2f38
LP
1613 else
1614 log_info("Populated /etc with preset unit settings.");
1615 }
1616 }
1617
0d8c31ff 1618 r = manager_new(arg_running_as, arg_action == ACTION_TEST, &m);
e96d6be7 1619 if (r < 0) {
da927ba9 1620 log_emergency_errno(r, "Failed to allocate manager object: %m");
cb6531be 1621 error_message = "Failed to allocate manager object";
60918275
LP
1622 goto finish;
1623 }
1624
9e58ff9c 1625 m->confirm_spawn = arg_confirm_spawn;
e96d6be7
LP
1626 m->runtime_watchdog = arg_runtime_watchdog;
1627 m->shutdown_watchdog = arg_shutdown_watchdog;
c3a170f3
HH
1628 m->userspace_timestamp = userspace_timestamp;
1629 m->kernel_timestamp = kernel_timestamp;
c3a170f3 1630 m->initrd_timestamp = initrd_timestamp;
c2e0d600
TA
1631 m->security_start_timestamp = security_start_timestamp;
1632 m->security_finish_timestamp = security_finish_timestamp;
9e58ff9c 1633
06af2a04 1634 manager_set_defaults(m);
27d340c7 1635 manager_set_show_status(m, arg_show_status);
e2680723 1636 manager_set_first_boot(m, empty_etc);
27d340c7 1637
bf4df7c3 1638 /* Remember whether we should queue the default job */
d3b1c508 1639 queue_default_job = !arg_serialization || arg_switched_root;
bf4df7c3 1640
9d76d730
LP
1641 before_startup = now(CLOCK_MONOTONIC);
1642
d3b1c508 1643 r = manager_startup(m, arg_serialization, fds);
e96d6be7 1644 if (r < 0)
da927ba9 1645 log_error_errno(r, "Failed to fully start up daemon: %m");
a16e1123 1646
bf4df7c3
LP
1647 /* This will close all file descriptors that were opened, but
1648 * not claimed by any unit. */
01e10de3 1649 fdset_free(fds);
6c081276 1650 fds = NULL;
f50e0a01 1651
74ca738f 1652 arg_serialization = safe_fclose(arg_serialization);
bf4df7c3
LP
1653
1654 if (queue_default_job) {
718db961 1655 _cleanup_bus_error_free_ sd_bus_error error = SD_BUS_ERROR_NULL;
1c27d3f3 1656 Unit *target = NULL;
bacbccb7 1657 Job *default_unit_job;
398ef8ba 1658
fa0f4d8a 1659 log_debug("Activating default unit: %s", arg_default_unit);
a16e1123 1660
e96d6be7 1661 r = manager_load_unit(m, arg_default_unit, NULL, &error, &target);
718db961
LP
1662 if (r < 0)
1663 log_error("Failed to load default target: %s", bus_error_message(&error, r));
1664 else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND)
c33b3297 1665 log_error_errno(target->load_error, "Failed to load default target: %m");
ac155bb8 1666 else if (target->load_state == UNIT_MASKED)
6daf4f90 1667 log_error("Default target masked.");
27b14a22 1668
ac155bb8 1669 if (!target || target->load_state != UNIT_LOADED) {
a16e1123 1670 log_info("Trying to load rescue target...");
1c27d3f3 1671
e96d6be7
LP
1672 r = manager_load_unit(m, SPECIAL_RESCUE_TARGET, NULL, &error, &target);
1673 if (r < 0) {
4104970e 1674 log_emergency("Failed to load rescue target: %s", bus_error_message(&error, r));
cb6531be 1675 error_message = "Failed to load rescue target";
a16e1123 1676 goto finish;
11ddb6f4 1677 } else if (target->load_state == UNIT_ERROR || target->load_state == UNIT_NOT_FOUND) {
c33b3297 1678 log_emergency_errno(target->load_error, "Failed to load rescue target: %m");
cb6531be 1679 error_message = "Failed to load rescue target";
1c27d3f3 1680 goto finish;
ac155bb8 1681 } else if (target->load_state == UNIT_MASKED) {
4104970e 1682 log_emergency("Rescue target masked.");
cb6531be 1683 error_message = "Rescue target masked";
00dc5d76 1684 goto finish;
a16e1123
LP
1685 }
1686 }
37d88da7 1687
ac155bb8 1688 assert(target->load_state == UNIT_LOADED);
00dc5d76 1689
fa0f4d8a 1690 if (arg_action == ACTION_TEST) {
40d50879 1691 printf("-> By units:\n");
a16e1123
LP
1692 manager_dump_units(m, stdout, "\t");
1693 }
1694
95f1b47d 1695 r = manager_add_job(m, JOB_START, target, JOB_ISOLATE, false, &error, &default_unit_job);
ab17a050 1696 if (r == -EPERM) {
718db961 1697 log_debug("Default target could not be isolated, starting instead: %s", bus_error_message(&error, r));
ab17a050
LP
1698
1699 r = manager_add_job(m, JOB_START, target, JOB_REPLACE, false, &error, &default_unit_job);
1700 if (r < 0) {
4104970e 1701 log_emergency("Failed to start default target: %s", bus_error_message(&error, r));
cb6531be 1702 error_message = "Failed to start default target";
ab17a050
LP
1703 goto finish;
1704 }
1705 } else if (r < 0) {
4104970e 1706 log_emergency("Failed to isolate default target: %s", bus_error_message(&error, r));
cb6531be 1707 error_message = "Failed to isolate default target";
37d88da7
LP
1708 goto finish;
1709 }
ab17a050 1710
bacbccb7 1711 m->default_unit_job_id = default_unit_job->id;
60918275 1712
07672f49
LP
1713 after_startup = now(CLOCK_MONOTONIC);
1714 log_full(arg_action == ACTION_TEST ? LOG_INFO : LOG_DEBUG,
1715 "Loaded units and determined initial transaction in %s.",
fdb14b7e 1716 format_timespan(timespan, sizeof(timespan), after_startup - before_startup, 100 * USEC_PER_MSEC));
07672f49 1717
fa0f4d8a 1718 if (arg_action == ACTION_TEST) {
40d50879 1719 printf("-> By jobs:\n");
a16e1123 1720 manager_dump_jobs(m, stdout, "\t");
22f4096c 1721 retval = EXIT_SUCCESS;
a16e1123
LP
1722 goto finish;
1723 }
e965d56d 1724 }
d46de8a1 1725
a16e1123 1726 for (;;) {
e96d6be7
LP
1727 r = manager_loop(m);
1728 if (r < 0) {
da927ba9 1729 log_emergency_errno(r, "Failed to run main loop: %m");
cb6531be 1730 error_message = "Failed to run main loop";
a16e1123
LP
1731 goto finish;
1732 }
11dd41ce 1733
a16e1123 1734 switch (m->exit_code) {
e965d56d 1735
a16e1123 1736 case MANAGER_RELOAD:
e015090f 1737 log_info("Reloading.");
06af2a04
TB
1738
1739 r = parse_config_file();
1740 if (r < 0)
1741 log_error("Failed to parse config file.");
1742
1743 manager_set_defaults(m);
1744
e96d6be7
LP
1745 r = manager_reload(m);
1746 if (r < 0)
da927ba9 1747 log_error_errno(r, "Failed to reload: %m");
a16e1123 1748 break;
cea8e32e 1749
a16e1123 1750 case MANAGER_REEXECUTE:
664f88a7 1751
cb6531be 1752 if (prepare_reexecute(m, &arg_serialization, &fds, false) < 0) {
6b9af963 1753 error_message = "Failed to prepare for reexecution";
a16e1123 1754 goto finish;
cb6531be 1755 }
60918275 1756
a16e1123 1757 reexecute = true;
e015090f 1758 log_notice("Reexecuting.");
a16e1123
LP
1759 goto finish;
1760
664f88a7
LP
1761 case MANAGER_SWITCH_ROOT:
1762 /* Steal the switch root parameters */
41669317 1763 switch_root_dir = m->switch_root;
664f88a7
LP
1764 switch_root_init = m->switch_root_init;
1765 m->switch_root = m->switch_root_init = NULL;
1766
1767 if (!switch_root_init)
cb6531be 1768 if (prepare_reexecute(m, &arg_serialization, &fds, true) < 0) {
6b9af963 1769 error_message = "Failed to prepare for reexecution";
664f88a7 1770 goto finish;
cb6531be 1771 }
664f88a7
LP
1772
1773 reexecute = true;
1774 log_notice("Switching root.");
1775 goto finish;
1776
287419c1 1777 case MANAGER_EXIT:
8ebfe0cb
DH
1778 if (m->running_as == MANAGER_USER) {
1779 retval = EXIT_SUCCESS;
1780 log_debug("Exit.");
1781 goto finish;
1782 }
1783
1784 /* fallthrough */
b9080b03
FF
1785 case MANAGER_REBOOT:
1786 case MANAGER_POWEROFF:
1787 case MANAGER_HALT:
1788 case MANAGER_KEXEC: {
1789 static const char * const table[_MANAGER_EXIT_CODE_MAX] = {
287419c1 1790 [MANAGER_EXIT] = "exit",
b9080b03
FF
1791 [MANAGER_REBOOT] = "reboot",
1792 [MANAGER_POWEROFF] = "poweroff",
1793 [MANAGER_HALT] = "halt",
1794 [MANAGER_KEXEC] = "kexec"
1795 };
1796
1797 assert_se(shutdown_verb = table[m->exit_code]);
e96d6be7 1798 arm_reboot_watchdog = m->exit_code == MANAGER_REBOOT;
b9080b03
FF
1799
1800 log_notice("Shutting down.");
1801 goto finish;
1802 }
1803
a16e1123
LP
1804 default:
1805 assert_not_reached("Unknown exit code.");
1806 }
1807 }
f170852a 1808
60918275 1809finish:
b87c2aa6
ZJS
1810 pager_close();
1811
287419c1 1812 if (m) {
81f5fc2d 1813 arg_shutdown_watchdog = m->shutdown_watchdog;
287419c1
AC
1814 shutdown_exit_code = m->return_value;
1815 }
06d8d842 1816 m = manager_free(m);
60918275 1817
1f6b4113 1818 for (j = 0; j < ELEMENTSOF(arg_default_rlimit); j++)
a1e58e8e 1819 arg_default_rlimit[j] = mfree(arg_default_rlimit[j]);
c93ff2e9 1820
97b11eed 1821 arg_default_unit = mfree(arg_default_unit);
d3b1c508 1822
0c85a4f3 1823 free_join_controllers();
b9cd2ec1 1824
97b11eed 1825 arg_default_environment = strv_free(arg_default_environment);
d3b1c508 1826
525d3cc7 1827 arg_syscall_archs = set_free(arg_syscall_archs);
d3b1c508 1828
cc56fafe 1829 mac_selinux_finish();
b2bb3dbe 1830
a16e1123 1831 if (reexecute) {
664f88a7 1832 const char **args;
e564a982 1833 unsigned i, args_size;
a16e1123 1834
664f88a7
LP
1835 /* Close and disarm the watchdog, so that the new
1836 * instance can reinitialize it, but doesn't get
1837 * rebooted while we do that */
1838 watchdog_close(true);
a16e1123 1839
4096d6f5
LP
1840 /* Reset the RLIMIT_NOFILE to the kernel default, so
1841 * that the new systemd can pass the kernel default to
1842 * its child processes */
1843 if (saved_rlimit_nofile.rlim_cur > 0)
1844 setrlimit(RLIMIT_NOFILE, &saved_rlimit_nofile);
1845
41669317 1846 if (switch_root_dir) {
cee530bb
LP
1847 /* Kill all remaining processes from the
1848 * initrd, but don't wait for them, so that we
1849 * can handle the SIGCHLD for them after
1850 * deserializing. */
0bee65f0 1851 broadcast_signal(SIGTERM, false, true);
bd3fa1d2 1852
5a4bf02f
HH
1853 /* And switch root with MS_MOVE, because we remove the old directory afterwards and detach it. */
1854 r = switch_root(switch_root_dir, "/mnt", true, MS_MOVE);
41669317 1855 if (r < 0)
da927ba9 1856 log_error_errno(r, "Failed to switch root, trying to continue: %m");
41669317 1857 }
a16e1123 1858
d03bc1b8 1859 args_size = MAX(6, argc+1);
e564a982 1860 args = newa(const char*, args_size);
a16e1123 1861
664f88a7 1862 if (!switch_root_init) {
5ffa8c81 1863 char sfd[DECIMAL_STR_MAX(int) + 1];
a16e1123 1864
664f88a7
LP
1865 /* First try to spawn ourselves with the right
1866 * path, and with full serialization. We do
1867 * this only if the user didn't specify an
1868 * explicit init to spawn. */
edb9aaa8 1869
d3b1c508 1870 assert(arg_serialization);
664f88a7 1871 assert(fds);
edb9aaa8 1872
5ffa8c81 1873 xsprintf(sfd, "%i", fileno(arg_serialization));
edb9aaa8 1874
664f88a7
LP
1875 i = 0;
1876 args[i++] = SYSTEMD_BINARY_PATH;
41669317 1877 if (switch_root_dir)
2660882b 1878 args[i++] = "--switched-root";
b2c23da8 1879 args[i++] = arg_running_as == MANAGER_SYSTEM ? "--system" : "--user";
664f88a7
LP
1880 args[i++] = "--deserialize";
1881 args[i++] = sfd;
1882 args[i++] = NULL;
edb9aaa8 1883
ce8aba56
KS
1884 /* do not pass along the environment we inherit from the kernel or initrd */
1885 if (switch_root_dir)
1886 clearenv();
1887
e564a982 1888 assert(i <= args_size);
664f88a7
LP
1889 execv(args[0], (char* const*) args);
1890 }
6e98720f 1891
664f88a7
LP
1892 /* Try the fallback, if there is any, without any
1893 * serialization. We pass the original argv[] and
1894 * envp[]. (Well, modulo the ordering changes due to
1895 * getopt() in argv[], and some cleanups in envp[],
1896 * but let's hope that doesn't matter.) */
a16e1123 1897
74ca738f 1898 arg_serialization = safe_fclose(arg_serialization);
a16e1123 1899
b8f83232 1900 if (fds) {
664f88a7 1901 fdset_free(fds);
b8f83232
LP
1902 fds = NULL;
1903 }
a16e1123 1904
a504223d
HH
1905 /* Reopen the console */
1906 make_console_stdio();
1907
d3b1c508 1908 for (j = 1, i = 1; j < (unsigned) argc; j++)
664f88a7 1909 args[i++] = argv[j];
a16e1123 1910 args[i++] = NULL;
e564a982 1911 assert(i <= args_size);
b8f83232 1912
1b6d7fa7 1913 /* Reenable any blocked signals, especially important
5a85ca1c 1914 * if we switch from initial ramdisk to init=... */
ce30c8dc
LP
1915 (void) reset_all_signal_handlers();
1916 (void) reset_signal_mask();
5a85ca1c 1917
b8f83232
LP
1918 if (switch_root_init) {
1919 args[0] = switch_root_init;
1920 execv(args[0], (char* const*) args);
56f64d95 1921 log_warning_errno(errno, "Failed to execute configured init, trying fallback: %m");
b8f83232
LP
1922 }
1923
1924 args[0] = "/sbin/init";
a16e1123
LP
1925 execv(args[0], (char* const*) args);
1926
745e2fb7
KS
1927 if (errno == ENOENT) {
1928 log_warning("No /sbin/init, trying fallback");
b8f83232 1929
745e2fb7
KS
1930 args[0] = "/bin/sh";
1931 args[1] = NULL;
1932 execv(args[0], (char* const*) args);
56f64d95 1933 log_error_errno(errno, "Failed to execute /bin/sh, giving up: %m");
745e2fb7 1934 } else
56f64d95 1935 log_warning_errno(errno, "Failed to execute /sbin/init, giving up: %m");
a16e1123
LP
1936 }
1937
74ca738f 1938 arg_serialization = safe_fclose(arg_serialization);
a16e1123 1939
d3b1c508 1940 if (fds) {
a16e1123 1941 fdset_free(fds);
d3b1c508
LP
1942 fds = NULL;
1943 }
a16e1123 1944
54b434b1
LP
1945#ifdef HAVE_VALGRIND_VALGRIND_H
1946 /* If we are PID 1 and running under valgrind, then let's exit
1947 * here explicitly. valgrind will only generate nice output on
1948 * exit(), not on exec(), hence let's do the former not the
1949 * latter here. */
1950 if (getpid() == 1 && RUNNING_ON_VALGRIND)
1951 return 0;
1952#endif
1953
b9080b03 1954 if (shutdown_verb) {
b1e90ec5 1955 char log_level[DECIMAL_STR_MAX(int) + 1];
287419c1
AC
1956 char exit_code[DECIMAL_STR_MAX(uint8_t) + 1];
1957 const char* command_line[11] = {
b9080b03
FF
1958 SYSTEMD_SHUTDOWN_BINARY_PATH,
1959 shutdown_verb,
b1e90ec5
ZJS
1960 "--log-level", log_level,
1961 "--log-target",
b9080b03 1962 };
b1e90ec5 1963 unsigned pos = 5;
e3e45d4f 1964 _cleanup_strv_free_ char **env_block = NULL;
15bd5aee
LP
1965
1966 assert(command_line[pos] == NULL);
e3e45d4f 1967 env_block = strv_copy(environ);
b9080b03 1968
5ffa8c81 1969 xsprintf(log_level, "%d", log_get_max_level());
b1e90ec5
ZJS
1970
1971 switch (log_get_target()) {
1972 case LOG_TARGET_KMSG:
1973 case LOG_TARGET_JOURNAL_OR_KMSG:
1974 case LOG_TARGET_SYSLOG_OR_KMSG:
1975 command_line[pos++] = "kmsg";
1976 break;
1977
10f00ff1
ILG
1978 case LOG_TARGET_NULL:
1979 command_line[pos++] = "null";
1980 break;
1981
b1e90ec5
ZJS
1982 case LOG_TARGET_CONSOLE:
1983 default:
1984 command_line[pos++] = "console";
1985 break;
1986 };
1987
1988 if (log_get_show_color())
1989 command_line[pos++] = "--log-color";
1990
1991 if (log_get_show_location())
1992 command_line[pos++] = "--log-location";
1993
287419c1
AC
1994 if (streq(shutdown_verb, "exit")) {
1995 command_line[pos++] = "--exit-code";
1996 command_line[pos++] = exit_code;
1997 xsprintf(exit_code, "%d", shutdown_exit_code);
1998 }
1999
26abdc73 2000 assert(pos < ELEMENTSOF(command_line));
b1e90ec5 2001
e96d6be7 2002 if (arm_reboot_watchdog && arg_shutdown_watchdog > 0) {
e3e45d4f 2003 char *e;
d18f337c 2004
e96d6be7
LP
2005 /* If we reboot let's set the shutdown
2006 * watchdog and tell the shutdown binary to
2007 * repeatedly ping it */
c2cc6b9a
LP
2008 r = watchdog_set_timeout(&arg_shutdown_watchdog);
2009 watchdog_close(r < 0);
e96d6be7 2010
e3e45d4f
SP
2011 /* Tell the binary how often to ping, ignore failure */
2012 if (asprintf(&e, "WATCHDOG_USEC="USEC_FMT, arg_shutdown_watchdog) > 0)
2013 strv_push(&env_block, e);
2014 } else
e96d6be7
LP
2015 watchdog_close(true);
2016
66713f77
LP
2017 /* Avoid the creation of new processes forked by the
2018 * kernel; at this point, we will not listen to the
2019 * signals anyway */
75f86906 2020 if (detect_container() <= 0)
e155a0aa 2021 (void) cg_uninstall_release_agent(SYSTEMD_CGROUP_CONTROLLER);
ad929bcc 2022
d18f337c 2023 execve(SYSTEMD_SHUTDOWN_BINARY_PATH, (char **) command_line, env_block);
56f64d95 2024 log_error_errno(errno, "Failed to execute shutdown binary, %s: %m",
b1e90ec5 2025 getpid() == 1 ? "freezing" : "quitting");
b9080b03
FF
2026 }
2027
cb6531be
ZJS
2028 if (getpid() == 1) {
2029 if (error_message)
2030 manager_status_printf(NULL, STATUS_TYPE_EMERGENCY,
1fc464f6 2031 ANSI_HIGHLIGHT_RED "!!!!!!" ANSI_NORMAL,
cb6531be 2032 "%s, freezing.", error_message);
c3b3c274 2033 freeze();
cb6531be 2034 }
c3b3c274 2035
60918275
LP
2036 return retval;
2037}