]> git.ipfire.org Git - thirdparty/systemd.git/blame - src/core/manager.c
man: add an additional note about journalctl -u
[thirdparty/systemd.git] / src / core / manager.c
CommitLineData
53e1b683 1/* SPDX-License-Identifier: LGPL-2.1+ */
a7334b09
LP
2/***
3 This file is part of systemd.
4
5 Copyright 2010 Lennart Poettering
6
7 systemd is free software; you can redistribute it and/or modify it
5430f7f2
LP
8 under the terms of the GNU Lesser General Public License as published by
9 the Free Software Foundation; either version 2.1 of the License, or
a7334b09
LP
10 (at your option) any later version.
11
12 systemd is distributed in the hope that it will be useful, but
13 WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
5430f7f2 15 Lesser General Public License for more details.
a7334b09 16
5430f7f2 17 You should have received a copy of the GNU Lesser General Public License
a7334b09
LP
18 along with systemd; If not, see <http://www.gnu.org/licenses/>.
19***/
20
60918275 21#include <errno.h>
400f1a33
LP
22#include <fcntl.h>
23#include <linux/kd.h>
9152c765 24#include <signal.h>
713f6f90 25#include <stdio_ext.h>
400f1a33 26#include <string.h>
e46b13c8 27#include <sys/epoll.h>
400f1a33 28#include <sys/inotify.h>
e1414003 29#include <sys/ioctl.h>
400f1a33 30#include <sys/reboot.h>
8742514c 31#include <sys/timerfd.h>
400f1a33
LP
32#include <sys/wait.h>
33#include <unistd.h>
830f6caa 34
349cc4a5 35#if HAVE_AUDIT
4927fcae 36#include <libaudit.h>
830f6caa 37#endif
60918275 38
718db961 39#include "sd-daemon.h"
718db961 40#include "sd-messages.h"
3536f49e 41#include "sd-path.h"
81527be1 42
b5efdb8a 43#include "alloc-util.h"
400f1a33
LP
44#include "audit-fd.h"
45#include "boot-timestamps.h"
46#include "bus-common-errors.h"
47#include "bus-error.h"
48#include "bus-kernel.h"
49#include "bus-util.h"
00d9ef85 50#include "clean-ipc.h"
af6b0ecc 51#include "clock-util.h"
400f1a33
LP
52#include "dbus-job.h"
53#include "dbus-manager.h"
54#include "dbus-unit.h"
55#include "dbus.h"
d063a527 56#include "dirent-util.h"
400f1a33 57#include "env-util.h"
4f5dd394 58#include "escape.h"
89711996 59#include "exec-util.h"
d3070fbd 60#include "execute.h"
400f1a33 61#include "exit-status.h"
3ffd4af2 62#include "fd-util.h"
0d39fa9c 63#include "fileio.h"
f4f15635 64#include "fs-util.h"
60918275 65#include "hashmap.h"
c004493c 66#include "io-util.h"
d3070fbd 67#include "label.h"
400f1a33 68#include "locale-setup.h"
16354eff 69#include "log.h"
400f1a33 70#include "macro.h"
3ffd4af2 71#include "manager.h"
400f1a33 72#include "missing.h"
49e942b2 73#include "mkdir.h"
6bedfcbb 74#include "parse-util.h"
400f1a33
LP
75#include "path-lookup.h"
76#include "path-util.h"
77#include "process-util.h"
ea430986 78#include "ratelimit.h"
c6878637 79#include "rm-rf.h"
400f1a33 80#include "signal-util.h"
514f4ef5 81#include "special.h"
8fcde012 82#include "stat-util.h"
8b43440b 83#include "string-table.h"
07630cea 84#include "string-util.h"
400f1a33 85#include "strv.h"
dd1db3c2 86#include "strxcpyx.h"
400f1a33
LP
87#include "terminal-util.h"
88#include "time-util.h"
89#include "transaction.h"
affb60b1 90#include "umask-util.h"
400f1a33 91#include "unit-name.h"
00d9ef85 92#include "user-util.h"
400f1a33 93#include "util.h"
5dc4c17f 94#include "virt.h"
e96d6be7 95#include "watchdog.h"
60918275 96
a47806fa 97#define NOTIFY_RCVBUF_SIZE (8*1024*1024)
d8fdc620 98#define CGROUPS_AGENT_RCVBUF_SIZE (8*1024*1024)
a47806fa 99
03b717a3 100/* Initial delay and the interval for printing status messages about running jobs */
fd08a840
ZJS
101#define JOBS_IN_PROGRESS_WAIT_USEC (5*USEC_PER_SEC)
102#define JOBS_IN_PROGRESS_PERIOD_USEC (USEC_PER_SEC / 3)
03b717a3
MS
103#define JOBS_IN_PROGRESS_PERIOD_DIVISOR 3
104
e0a08581
LP
105/* If there are more than 1K bus messages queue across our API and direct busses, then let's not add more on top until
106 * the queue gets more empty. */
107#define MANAGER_BUS_BUSY_THRESHOLD 1024LU
108
109/* How many units and jobs to process of the bus queue before returning to the event loop. */
110#define MANAGER_BUS_MESSAGE_BUDGET 100U
111
718db961 112static int manager_dispatch_notify_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata);
d8fdc620 113static int manager_dispatch_cgroups_agent_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata);
718db961
LP
114static int manager_dispatch_signal_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata);
115static int manager_dispatch_time_change_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata);
116static int manager_dispatch_idle_pipe_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata);
00d9ef85 117static int manager_dispatch_user_lookup_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata);
718db961 118static int manager_dispatch_jobs_in_progress(sd_event_source *source, usec_t usec, void *userdata);
752b5905 119static int manager_dispatch_run_queue(sd_event_source *source, void *userdata);
575b300b 120static int manager_dispatch_sigchld(sd_event_source *source, void *userdata);
64691d20 121static int manager_run_environment_generators(Manager *m);
e801700e 122static int manager_run_generators(Manager *m);
718db961 123
2ae56591 124static void manager_watch_jobs_in_progress(Manager *m) {
e5723c89 125 usec_t next;
cfa9677b 126 int r;
e5723c89 127
718db961 128 assert(m);
03b717a3 129
42bf1ae1
FB
130 /* We do not want to show the cylon animation if the user
131 * needs to confirm service executions otherwise confirmation
132 * messages will be screwed by the cylon animation. */
b0eb2944 133 if (!manager_is_confirm_spawn_disabled(m))
42bf1ae1
FB
134 return;
135
718db961 136 if (m->jobs_in_progress_event_source)
2ae56591 137 return;
03b717a3 138
e5723c89 139 next = now(CLOCK_MONOTONIC) + JOBS_IN_PROGRESS_WAIT_USEC;
cfa9677b 140 r = sd_event_add_time(
6a0f1f6d
LP
141 m->event,
142 &m->jobs_in_progress_event_source,
143 CLOCK_MONOTONIC,
144 next, 0,
145 manager_dispatch_jobs_in_progress, m);
cfa9677b
MM
146 if (r < 0)
147 return;
7dfbe2e3
TG
148
149 (void) sd_event_source_set_description(m->jobs_in_progress_event_source, "manager-jobs-in-progress");
03b717a3
MS
150}
151
fbd0b64f 152#define CYLON_BUFFER_EXTRA (2*STRLEN(ANSI_RED) + STRLEN(ANSI_HIGHLIGHT_RED) + 2*STRLEN(ANSI_NORMAL))
03b717a3 153
03b717a3
MS
154static void draw_cylon(char buffer[], size_t buflen, unsigned width, unsigned pos) {
155 char *p = buffer;
156
157 assert(buflen >= CYLON_BUFFER_EXTRA + width + 1);
158 assert(pos <= width+1); /* 0 or width+1 mean that the center light is behind the corner */
159
160 if (pos > 1) {
6282c859
MS
161 if (pos > 2)
162 p = mempset(p, ' ', pos-2);
64c3610b
FB
163 if (log_get_show_color())
164 p = stpcpy(p, ANSI_RED);
03b717a3
MS
165 *p++ = '*';
166 }
167
168 if (pos > 0 && pos <= width) {
64c3610b
FB
169 if (log_get_show_color())
170 p = stpcpy(p, ANSI_HIGHLIGHT_RED);
03b717a3
MS
171 *p++ = '*';
172 }
173
64c3610b
FB
174 if (log_get_show_color())
175 p = stpcpy(p, ANSI_NORMAL);
03b717a3
MS
176
177 if (pos < width) {
64c3610b
FB
178 if (log_get_show_color())
179 p = stpcpy(p, ANSI_RED);
03b717a3 180 *p++ = '*';
6282c859
MS
181 if (pos < width-1)
182 p = mempset(p, ' ', width-1-pos);
64c3610b
FB
183 if (log_get_show_color())
184 strcpy(p, ANSI_NORMAL);
03b717a3 185 }
03b717a3
MS
186}
187
cb8ccb22 188void manager_flip_auto_status(Manager *m, bool enable) {
f755e3b7
LP
189 assert(m);
190
cb8ccb22
ZJS
191 if (enable) {
192 if (m->show_status == SHOW_STATUS_AUTO)
193 manager_set_show_status(m, SHOW_STATUS_TEMPORARY);
194 } else {
195 if (m->show_status == SHOW_STATUS_TEMPORARY)
196 manager_set_show_status(m, SHOW_STATUS_AUTO);
197 }
198}
199
03b717a3 200static void manager_print_jobs_in_progress(Manager *m) {
718db961 201 _cleanup_free_ char *job_of_n = NULL;
03b717a3
MS
202 Iterator i;
203 Job *j;
03b717a3
MS
204 unsigned counter = 0, print_nr;
205 char cylon[6 + CYLON_BUFFER_EXTRA + 1];
206 unsigned cylon_pos;
8bb310c3
ZJS
207 char time[FORMAT_TIMESPAN_MAX], limit[FORMAT_TIMESPAN_MAX] = "no limit";
208 uint64_t x;
03b717a3 209
718db961 210 assert(m);
9c3349e2 211 assert(m->n_running_jobs > 0);
718db961 212
cb8ccb22 213 manager_flip_auto_status(m, true);
d450b6f2 214
03b717a3
MS
215 print_nr = (m->jobs_in_progress_iteration / JOBS_IN_PROGRESS_PERIOD_DIVISOR) % m->n_running_jobs;
216
217 HASHMAP_FOREACH(j, m->jobs, i)
218 if (j->state == JOB_RUNNING && counter++ == print_nr)
219 break;
220
e970a72e
MS
221 /* m->n_running_jobs must be consistent with the contents of m->jobs,
222 * so the above loop must have succeeded in finding j. */
223 assert(counter == print_nr + 1);
51d122af 224 assert(j);
5a82a91a 225
03b717a3
MS
226 cylon_pos = m->jobs_in_progress_iteration % 14;
227 if (cylon_pos >= 8)
228 cylon_pos = 14 - cylon_pos;
229 draw_cylon(cylon, sizeof(cylon), 6, cylon_pos);
230
8bb310c3
ZJS
231 m->jobs_in_progress_iteration++;
232
d6483ba7
ZJS
233 if (m->n_running_jobs > 1) {
234 if (asprintf(&job_of_n, "(%u of %u) ", counter, m->n_running_jobs) < 0)
235 job_of_n = NULL;
236 }
03b717a3 237
8bb310c3
ZJS
238 format_timespan(time, sizeof(time), now(CLOCK_MONOTONIC) - j->begin_usec, 1*USEC_PER_SEC);
239 if (job_get_timeout(j, &x) > 0)
240 format_timespan(limit, sizeof(limit), x - j->begin_usec, 1*USEC_PER_SEC);
241
127d5fd1 242 manager_status_printf(m, STATUS_TYPE_EPHEMERAL, cylon,
8bb310c3
ZJS
243 "%sA %s job is running for %s (%s / %s)",
244 strempty(job_of_n),
245 job_type_to_string(j->type),
246 unit_description(j->unit),
247 time, limit);
03b717a3
MS
248}
249
e46b13c8
ZJS
250static int have_ask_password(void) {
251 _cleanup_closedir_ DIR *dir;
8fb3f009 252 struct dirent *de;
e46b13c8
ZJS
253
254 dir = opendir("/run/systemd/ask-password");
255 if (!dir) {
256 if (errno == ENOENT)
257 return false;
258 else
259 return -errno;
260 }
261
8fb3f009 262 FOREACH_DIRENT_ALL(de, dir, return -errno) {
e46b13c8
ZJS
263 if (startswith(de->d_name, "ask."))
264 return true;
265 }
8fb3f009 266 return false;
e46b13c8
ZJS
267}
268
269static int manager_dispatch_ask_password_fd(sd_event_source *source,
270 int fd, uint32_t revents, void *userdata) {
271 Manager *m = userdata;
272
273 assert(m);
274
665dfe93 275 (void) flush_fd(fd);
e46b13c8
ZJS
276
277 m->have_ask_password = have_ask_password();
278 if (m->have_ask_password < 0)
279 /* Log error but continue. Negative have_ask_password
280 * is treated as unknown status. */
c33b3297 281 log_error_errno(m->have_ask_password, "Failed to list /run/systemd/ask-password: %m");
e46b13c8
ZJS
282
283 return 0;
284}
285
286static void manager_close_ask_password(Manager *m) {
287 assert(m);
288
e46b13c8 289 m->ask_password_event_source = sd_event_source_unref(m->ask_password_event_source);
90990e28 290 m->ask_password_inotify_fd = safe_close(m->ask_password_inotify_fd);
e46b13c8
ZJS
291 m->have_ask_password = -EINVAL;
292}
293
294static int manager_check_ask_password(Manager *m) {
295 int r;
296
297 assert(m);
298
299 if (!m->ask_password_event_source) {
300 assert(m->ask_password_inotify_fd < 0);
301
302 mkdir_p_label("/run/systemd/ask-password", 0755);
303
304 m->ask_password_inotify_fd = inotify_init1(IN_NONBLOCK|IN_CLOEXEC);
4a62c710
MS
305 if (m->ask_password_inotify_fd < 0)
306 return log_error_errno(errno, "inotify_init1() failed: %m");
e46b13c8
ZJS
307
308 if (inotify_add_watch(m->ask_password_inotify_fd, "/run/systemd/ask-password", IN_CREATE|IN_DELETE|IN_MOVE) < 0) {
56f64d95 309 log_error_errno(errno, "Failed to add watch on /run/systemd/ask-password: %m");
e46b13c8
ZJS
310 manager_close_ask_password(m);
311 return -errno;
312 }
313
314 r = sd_event_add_io(m->event, &m->ask_password_event_source,
315 m->ask_password_inotify_fd, EPOLLIN,
316 manager_dispatch_ask_password_fd, m);
317 if (r < 0) {
56f64d95 318 log_error_errno(errno, "Failed to add event source for /run/systemd/ask-password: %m");
e46b13c8
ZJS
319 manager_close_ask_password(m);
320 return -errno;
321 }
322
7dfbe2e3
TG
323 (void) sd_event_source_set_description(m->ask_password_event_source, "manager-ask-password");
324
e46b13c8
ZJS
325 /* Queries might have been added meanwhile... */
326 manager_dispatch_ask_password_fd(m->ask_password_event_source,
327 m->ask_password_inotify_fd, EPOLLIN, m);
328 }
329
330 return m->have_ask_password;
331}
332
31a7eb86 333static int manager_watch_idle_pipe(Manager *m) {
31a7eb86
ZJS
334 int r;
335
718db961
LP
336 assert(m);
337
338 if (m->idle_pipe_event_source)
31a7eb86
ZJS
339 return 0;
340
341 if (m->idle_pipe[2] < 0)
342 return 0;
343
151b9b96 344 r = sd_event_add_io(m->event, &m->idle_pipe_event_source, m->idle_pipe[2], EPOLLIN, manager_dispatch_idle_pipe_fd, m);
23bbb0de
MS
345 if (r < 0)
346 return log_error_errno(r, "Failed to watch idle pipe: %m");
31a7eb86 347
7dfbe2e3
TG
348 (void) sd_event_source_set_description(m->idle_pipe_event_source, "manager-idle-pipe");
349
31a7eb86 350 return 0;
31a7eb86
ZJS
351}
352
718db961
LP
353static void manager_close_idle_pipe(Manager *m) {
354 assert(m);
31a7eb86 355
cd72bd8a
LP
356 m->idle_pipe_event_source = sd_event_source_unref(m->idle_pipe_event_source);
357
3d94f76c
LP
358 safe_close_pair(m->idle_pipe);
359 safe_close_pair(m->idle_pipe + 2);
31a7eb86
ZJS
360}
361
8742514c 362static int manager_setup_time_change(Manager *m) {
718db961 363 int r;
b92bea5d
ZJS
364
365 /* We only care for the cancellation event, hence we set the
366 * timeout to the latest possible value. */
367 struct itimerspec its = {
368 .it_value.tv_sec = TIME_T_MAX,
369 };
8742514c 370
718db961
LP
371 assert(m);
372 assert_cc(sizeof(time_t) == sizeof(TIME_T_MAX));
8742514c 373
e0a3da1f 374 if (m->test_run_flags)
0d8c31ff
ZJS
375 return 0;
376
8742514c
LP
377 /* Uses TFD_TIMER_CANCEL_ON_SET to get notifications whenever
378 * CLOCK_REALTIME makes a jump relative to CLOCK_MONOTONIC */
379
718db961 380 m->time_change_fd = timerfd_create(CLOCK_REALTIME, TFD_NONBLOCK|TFD_CLOEXEC);
4a62c710
MS
381 if (m->time_change_fd < 0)
382 return log_error_errno(errno, "Failed to create timerfd: %m");
8742514c 383
718db961 384 if (timerfd_settime(m->time_change_fd, TFD_TIMER_ABSTIME|TFD_TIMER_CANCEL_ON_SET, &its, NULL) < 0) {
56f64d95 385 log_debug_errno(errno, "Failed to set up TFD_TIMER_CANCEL_ON_SET, ignoring: %m");
03e334a1 386 m->time_change_fd = safe_close(m->time_change_fd);
8742514c
LP
387 return 0;
388 }
389
151b9b96 390 r = sd_event_add_io(m->event, &m->time_change_event_source, m->time_change_fd, EPOLLIN, manager_dispatch_time_change_fd, m);
23bbb0de
MS
391 if (r < 0)
392 return log_error_errno(r, "Failed to create time change event source: %m");
8742514c 393
7dfbe2e3
TG
394 (void) sd_event_source_set_description(m->time_change_event_source, "manager-time-change");
395
8742514c
LP
396 log_debug("Set up TFD_TIMER_CANCEL_ON_SET timerfd.");
397
398 return 0;
399}
400
80876c20 401static int enable_special_signals(Manager *m) {
718db961 402 _cleanup_close_ int fd = -1;
80876c20
LP
403
404 assert(m);
405
e0a3da1f 406 if (m->test_run_flags)
37453b3a
EV
407 return 0;
408
a41b539e 409 /* Enable that we get SIGINT on control-alt-del. In containers
c9999773
LP
410 * this will fail with EPERM (older) or EINVAL (newer), so
411 * ignore that. */
4c701096 412 if (reboot(RB_DISABLE_CAD) < 0 && !IN_SET(errno, EPERM, EINVAL))
56f64d95 413 log_warning_errno(errno, "Failed to enable ctrl-alt-del handling: %m");
80876c20 414
a41b539e
LP
415 fd = open_terminal("/dev/tty0", O_RDWR|O_NOCTTY|O_CLOEXEC);
416 if (fd < 0) {
417 /* Support systems without virtual console */
418 if (fd != -ENOENT)
56f64d95 419 log_warning_errno(errno, "Failed to open /dev/tty0: %m");
a41b539e 420 } else {
80876c20
LP
421 /* Enable that we get SIGWINCH on kbrequest */
422 if (ioctl(fd, KDSIGACCEPT, SIGWINCH) < 0)
56f64d95 423 log_warning_errno(errno, "Failed to enable kbrequest handling: %m");
80876c20
LP
424 }
425
426 return 0;
427}
428
8750ac02
ZJS
429#define RTSIG_IF_AVAILABLE(signum) (signum <= SIGRTMAX ? signum : -1)
430
ce578209 431static int manager_setup_signals(Manager *m) {
b92bea5d
ZJS
432 struct sigaction sa = {
433 .sa_handler = SIG_DFL,
434 .sa_flags = SA_NOCLDSTOP|SA_RESTART,
435 };
718db961
LP
436 sigset_t mask;
437 int r;
60918275 438
ce578209
LP
439 assert(m);
440
57c0c30e
LP
441 assert_se(sigaction(SIGCHLD, &sa, NULL) == 0);
442
4dffec14
LP
443 /* We make liberal use of realtime signals here. On
444 * Linux/glibc we have 30 of them (with the exception of Linux
445 * on hppa, see below), between SIGRTMIN+0 ... SIGRTMIN+30
446 * (aka SIGRTMAX). */
7d793605 447
4dffec14 448 assert_se(sigemptyset(&mask) == 0);
7d793605
LP
449 sigset_add_many(&mask,
450 SIGCHLD, /* Child died */
451 SIGTERM, /* Reexecute daemon */
452 SIGHUP, /* Reload configuration */
453 SIGUSR1, /* systemd/upstart: reconnect to D-Bus */
454 SIGUSR2, /* systemd: dump status */
455 SIGINT, /* Kernel sends us this on control-alt-del */
456 SIGWINCH, /* Kernel sends us this on kbrequest (alt-arrowup) */
457 SIGPWR, /* Some kernel drivers and upsd send us this on power failure */
4dffec14 458
7d793605 459 SIGRTMIN+0, /* systemd: start default.target */
0003d1ab 460 SIGRTMIN+1, /* systemd: isolate rescue.target */
7d793605
LP
461 SIGRTMIN+2, /* systemd: isolate emergency.target */
462 SIGRTMIN+3, /* systemd: start halt.target */
463 SIGRTMIN+4, /* systemd: start poweroff.target */
464 SIGRTMIN+5, /* systemd: start reboot.target */
0003d1ab 465 SIGRTMIN+6, /* systemd: start kexec.target */
4dffec14
LP
466
467 /* ... space for more special targets ... */
468
0003d1ab
LP
469 SIGRTMIN+13, /* systemd: Immediate halt */
470 SIGRTMIN+14, /* systemd: Immediate poweroff */
471 SIGRTMIN+15, /* systemd: Immediate reboot */
472 SIGRTMIN+16, /* systemd: Immediate kexec */
4dffec14
LP
473
474 /* ... space for more immediate system state changes ... */
475
0658666b
LP
476 SIGRTMIN+20, /* systemd: enable status messages */
477 SIGRTMIN+21, /* systemd: disable status messages */
253ee27a
LP
478 SIGRTMIN+22, /* systemd: set log level to LOG_DEBUG */
479 SIGRTMIN+23, /* systemd: set log level to LOG_INFO */
600b704e 480 SIGRTMIN+24, /* systemd: Immediate exit (--user only) */
4dffec14
LP
481
482 /* .. one free signal here ... */
483
8750ac02
ZJS
484 /* Apparently Linux on hppa had fewer RT signals until v3.18,
485 * SIGRTMAX was SIGRTMIN+25, and then SIGRTMIN was lowered,
486 * see commit v3.17-7614-g1f25df2eff.
487 *
488 * We cannot unconditionally make use of those signals here,
489 * so let's use a runtime check. Since these commands are
490 * accessible by different means and only really a safety
491 * net, the missing functionality on hppa shouldn't matter.
492 */
493
494 RTSIG_IF_AVAILABLE(SIGRTMIN+26), /* systemd: set log target to journal-or-kmsg */
495 RTSIG_IF_AVAILABLE(SIGRTMIN+27), /* systemd: set log target to console */
496 RTSIG_IF_AVAILABLE(SIGRTMIN+28), /* systemd: set log target to kmsg */
497 RTSIG_IF_AVAILABLE(SIGRTMIN+29), /* systemd: set log target to syslog-or-kmsg (obsolete) */
4dffec14
LP
498
499 /* ... one free signal here SIGRTMIN+30 ... */
7d793605 500 -1);
ce578209
LP
501 assert_se(sigprocmask(SIG_SETMASK, &mask, NULL) == 0);
502
718db961
LP
503 m->signal_fd = signalfd(-1, &mask, SFD_NONBLOCK|SFD_CLOEXEC);
504 if (m->signal_fd < 0)
ce578209
LP
505 return -errno;
506
151b9b96 507 r = sd_event_add_io(m->event, &m->signal_event_source, m->signal_fd, EPOLLIN, manager_dispatch_signal_fd, m);
718db961
LP
508 if (r < 0)
509 return r;
ce578209 510
7dfbe2e3
TG
511 (void) sd_event_source_set_description(m->signal_event_source, "manager-signal");
512
d8fdc620
LP
513 /* Process signals a bit earlier than the rest of things, but later than notify_fd processing, so that the
514 * notify processing can still figure out to which process/service a message belongs, before we reap the
515 * process. Also, process this before handling cgroup notifications, so that we always collect child exit
516 * status information before detecting that there's no process in a cgroup. */
517 r = sd_event_source_set_priority(m->signal_event_source, SD_EVENT_PRIORITY_NORMAL-6);
29083707
LP
518 if (r < 0)
519 return r;
520
463d0d15 521 if (MANAGER_IS_SYSTEM(m))
80876c20 522 return enable_special_signals(m);
e1414003 523
ce578209
LP
524 return 0;
525}
526
47cf8ff2 527static void manager_sanitize_environment(Manager *m) {
f069efb4
LP
528 assert(m);
529
47cf8ff2 530 /* Let's remove some environment variables that we need ourselves to communicate with our clients */
f069efb4
LP
531 strv_env_unset_many(
532 m->environment,
47cf8ff2
LP
533 "EXIT_CODE",
534 "EXIT_STATUS",
535 "INVOCATION_ID",
536 "JOURNAL_STREAM",
537 "LISTEN_FDNAMES",
538 "LISTEN_FDS",
539 "LISTEN_PID",
f069efb4
LP
540 "MAINPID",
541 "MANAGERPID",
47cf8ff2
LP
542 "NOTIFY_SOCKET",
543 "REMOTE_ADDR",
544 "REMOTE_PORT",
545 "SERVICE_RESULT",
f069efb4
LP
546 "WATCHDOG_PID",
547 "WATCHDOG_USEC",
548 NULL);
47cf8ff2
LP
549
550 /* Let's order the environment alphabetically, just to make it pretty */
551 strv_sort(m->environment);
f069efb4
LP
552}
553
e21fea24 554static int manager_default_environment(Manager *m) {
71ecc858
LP
555 assert(m);
556
463d0d15 557 if (MANAGER_IS_SYSTEM(m)) {
e21fea24
KS
558 /* The system manager always starts with a clean
559 * environment for its children. It does not import
71cb7d30 560 * the kernel's or the parents' exported variables.
e21fea24 561 *
71cb7d30 562 * The initial passed environment is untouched to keep
e21fea24
KS
563 * /proc/self/environ valid; it is used for tagging
564 * the init process inside containers. */
43638332
ZJS
565 m->environment = strv_new("PATH=" DEFAULT_PATH,
566 NULL);
e21fea24
KS
567
568 /* Import locale variables LC_*= from configuration */
569 locale_setup(&m->environment);
71cb7d30 570 } else
e21fea24
KS
571 /* The user manager passes its own environment
572 * along to its children. */
573 m->environment = strv_copy(environ);
43d03a83 574
e21fea24
KS
575 if (!m->environment)
576 return -ENOMEM;
8b55b8c4 577
47cf8ff2 578 manager_sanitize_environment(m);
9d5a3757 579
e21fea24 580 return 0;
71ecc858
LP
581}
582
3536f49e
YW
583static int manager_setup_prefix(Manager *m) {
584 struct table_entry {
585 uint64_t type;
586 const char *suffix;
587 };
588
72fd1768 589 static const struct table_entry paths_system[_EXEC_DIRECTORY_TYPE_MAX] = {
3536f49e
YW
590 [EXEC_DIRECTORY_RUNTIME] = { SD_PATH_SYSTEM_RUNTIME, NULL },
591 [EXEC_DIRECTORY_STATE] = { SD_PATH_SYSTEM_STATE_PRIVATE, NULL },
592 [EXEC_DIRECTORY_CACHE] = { SD_PATH_SYSTEM_STATE_CACHE, NULL },
593 [EXEC_DIRECTORY_LOGS] = { SD_PATH_SYSTEM_STATE_LOGS, NULL },
594 [EXEC_DIRECTORY_CONFIGURATION] = { SD_PATH_SYSTEM_CONFIGURATION, NULL },
595 };
596
72fd1768 597 static const struct table_entry paths_user[_EXEC_DIRECTORY_TYPE_MAX] = {
3536f49e
YW
598 [EXEC_DIRECTORY_RUNTIME] = { SD_PATH_USER_RUNTIME, NULL },
599 [EXEC_DIRECTORY_STATE] = { SD_PATH_USER_CONFIGURATION, NULL },
c6218495
LP
600 [EXEC_DIRECTORY_CACHE] = { SD_PATH_USER_STATE_CACHE, NULL },
601 [EXEC_DIRECTORY_LOGS] = { SD_PATH_USER_CONFIGURATION, "log" },
602 [EXEC_DIRECTORY_CONFIGURATION] = { SD_PATH_USER_CONFIGURATION, NULL },
3536f49e
YW
603 };
604
605 const struct table_entry *p;
606 ExecDirectoryType i;
607 int r;
608
609 assert(m);
610
611 if (MANAGER_IS_SYSTEM(m))
612 p = paths_system;
613 else
614 p = paths_user;
615
72fd1768 616 for (i = 0; i < _EXEC_DIRECTORY_TYPE_MAX; i++) {
3536f49e
YW
617 r = sd_path_home(p[i].type, p[i].suffix, &m->prefix[i]);
618 if (r < 0)
619 return r;
620 }
621
622 return 0;
623}
624
279d81dd
LP
625static int manager_setup_run_queue(Manager *m) {
626 int r;
627
628 assert(m);
629 assert(!m->run_queue_event_source);
630
631 r = sd_event_add_defer(m->event, &m->run_queue_event_source, manager_dispatch_run_queue, m);
632 if (r < 0)
633 return r;
634
635 r = sd_event_source_set_priority(m->run_queue_event_source, SD_EVENT_PRIORITY_IDLE);
636 if (r < 0)
637 return r;
638
639 r = sd_event_source_set_enabled(m->run_queue_event_source, SD_EVENT_OFF);
640 if (r < 0)
641 return r;
642
643 (void) sd_event_source_set_description(m->run_queue_event_source, "manager-run-queue");
644
645 return 0;
646}
647
575b300b
LP
648static int manager_setup_sigchld_event_source(Manager *m) {
649 int r;
650
651 assert(m);
652 assert(!m->sigchld_event_source);
653
654 r = sd_event_add_defer(m->event, &m->sigchld_event_source, manager_dispatch_sigchld, m);
655 if (r < 0)
656 return r;
657
658 r = sd_event_source_set_priority(m->sigchld_event_source, SD_EVENT_PRIORITY_NORMAL-7);
659 if (r < 0)
660 return r;
661
662 r = sd_event_source_set_enabled(m->sigchld_event_source, SD_EVENT_OFF);
663 if (r < 0)
664 return r;
665
666 (void) sd_event_source_set_description(m->sigchld_event_source, "manager-sigchld");
667
668 return 0;
669}
670
e0a3da1f 671int manager_new(UnitFileScope scope, unsigned test_run_flags, Manager **_m) {
c70cac54 672 _cleanup_(manager_freep) Manager *m = NULL;
e3dd987c 673 int r;
8e274523
LP
674
675 assert(_m);
463d0d15 676 assert(IN_SET(scope, UNIT_FILE_SYSTEM, UNIT_FILE_USER));
ce578209 677
915b3753
LP
678 m = new0(Manager, 1);
679 if (!m)
8e274523 680 return -ENOMEM;
60918275 681
463d0d15 682 m->unit_file_scope = scope;
a16e1123 683 m->exit_code = _MANAGER_EXIT_CODE_INVALID;
bd8f585b 684 m->default_timer_accuracy_usec = USEC_PER_MINUTE;
444d5863 685 m->default_memory_accounting = MEMORY_ACCOUNTING_DEFAULT;
9ded9cd1 686 m->default_tasks_accounting = true;
79baeeb9 687 m->default_tasks_max = UINT64_MAX;
bd389aa7
LP
688 m->default_timeout_start_usec = DEFAULT_TIMEOUT_USEC;
689 m->default_timeout_stop_usec = DEFAULT_TIMEOUT_USEC;
690 m->default_restart_usec = DEFAULT_RESTART_USEC;
80876c20 691
349cc4a5 692#if ENABLE_EFI
463d0d15 693 if (MANAGER_IS_SYSTEM(m) && detect_container() <= 0)
9f9f0342
LP
694 boot_timestamps(m->timestamps + MANAGER_TIMESTAMP_USERSPACE,
695 m->timestamps + MANAGER_TIMESTAMP_FIRMWARE,
696 m->timestamps + MANAGER_TIMESTAMP_LOADER);
463d0d15
LP
697#endif
698
f2341e0a 699 /* Prepare log fields we can use for structured logging */
463d0d15
LP
700 if (MANAGER_IS_SYSTEM(m)) {
701 m->unit_log_field = "UNIT=";
702 m->unit_log_format_string = "UNIT=%s";
4b58153d
LP
703
704 m->invocation_log_field = "INVOCATION_ID=";
f1c50bec 705 m->invocation_log_format_string = "INVOCATION_ID=%s";
463d0d15
LP
706 } else {
707 m->unit_log_field = "USER_UNIT=";
708 m->unit_log_format_string = "USER_UNIT=%s";
4b58153d
LP
709
710 m->invocation_log_field = "USER_INVOCATION_ID=";
f1c50bec 711 m->invocation_log_format_string = "USER_INVOCATION_ID=%s";
463d0d15 712 }
f2341e0a 713
718db961 714 m->idle_pipe[0] = m->idle_pipe[1] = m->idle_pipe[2] = m->idle_pipe[3] = -1;
8742514c 715
d8fdc620 716 m->pin_cgroupfs_fd = m->notify_fd = m->cgroups_agent_fd = m->signal_fd = m->time_change_fd =
232f6754 717 m->dev_autofs_fd = m->private_listen_fd = m->cgroup_inotify_fd =
d8fdc620 718 m->ask_password_inotify_fd = -1;
d379d442 719
00d9ef85
LP
720 m->user_lookup_fds[0] = m->user_lookup_fds[1] = -1;
721
ea430986 722 m->current_job_id = 1; /* start as id #1, so that we can leave #0 around as "null-like" value */
9152c765 723
e46b13c8 724 m->have_ask_password = -EINVAL; /* we don't know */
ae2a2c53 725 m->first_boot = -1;
e46b13c8 726
e0a3da1f 727 m->test_run_flags = test_run_flags;
0d8c31ff 728
2e5c94b9
LP
729 /* Reboot immediately if the user hits C-A-D more often than 7x per 2s */
730 RATELIMIT_INIT(m->ctrl_alt_del_ratelimit, 2 * USEC_PER_SEC, 7);
731
e21fea24
KS
732 r = manager_default_environment(m);
733 if (r < 0)
c70cac54 734 return r;
1137a57c 735
d5099efc 736 r = hashmap_ensure_allocated(&m->units, &string_hash_ops);
718db961 737 if (r < 0)
c70cac54 738 return r;
60918275 739
d5099efc 740 r = hashmap_ensure_allocated(&m->jobs, NULL);
718db961 741 if (r < 0)
c70cac54 742 return r;
60918275 743
548f6937 744 r = hashmap_ensure_allocated(&m->cgroup_unit, &path_hash_ops);
718db961 745 if (r < 0)
c70cac54 746 return r;
9152c765 747
d5099efc 748 r = hashmap_ensure_allocated(&m->watch_bus, &string_hash_ops);
718db961 749 if (r < 0)
c70cac54 750 return r;
05e343b7 751
e8112e67 752 r = manager_setup_prefix(m);
718db961 753 if (r < 0)
c70cac54 754 return r;
8742514c 755
e8112e67
ZJS
756 m->udev = udev_new();
757 if (!m->udev)
758 return -ENOMEM;
752b5905 759
e8112e67 760 r = sd_event_default(&m->event);
8742514c 761 if (r < 0)
c70cac54 762 return r;
9152c765 763
e8112e67 764 r = manager_setup_run_queue(m);
a1d32bac 765 if (r < 0)
c70cac54 766 return r;
8e274523 767
e8112e67
ZJS
768 if (test_run_flags == MANAGER_TEST_RUN_MINIMAL) {
769 m->cgroup_root = strdup("");
770 if (!m->cgroup_root)
771 return -ENOMEM;
772 } else {
773 r = manager_setup_signals(m);
774 if (r < 0)
775 return r;
8c47c732 776
e8112e67
ZJS
777 r = manager_setup_cgroup(m);
778 if (r < 0)
779 return r;
575b300b 780
e8112e67
ZJS
781 r = manager_setup_time_change(m);
782 if (r < 0)
783 return r;
9670d583 784
e8112e67
ZJS
785 r = manager_setup_sigchld_event_source(m);
786 if (r < 0)
787 return r;
788 }
e27fe688 789
5eb397cf 790 if (MANAGER_IS_SYSTEM(m) && test_run_flags == 0) {
d3070fbd
LP
791 r = mkdir_label("/run/systemd/units", 0755);
792 if (r < 0 && r != -EEXIST)
c70cac54 793 return r;
d3070fbd
LP
794 }
795
e27fe688
LP
796 m->taint_usr =
797 !in_initrd() &&
798 dir_is_empty("/usr") > 0;
799
232f6754
ZJS
800 /* Note that we do not set up the notify fd here. We do that after deserialization,
801 * since they might have gotten serialized across the reexec. */
3536f49e 802
8e274523 803 *_m = m;
c70cac54 804 m = NULL;
8e274523 805 return 0;
60918275
LP
806}
807
d86f9d52 808static int manager_setup_notify(Manager *m) {
7181dbdb 809 int r;
d86f9d52 810
e0a3da1f 811 if (m->test_run_flags)
0d8c31ff
ZJS
812 return 0;
813
d86f9d52
LP
814 if (m->notify_fd < 0) {
815 _cleanup_close_ int fd = -1;
920b52e4 816 union sockaddr_union sa = {
7181dbdb
LP
817 .sa.sa_family = AF_UNIX,
818 };
55836941 819 static const int one = 1;
d86f9d52
LP
820
821 /* First free all secondary fields */
a1e58e8e 822 m->notify_socket = mfree(m->notify_socket);
d86f9d52
LP
823 m->notify_event_source = sd_event_source_unref(m->notify_event_source);
824
825 fd = socket(AF_UNIX, SOCK_DGRAM|SOCK_CLOEXEC|SOCK_NONBLOCK, 0);
4a62c710
MS
826 if (fd < 0)
827 return log_error_errno(errno, "Failed to allocate notification socket: %m");
d86f9d52 828
a47806fa
LP
829 fd_inc_rcvbuf(fd, NOTIFY_RCVBUF_SIZE);
830
3536f49e 831 m->notify_socket = strappend(m->prefix[EXEC_DIRECTORY_RUNTIME], "/systemd/notify");
498e87d6
LP
832 if (!m->notify_socket)
833 return log_oom();
834
835 (void) mkdir_parents_label(m->notify_socket, 0755);
f0e62e89 836 (void) unlink(m->notify_socket);
7181dbdb
LP
837
838 strncpy(sa.un.sun_path, m->notify_socket, sizeof(sa.un.sun_path)-1);
fc2fffe7 839 r = bind(fd, &sa.sa, SOCKADDR_UN_LEN(sa.un));
4a62c710
MS
840 if (r < 0)
841 return log_error_errno(errno, "bind(%s) failed: %m", sa.un.sun_path);
d86f9d52
LP
842
843 r = setsockopt(fd, SOL_SOCKET, SO_PASSCRED, &one, sizeof(one));
4a62c710
MS
844 if (r < 0)
845 return log_error_errno(errno, "SO_PASSCRED failed: %m");
d86f9d52 846
d86f9d52
LP
847 m->notify_fd = fd;
848 fd = -1;
849
850 log_debug("Using notification socket %s", m->notify_socket);
851 }
852
853 if (!m->notify_event_source) {
151b9b96 854 r = sd_event_add_io(m->event, &m->notify_event_source, m->notify_fd, EPOLLIN, manager_dispatch_notify_fd, m);
895b3a7b
MS
855 if (r < 0)
856 return log_error_errno(r, "Failed to allocate notify event source: %m");
d86f9d52 857
d8fdc620
LP
858 /* Process notification messages a bit earlier than SIGCHLD, so that we can still identify to which
859 * service an exit message belongs. */
575b300b 860 r = sd_event_source_set_priority(m->notify_event_source, SD_EVENT_PRIORITY_NORMAL-8);
23bbb0de
MS
861 if (r < 0)
862 return log_error_errno(r, "Failed to set priority of notify event source: %m");
7dfbe2e3
TG
863
864 (void) sd_event_source_set_description(m->notify_event_source, "manager-notify");
d86f9d52
LP
865 }
866
867 return 0;
868}
869
d8fdc620
LP
870static int manager_setup_cgroups_agent(Manager *m) {
871
872 static const union sockaddr_union sa = {
873 .un.sun_family = AF_UNIX,
874 .un.sun_path = "/run/systemd/cgroups-agent",
875 };
876 int r;
877
878 /* This creates a listening socket we receive cgroups agent messages on. We do not use D-Bus for delivering
879 * these messages from the cgroups agent binary to PID 1, as the cgroups agent binary is very short-living, and
880 * each instance of it needs a new D-Bus connection. Since D-Bus connections are SOCK_STREAM/AF_UNIX, on
881 * overloaded systems the backlog of the D-Bus socket becomes relevant, as not more than the configured number
882 * of D-Bus connections may be queued until the kernel will start dropping further incoming connections,
883 * possibly resulting in lost cgroups agent messages. To avoid this, we'll use a private SOCK_DGRAM/AF_UNIX
884 * socket, where no backlog is relevant as communication may take place without an actual connect() cycle, and
885 * we thus won't lose messages.
886 *
887 * Note that PID 1 will forward the agent message to system bus, so that the user systemd instance may listen
888 * to it. The system instance hence listens on this special socket, but the user instances listen on the system
889 * bus for these messages. */
890
e0a3da1f 891 if (m->test_run_flags)
d8fdc620
LP
892 return 0;
893
894 if (!MANAGER_IS_SYSTEM(m))
895 return 0;
896
c22800e4 897 r = cg_unified_controller(SYSTEMD_CGROUP_CONTROLLER);
b4cccbc1
LP
898 if (r < 0)
899 return log_error_errno(r, "Failed to determine whether unified cgroups hierarchy is used: %m");
900 if (r > 0) /* We don't need this anymore on the unified hierarchy */
d8fdc620
LP
901 return 0;
902
903 if (m->cgroups_agent_fd < 0) {
904 _cleanup_close_ int fd = -1;
905
906 /* First free all secondary fields */
907 m->cgroups_agent_event_source = sd_event_source_unref(m->cgroups_agent_event_source);
908
909 fd = socket(AF_UNIX, SOCK_DGRAM|SOCK_CLOEXEC|SOCK_NONBLOCK, 0);
910 if (fd < 0)
911 return log_error_errno(errno, "Failed to allocate cgroups agent socket: %m");
912
913 fd_inc_rcvbuf(fd, CGROUPS_AGENT_RCVBUF_SIZE);
914
915 (void) unlink(sa.un.sun_path);
916
917 /* Only allow root to connect to this socket */
918 RUN_WITH_UMASK(0077)
fc2fffe7 919 r = bind(fd, &sa.sa, SOCKADDR_UN_LEN(sa.un));
d8fdc620
LP
920 if (r < 0)
921 return log_error_errno(errno, "bind(%s) failed: %m", sa.un.sun_path);
922
923 m->cgroups_agent_fd = fd;
924 fd = -1;
925 }
926
927 if (!m->cgroups_agent_event_source) {
928 r = sd_event_add_io(m->event, &m->cgroups_agent_event_source, m->cgroups_agent_fd, EPOLLIN, manager_dispatch_cgroups_agent_fd, m);
929 if (r < 0)
930 return log_error_errno(r, "Failed to allocate cgroups agent event source: %m");
931
932 /* Process cgroups notifications early, but after having processed service notification messages or
933 * SIGCHLD signals, so that a cgroup running empty is always just the last safety net of notification,
934 * and we collected the metadata the notification and SIGCHLD stuff offers first. Also see handling of
935 * cgroup inotify for the unified cgroup stuff. */
09e24654 936 r = sd_event_source_set_priority(m->cgroups_agent_event_source, SD_EVENT_PRIORITY_NORMAL-4);
d8fdc620
LP
937 if (r < 0)
938 return log_error_errno(r, "Failed to set priority of cgroups agent event source: %m");
939
940 (void) sd_event_source_set_description(m->cgroups_agent_event_source, "manager-cgroups-agent");
941 }
942
943 return 0;
944}
945
00d9ef85
LP
946static int manager_setup_user_lookup_fd(Manager *m) {
947 int r;
948
949 assert(m);
950
951 /* Set up the socket pair used for passing UID/GID resolution results from forked off processes to PID
952 * 1. Background: we can't do name lookups (NSS) from PID 1, since it might involve IPC and thus activation,
953 * and we might hence deadlock on ourselves. Hence we do all user/group lookups asynchronously from the forked
954 * off processes right before executing the binaries to start. In order to be able to clean up any IPC objects
955 * created by a unit (see RemoveIPC=) we need to know in PID 1 the used UID/GID of the executed processes,
956 * hence we establish this communication channel so that forked off processes can pass their UID/GID
957 * information back to PID 1. The forked off processes send their resolved UID/GID to PID 1 in a simple
958 * datagram, along with their unit name, so that we can share one communication socket pair among all units for
959 * this purpose.
960 *
961 * You might wonder why we need a communication channel for this that is independent of the usual notification
962 * socket scheme (i.e. $NOTIFY_SOCKET). The primary difference is about trust: data sent via the $NOTIFY_SOCKET
963 * channel is only accepted if it originates from the right unit and if reception was enabled for it. The user
964 * lookup socket OTOH is only accessible by PID 1 and its children until they exec(), and always available.
965 *
966 * Note that this function is called under two circumstances: when we first initialize (in which case we
967 * allocate both the socket pair and the event source to listen on it), and when we deserialize after a reload
968 * (in which case the socket pair already exists but we still need to allocate the event source for it). */
969
970 if (m->user_lookup_fds[0] < 0) {
971
972 /* Free all secondary fields */
973 safe_close_pair(m->user_lookup_fds);
974 m->user_lookup_event_source = sd_event_source_unref(m->user_lookup_event_source);
975
976 if (socketpair(AF_UNIX, SOCK_DGRAM|SOCK_CLOEXEC, 0, m->user_lookup_fds) < 0)
977 return log_error_errno(errno, "Failed to allocate user lookup socket: %m");
978
979 (void) fd_inc_rcvbuf(m->user_lookup_fds[0], NOTIFY_RCVBUF_SIZE);
980 }
981
982 if (!m->user_lookup_event_source) {
983 r = sd_event_add_io(m->event, &m->user_lookup_event_source, m->user_lookup_fds[0], EPOLLIN, manager_dispatch_user_lookup_fd, m);
984 if (r < 0)
985 return log_error_errno(errno, "Failed to allocate user lookup event source: %m");
986
987 /* Process even earlier than the notify event source, so that we always know first about valid UID/GID
988 * resolutions */
67ae4e8d 989 r = sd_event_source_set_priority(m->user_lookup_event_source, SD_EVENT_PRIORITY_NORMAL-11);
00d9ef85
LP
990 if (r < 0)
991 return log_error_errno(errno, "Failed to set priority ot user lookup event source: %m");
992
993 (void) sd_event_source_set_description(m->user_lookup_event_source, "user-lookup");
994 }
995
996 return 0;
997}
998
23a177ef 999static unsigned manager_dispatch_cleanup_queue(Manager *m) {
595ed347 1000 Unit *u;
23a177ef
LP
1001 unsigned n = 0;
1002
1003 assert(m);
1004
595ed347
MS
1005 while ((u = m->cleanup_queue)) {
1006 assert(u->in_cleanup_queue);
23a177ef 1007
595ed347 1008 unit_free(u);
23a177ef
LP
1009 n++;
1010 }
1011
1012 return n;
1013}
1014
eced69b3 1015enum {
35b8ca3a 1016 GC_OFFSET_IN_PATH, /* This one is on the path we were traveling */
eced69b3
LP
1017 GC_OFFSET_UNSURE, /* No clue */
1018 GC_OFFSET_GOOD, /* We still need this unit */
1019 GC_OFFSET_BAD, /* We don't need this unit anymore */
1020 _GC_OFFSET_MAX
1021};
1022
00d9ef85 1023static void unit_gc_mark_good(Unit *u, unsigned gc_marker) {
4892084f 1024 Unit *other;
eef85c4a
LP
1025 Iterator i;
1026 void *v;
4892084f
LN
1027
1028 u->gc_marker = gc_marker + GC_OFFSET_GOOD;
1029
1030 /* Recursively mark referenced units as GOOD as well */
eef85c4a 1031 HASHMAP_FOREACH_KEY(v, other, u->dependencies[UNIT_REFERENCES], i)
4892084f
LN
1032 if (other->gc_marker == gc_marker + GC_OFFSET_UNSURE)
1033 unit_gc_mark_good(other, gc_marker);
1034}
1035
eced69b3 1036static void unit_gc_sweep(Unit *u, unsigned gc_marker) {
701cc384 1037 Unit *other;
eced69b3 1038 bool is_bad;
eef85c4a
LP
1039 Iterator i;
1040 void *v;
701cc384
LP
1041
1042 assert(u);
1043
4c701096
YW
1044 if (IN_SET(u->gc_marker - gc_marker,
1045 GC_OFFSET_GOOD, GC_OFFSET_BAD, GC_OFFSET_UNSURE, GC_OFFSET_IN_PATH))
701cc384
LP
1046 return;
1047
ac155bb8 1048 if (u->in_cleanup_queue)
701cc384
LP
1049 goto bad;
1050
f2f725e5 1051 if (!unit_may_gc(u))
701cc384
LP
1052 goto good;
1053
ac155bb8 1054 u->gc_marker = gc_marker + GC_OFFSET_IN_PATH;
eced69b3
LP
1055
1056 is_bad = true;
1057
eef85c4a 1058 HASHMAP_FOREACH_KEY(v, other, u->dependencies[UNIT_REFERENCED_BY], i) {
701cc384
LP
1059 unit_gc_sweep(other, gc_marker);
1060
ac155bb8 1061 if (other->gc_marker == gc_marker + GC_OFFSET_GOOD)
701cc384 1062 goto good;
eced69b3 1063
ac155bb8 1064 if (other->gc_marker != gc_marker + GC_OFFSET_BAD)
eced69b3 1065 is_bad = false;
701cc384
LP
1066 }
1067
2641f02e
ZJS
1068 if (u->refs_by_target) {
1069 const UnitRef *ref;
1070
1071 LIST_FOREACH(refs_by_target, ref, u->refs_by_target) {
1072 unit_gc_sweep(ref->source, gc_marker);
1073
1074 if (ref->source->gc_marker == gc_marker + GC_OFFSET_GOOD)
1075 goto good;
1076
1077 if (ref->source->gc_marker != gc_marker + GC_OFFSET_BAD)
1078 is_bad = false;
1079 }
1080 }
701cc384 1081
eced69b3
LP
1082 if (is_bad)
1083 goto bad;
1084
1085 /* We were unable to find anything out about this entry, so
1086 * let's investigate it later */
ac155bb8 1087 u->gc_marker = gc_marker + GC_OFFSET_UNSURE;
eced69b3
LP
1088 unit_add_to_gc_queue(u);
1089 return;
1090
701cc384 1091bad:
eced69b3
LP
1092 /* We definitely know that this one is not useful anymore, so
1093 * let's mark it for deletion */
ac155bb8 1094 u->gc_marker = gc_marker + GC_OFFSET_BAD;
eced69b3 1095 unit_add_to_cleanup_queue(u);
701cc384
LP
1096 return;
1097
1098good:
4892084f 1099 unit_gc_mark_good(u, gc_marker);
701cc384
LP
1100}
1101
c5a97ed1
LP
1102static unsigned manager_dispatch_gc_unit_queue(Manager *m) {
1103 unsigned n = 0, gc_marker;
595ed347 1104 Unit *u;
701cc384
LP
1105
1106 assert(m);
1107
cf1265e1 1108 /* log_debug("Running GC..."); */
701cc384 1109
eced69b3
LP
1110 m->gc_marker += _GC_OFFSET_MAX;
1111 if (m->gc_marker + _GC_OFFSET_MAX <= _GC_OFFSET_MAX)
c9c0cadb 1112 m->gc_marker = 1;
701cc384 1113
eced69b3
LP
1114 gc_marker = m->gc_marker;
1115
c5a97ed1 1116 while ((u = m->gc_unit_queue)) {
595ed347 1117 assert(u->in_gc_queue);
701cc384 1118
595ed347 1119 unit_gc_sweep(u, gc_marker);
eced69b3 1120
c5a97ed1 1121 LIST_REMOVE(gc_queue, m->gc_unit_queue, u);
595ed347 1122 u->in_gc_queue = false;
701cc384
LP
1123
1124 n++;
1125
4c701096
YW
1126 if (IN_SET(u->gc_marker - gc_marker,
1127 GC_OFFSET_BAD, GC_OFFSET_UNSURE)) {
cc3bc3e6 1128 if (u->id)
f2341e0a 1129 log_unit_debug(u, "Collecting.");
595ed347
MS
1130 u->gc_marker = gc_marker + GC_OFFSET_BAD;
1131 unit_add_to_cleanup_queue(u);
701cc384
LP
1132 }
1133 }
1134
701cc384
LP
1135 return n;
1136}
1137
c5a97ed1
LP
1138static unsigned manager_dispatch_gc_job_queue(Manager *m) {
1139 unsigned n = 0;
1140 Job *j;
1141
1142 assert(m);
1143
1144 while ((j = m->gc_job_queue)) {
1145 assert(j->in_gc_queue);
1146
1147 LIST_REMOVE(gc_queue, m->gc_job_queue, j);
1148 j->in_gc_queue = false;
1149
1150 n++;
1151
2ab3050f 1152 if (!job_may_gc(j))
c5a97ed1
LP
1153 continue;
1154
1155 log_unit_debug(j->unit, "Collecting job.");
1156 (void) job_finish_and_invalidate(j, JOB_COLLECTED, false, false);
1157 }
1158
1159 return n;
1160}
1161
a16e1123 1162static void manager_clear_jobs_and_units(Manager *m) {
a16e1123 1163 Unit *u;
60918275
LP
1164
1165 assert(m);
1166
87f0e418
LP
1167 while ((u = hashmap_first(m->units)))
1168 unit_free(u);
964e0949
LP
1169
1170 manager_dispatch_cleanup_queue(m);
1171
1172 assert(!m->load_queue);
1173 assert(!m->run_queue);
1174 assert(!m->dbus_unit_queue);
1175 assert(!m->dbus_job_queue);
1176 assert(!m->cleanup_queue);
c5a97ed1
LP
1177 assert(!m->gc_unit_queue);
1178 assert(!m->gc_job_queue);
964e0949 1179
964e0949
LP
1180 assert(hashmap_isempty(m->jobs));
1181 assert(hashmap_isempty(m->units));
9e9e2b72
MS
1182
1183 m->n_on_console = 0;
1184 m->n_running_jobs = 0;
a16e1123
LP
1185}
1186
06d8d842 1187Manager* manager_free(Manager *m) {
a16e1123 1188 UnitType c;
c93ff2e9 1189 int i;
35aba85a 1190 ExecDirectoryType dt;
87f0e418 1191
06d8d842
ZJS
1192 if (!m)
1193 return NULL;
a16e1123
LP
1194
1195 manager_clear_jobs_and_units(m);
23a177ef 1196
7824bbeb
LP
1197 for (c = 0; c < _UNIT_TYPE_MAX; c++)
1198 if (unit_vtable[c]->shutdown)
1199 unit_vtable[c]->shutdown(m);
1200
a1f31f47 1201 /* If we reexecute ourselves, we keep the root cgroup around */
c6c18be3 1202 manager_shutdown_cgroup(m, m->exit_code != MANAGER_REEXECUTE);
8e274523 1203
07a78643 1204 lookup_paths_flush_generator(&m->lookup_paths);
5a1e9937 1205
5e8d1c9a 1206 bus_done(m);
ea430986 1207
e8a565cb
YW
1208 exec_runtime_vacuum(m);
1209 hashmap_free(m->exec_runtime_by_id);
1210
29206d46
LP
1211 dynamic_user_vacuum(m, false);
1212 hashmap_free(m->dynamic_users);
1213
87f0e418 1214 hashmap_free(m->units);
4b58153d 1215 hashmap_free(m->units_by_invocation_id);
60918275 1216 hashmap_free(m->jobs);
62a76913 1217 hashmap_free(m->watch_pids);
05e343b7 1218 hashmap_free(m->watch_bus);
9152c765 1219
95ae05c0 1220 set_free(m->startup_units);
f755e3b7
LP
1221 set_free(m->failed_units);
1222
718db961 1223 sd_event_source_unref(m->signal_event_source);
575b300b 1224 sd_event_source_unref(m->sigchld_event_source);
718db961 1225 sd_event_source_unref(m->notify_event_source);
d8fdc620 1226 sd_event_source_unref(m->cgroups_agent_event_source);
718db961
LP
1227 sd_event_source_unref(m->time_change_event_source);
1228 sd_event_source_unref(m->jobs_in_progress_event_source);
752b5905 1229 sd_event_source_unref(m->run_queue_event_source);
00d9ef85 1230 sd_event_source_unref(m->user_lookup_event_source);
5f109056 1231 sd_event_source_unref(m->sync_bus_names_event_source);
718db961 1232
03e334a1
LP
1233 safe_close(m->signal_fd);
1234 safe_close(m->notify_fd);
d8fdc620 1235 safe_close(m->cgroups_agent_fd);
03e334a1 1236 safe_close(m->time_change_fd);
00d9ef85 1237 safe_close_pair(m->user_lookup_fds);
718db961 1238
e46b13c8
ZJS
1239 manager_close_ask_password(m);
1240
718db961
LP
1241 manager_close_idle_pipe(m);
1242
9670d583 1243 udev_unref(m->udev);
718db961 1244 sd_event_unref(m->event);
60918275 1245
c952c6ec
LP
1246 free(m->notify_socket);
1247
84e3543e 1248 lookup_paths_free(&m->lookup_paths);
1137a57c 1249 strv_free(m->environment);
036643a2 1250
4ad49000 1251 hashmap_free(m->cgroup_unit);
c6c18be3 1252 set_free_free(m->unit_path_cache);
33be102a 1253
664f88a7
LP
1254 free(m->switch_root);
1255 free(m->switch_root_init);
1256
517d56b1 1257 for (i = 0; i < _RLIMIT_MAX; i++)
d9814c76 1258 m->rlimit[i] = mfree(m->rlimit[i]);
c93ff2e9 1259
a57f7e2c
LP
1260 assert(hashmap_isempty(m->units_requiring_mounts_for));
1261 hashmap_free(m->units_requiring_mounts_for);
1262
00d9ef85
LP
1263 hashmap_free(m->uid_refs);
1264 hashmap_free(m->gid_refs);
1265
72fd1768 1266 for (dt = 0; dt < _EXEC_DIRECTORY_TYPE_MAX; dt++)
35aba85a
YW
1267 m->prefix[dt] = mfree(m->prefix[dt]);
1268
6b430fdb 1269 return mfree(m);
60918275
LP
1270}
1271
ba64af90 1272void manager_enumerate(Manager *m) {
f50e0a01 1273 UnitType c;
f50e0a01
LP
1274
1275 assert(m);
1276
a16e1123
LP
1277 /* Let's ask every type to load all units from disk/kernel
1278 * that it might know */
0faacd47 1279 for (c = 0; c < _UNIT_TYPE_MAX; c++) {
1c2e9646 1280 if (!unit_type_supported(c)) {
03afec3c 1281 log_debug("Unit type .%s is not supported on this system.", unit_type_to_string(c));
0faacd47 1282 continue;
a57f7e2c 1283 }
f50e0a01 1284
0faacd47
LP
1285 if (!unit_vtable[c]->enumerate)
1286 continue;
1287
ba64af90 1288 unit_vtable[c]->enumerate(m);
0faacd47
LP
1289 }
1290
f50e0a01 1291 manager_dispatch_load_queue(m);
a16e1123
LP
1292}
1293
007c6337 1294static void manager_coldplug(Manager *m) {
a16e1123
LP
1295 Iterator i;
1296 Unit *u;
1297 char *k;
007c6337 1298 int r;
a16e1123
LP
1299
1300 assert(m);
f50e0a01
LP
1301
1302 /* Then, let's set up their initial state. */
1303 HASHMAP_FOREACH_KEY(u, k, m->units, i) {
1304
1305 /* ignore aliases */
ac155bb8 1306 if (u->id != k)
f50e0a01
LP
1307 continue;
1308
007c6337
LP
1309 r = unit_coldplug(u);
1310 if (r < 0)
1311 log_warning_errno(r, "We couldn't coldplug %s, proceeding anyway: %m", u->id);
f50e0a01 1312 }
a16e1123
LP
1313}
1314
fe51822e
LP
1315static void manager_build_unit_path_cache(Manager *m) {
1316 char **i;
fe51822e
LP
1317 int r;
1318
1319 assert(m);
1320
1321 set_free_free(m->unit_path_cache);
1322
548f6937 1323 m->unit_path_cache = set_new(&path_hash_ops);
874310b7 1324 if (!m->unit_path_cache) {
d063a527
LP
1325 r = -ENOMEM;
1326 goto fail;
fe51822e
LP
1327 }
1328
1329 /* This simply builds a list of files we know exist, so that
1330 * we don't always have to go to disk */
1331
a3c4eb07 1332 STRV_FOREACH(i, m->lookup_paths.search_path) {
d063a527 1333 _cleanup_closedir_ DIR *d = NULL;
fe51822e
LP
1334 struct dirent *de;
1335
bd0af849
ZJS
1336 d = opendir(*i);
1337 if (!d) {
874310b7 1338 if (errno != ENOENT)
d063a527 1339 log_warning_errno(errno, "Failed to open directory %s, ignoring: %m", *i);
fe51822e
LP
1340 continue;
1341 }
1342
d063a527 1343 FOREACH_DIRENT(de, d, r = -errno; goto fail) {
fe51822e
LP
1344 char *p;
1345
605405c6 1346 p = strjoin(streq(*i, "/") ? "" : *i, "/", de->d_name);
44d91056 1347 if (!p) {
fe51822e
LP
1348 r = -ENOMEM;
1349 goto fail;
1350 }
1351
ef42202a
ZJS
1352 r = set_consume(m->unit_path_cache, p);
1353 if (r < 0)
fe51822e 1354 goto fail;
fe51822e 1355 }
fe51822e
LP
1356 }
1357
1358 return;
1359
1360fail:
d063a527
LP
1361 log_warning_errno(r, "Failed to build unit path cache, proceeding without: %m");
1362 m->unit_path_cache = set_free_free(m->unit_path_cache);
fe51822e
LP
1363}
1364
9ff1a6f1 1365static void manager_distribute_fds(Manager *m, FDSet *fds) {
9588bc32 1366 Iterator i;
9ff1a6f1 1367 Unit *u;
9588bc32
LP
1368
1369 assert(m);
1370
1371 HASHMAP_FOREACH(u, m->units, i) {
1372
1373 if (fdset_size(fds) <= 0)
1374 break;
1375
9ff1a6f1
LP
1376 if (!UNIT_VTABLE(u)->distribute_fds)
1377 continue;
9588bc32 1378
9ff1a6f1
LP
1379 UNIT_VTABLE(u)->distribute_fds(u, fds);
1380 }
9588bc32
LP
1381}
1382
8559b3b7
LP
1383static bool manager_dbus_is_running(Manager *m, bool deserialized) {
1384 Unit *u;
1385
1386 assert(m);
1387
1388 /* This checks whether the dbus instance we are supposed to expose our APIs on is up. We check both the socket
1389 * and the service unit. If the 'deserialized' parameter is true we'll check the deserialized state of the unit
1390 * rather than the current one. */
1391
1392 if (m->test_run_flags != 0)
1393 return false;
1394
1395 /* If we are in the user instance, and the env var is already set for us, then this means D-Bus is ran
1396 * somewhere outside of our own logic. Let's use it */
1397 if (MANAGER_IS_USER(m) && getenv("DBUS_SESSION_BUS_ADDRESS"))
1398 return true;
1399
1400 u = manager_get_unit(m, SPECIAL_DBUS_SOCKET);
1401 if (!u)
1402 return false;
1403 if ((deserialized ? SOCKET(u)->deserialized_state : SOCKET(u)->state) != SOCKET_RUNNING)
1404 return false;
1405
1406 u = manager_get_unit(m, SPECIAL_DBUS_SERVICE);
1407 if (!u)
1408 return false;
1409 if (!IN_SET((deserialized ? SERVICE(u)->deserialized_state : SERVICE(u)->state), SERVICE_RUNNING, SERVICE_RELOAD))
1410 return false;
1411
1412 return true;
1413}
1414
a16e1123 1415int manager_startup(Manager *m, FILE *serialization, FDSet *fds) {
17f01ace 1416 int r;
a16e1123
LP
1417
1418 assert(m);
1419
a1f31f47
ZJS
1420 /* If we are running in test mode, we still want to run the generators,
1421 * but we should not touch the real generator directories. */
1422 r = lookup_paths_init(&m->lookup_paths, m->unit_file_scope,
e0a3da1f 1423 m->test_run_flags ? LOOKUP_PATHS_TEMPORARY_GENERATED : 0,
a1f31f47 1424 NULL);
e801700e
ZJS
1425 if (r < 0)
1426 return r;
5a1e9937 1427
64691d20
ZJS
1428 r = manager_run_environment_generators(m);
1429 if (r < 0)
1430 return r;
1431
9f9f0342 1432 dual_timestamp_get(m->timestamps + MANAGER_TIMESTAMP_GENERATORS_START);
a3c4eb07 1433 r = manager_run_generators(m);
9f9f0342 1434 dual_timestamp_get(m->timestamps + MANAGER_TIMESTAMP_GENERATORS_FINISH);
07719a21
LP
1435 if (r < 0)
1436 return r;
1437
fd130612 1438 /* If this is the first boot, and we are in the host system, then preset everything */
81fe6cde 1439 if (m->first_boot > 0 &&
fd130612 1440 MANAGER_IS_SYSTEM(m) &&
e0a3da1f 1441 !m->test_run_flags) {
81fe6cde 1442
17f01ace
ZJS
1443 r = unit_file_preset_all(UNIT_FILE_SYSTEM, 0, NULL, UNIT_FILE_PRESET_ENABLE_ONLY, NULL, 0);
1444 if (r < 0)
1445 log_full_errno(r == -EEXIST ? LOG_NOTICE : LOG_WARNING, r,
1446 "Failed to populate /etc with preset unit settings, ignoring: %m");
28dd66ec
LB
1447 else
1448 log_info("Populated /etc with preset unit settings.");
1449 }
1450
a1453343 1451 lookup_paths_reduce(&m->lookup_paths);
fe51822e
LP
1452 manager_build_unit_path_cache(m);
1453
9f611ad8
LP
1454 /* If we will deserialize make sure that during enumeration
1455 * this is already known, so we increase the counter here
1456 * already */
1457 if (serialization)
313cefa1 1458 m->n_reloading++;
9f611ad8 1459
a16e1123 1460 /* First, enumerate what we can from all config files */
9f9f0342 1461 dual_timestamp_get(m->timestamps + MANAGER_TIMESTAMP_UNITS_LOAD_START);
ba64af90 1462 manager_enumerate(m);
9f9f0342 1463 dual_timestamp_get(m->timestamps + MANAGER_TIMESTAMP_UNITS_LOAD_FINISH);
a16e1123
LP
1464
1465 /* Second, deserialize if there is something to deserialize */
07429866 1466 if (serialization) {
1cd974ed 1467 r = manager_deserialize(m, serialization, fds);
07429866 1468 if (r < 0)
17f01ace 1469 return log_error_errno(r, "Deserialization failed: %m");
07429866 1470 }
a16e1123 1471
01e10de3
LP
1472 /* Any fds left? Find some unit which wants them. This is
1473 * useful to allow container managers to pass some file
1474 * descriptors to us pre-initialized. This enables
1475 * socket-based activation of entire containers. */
9ff1a6f1 1476 manager_distribute_fds(m, fds);
01e10de3 1477
d86f9d52
LP
1478 /* We might have deserialized the notify fd, but if we didn't
1479 * then let's create the bus now */
17f01ace
ZJS
1480 r = manager_setup_notify(m);
1481 if (r < 0)
1482 /* No sense to continue without notifications, our children would fail anyway. */
1483 return r;
d86f9d52 1484
17f01ace
ZJS
1485 r = manager_setup_cgroups_agent(m);
1486 if (r < 0)
1487 /* Likewise, no sense to continue without empty cgroup notifications. */
1488 return r;
d8fdc620 1489
17f01ace
ZJS
1490 r = manager_setup_user_lookup_fd(m);
1491 if (r < 0)
1492 /* This shouldn't fail, except if things are really broken. */
1493 return r;
00d9ef85 1494
8559b3b7
LP
1495 /* Let's set up our private bus connection now, unconditionally */
1496 (void) bus_init_private(m);
05a98afd 1497
8559b3b7
LP
1498 /* If we are in --user mode also connect to the system bus now */
1499 if (MANAGER_IS_USER(m))
1500 (void) bus_init_system(m);
1501
1502 /* Let's connect to the bus now, but only if the unit is supposed to be up */
1503 if (manager_dbus_is_running(m, !!serialization)) {
1504 (void) bus_init_api(m);
05a98afd 1505
8559b3b7
LP
1506 if (MANAGER_IS_SYSTEM(m))
1507 (void) bus_init_system(m);
1508 }
1509
1510 /* Now that we are connected to all possible busses, let's deserialize who is tracking us. */
05a98afd
LP
1511 (void) bus_track_coldplug(m, &m->subscribed, false, m->deserialized_subscribed);
1512 m->deserialized_subscribed = strv_free(m->deserialized_subscribed);
e3dd987c 1513
a16e1123 1514 /* Third, fire things up! */
007c6337 1515 manager_coldplug(m);
a16e1123 1516
29206d46
LP
1517 /* Release any dynamic users no longer referenced */
1518 dynamic_user_vacuum(m, true);
1519
e8a565cb
YW
1520 exec_runtime_vacuum(m);
1521
00d9ef85
LP
1522 /* Release any references to UIDs/GIDs no longer referenced, and destroy any IPC owned by them */
1523 manager_vacuum_uid_refs(m);
1524 manager_vacuum_gid_refs(m);
1525
9f611ad8 1526 if (serialization) {
a7556052 1527 assert(m->n_reloading > 0);
313cefa1 1528 m->n_reloading--;
71445ae7
LP
1529
1530 /* Let's wait for the UnitNew/JobNew messages being
1531 * sent, before we notify that the reload is
1532 * finished */
1533 m->send_reloading_done = true;
9f611ad8
LP
1534 }
1535
17f01ace 1536 return 0;
f50e0a01
LP
1537}
1538
4bd29fe5 1539int manager_add_job(Manager *m, JobType type, Unit *unit, JobMode mode, sd_bus_error *e, Job **_ret) {
e5b5ae50 1540 int r;
7527cb52 1541 Transaction *tr;
e5b5ae50
LP
1542
1543 assert(m);
1544 assert(type < _JOB_TYPE_MAX);
87f0e418 1545 assert(unit);
e5b5ae50 1546 assert(mode < _JOB_MODE_MAX);
60918275 1547
7358dc02
ZJS
1548 if (mode == JOB_ISOLATE && type != JOB_START)
1549 return sd_bus_error_setf(e, SD_BUS_ERROR_INVALID_ARGS, "Isolate is only valid for start.");
c497c7a9 1550
7358dc02
ZJS
1551 if (mode == JOB_ISOLATE && !unit->allow_isolate)
1552 return sd_bus_error_setf(e, BUS_ERROR_NO_ISOLATION, "Operation refused, unit may not be isolated.");
2528a7a6 1553
f2341e0a 1554 log_unit_debug(unit, "Trying to enqueue job %s/%s/%s", unit->id, job_type_to_string(type), job_mode_to_string(mode));
9f04bd52 1555
c6497ccb 1556 type = job_type_collapse(type, unit);
e0209d83 1557
23ade460 1558 tr = transaction_new(mode == JOB_REPLACE_IRREVERSIBLY);
7527cb52
MS
1559 if (!tr)
1560 return -ENOMEM;
11dd41ce 1561
4bd29fe5 1562 r = transaction_add_job_and_dependencies(tr, type, unit, NULL, true, false,
3742095b 1563 IN_SET(mode, JOB_IGNORE_DEPENDENCIES, JOB_IGNORE_REQUIREMENTS),
b94fbd30 1564 mode == JOB_IGNORE_DEPENDENCIES, e);
7527cb52
MS
1565 if (r < 0)
1566 goto tr_abort;
c497c7a9 1567
7527cb52
MS
1568 if (mode == JOB_ISOLATE) {
1569 r = transaction_add_isolate_jobs(tr, m);
1570 if (r < 0)
1571 goto tr_abort;
1572 }
1573
1574 r = transaction_activate(tr, m, mode, e);
1575 if (r < 0)
1576 goto tr_abort;
e5b5ae50 1577
f2341e0a 1578 log_unit_debug(unit,
66870f90
ZJS
1579 "Enqueued job %s/%s as %u", unit->id,
1580 job_type_to_string(type), (unsigned) tr->anchor_job->id);
f50e0a01 1581
e5b5ae50 1582 if (_ret)
b94fbd30 1583 *_ret = tr->anchor_job;
60918275 1584
7527cb52 1585 transaction_free(tr);
e5b5ae50 1586 return 0;
7527cb52
MS
1587
1588tr_abort:
1589 transaction_abort(tr);
1590 transaction_free(tr);
1591 return r;
e5b5ae50 1592}
60918275 1593
53f18416 1594int manager_add_job_by_name(Manager *m, JobType type, const char *name, JobMode mode, sd_bus_error *e, Job **ret) {
4440b27d 1595 Unit *unit = NULL; /* just to appease gcc, initialization is not really necessary */
28247076
LP
1596 int r;
1597
1598 assert(m);
1599 assert(type < _JOB_TYPE_MAX);
1600 assert(name);
1601 assert(mode < _JOB_MODE_MAX);
1602
c3090674
LP
1603 r = manager_load_unit(m, name, NULL, NULL, &unit);
1604 if (r < 0)
28247076 1605 return r;
4440b27d 1606 assert(unit);
28247076 1607
53f18416
LP
1608 return manager_add_job(m, type, unit, mode, e, ret);
1609}
1610
1611int manager_add_job_by_name_and_warn(Manager *m, JobType type, const char *name, JobMode mode, Job **ret) {
4afd3348 1612 _cleanup_(sd_bus_error_free) sd_bus_error error = SD_BUS_ERROR_NULL;
53f18416
LP
1613 int r;
1614
1615 assert(m);
1616 assert(type < _JOB_TYPE_MAX);
1617 assert(name);
1618 assert(mode < _JOB_MODE_MAX);
1619
1620 r = manager_add_job_by_name(m, type, name, mode, &error, ret);
1621 if (r < 0)
1622 return log_warning_errno(r, "Failed to enqueue %s job for %s: %s", job_mode_to_string(mode), name, bus_error_message(&error, r));
1623
1624 return r;
28247076
LP
1625}
1626
15d167f8
JW
1627int manager_propagate_reload(Manager *m, Unit *unit, JobMode mode, sd_bus_error *e) {
1628 int r;
1629 Transaction *tr;
1630
1631 assert(m);
1632 assert(unit);
1633 assert(mode < _JOB_MODE_MAX);
1634 assert(mode != JOB_ISOLATE); /* Isolate is only valid for start */
1635
1636 tr = transaction_new(mode == JOB_REPLACE_IRREVERSIBLY);
1637 if (!tr)
1638 return -ENOMEM;
1639
1640 /* We need an anchor job */
1641 r = transaction_add_job_and_dependencies(tr, JOB_NOP, unit, NULL, false, false, true, true, e);
1642 if (r < 0)
1643 goto tr_abort;
1644
1645 /* Failure in adding individual dependencies is ignored, so this always succeeds. */
1646 transaction_add_propagate_reload_jobs(tr, unit, tr->anchor_job, mode == JOB_IGNORE_DEPENDENCIES, e);
1647
1648 r = transaction_activate(tr, m, mode, e);
1649 if (r < 0)
1650 goto tr_abort;
1651
1652 transaction_free(tr);
1653 return 0;
1654
1655tr_abort:
1656 transaction_abort(tr);
1657 transaction_free(tr);
1658 return r;
1659}
1660
60918275
LP
1661Job *manager_get_job(Manager *m, uint32_t id) {
1662 assert(m);
1663
1664 return hashmap_get(m->jobs, UINT32_TO_PTR(id));
1665}
1666
87f0e418 1667Unit *manager_get_unit(Manager *m, const char *name) {
60918275
LP
1668 assert(m);
1669 assert(name);
1670
87f0e418 1671 return hashmap_get(m->units, name);
60918275
LP
1672}
1673
c1e1601e 1674unsigned manager_dispatch_load_queue(Manager *m) {
595ed347 1675 Unit *u;
c1e1601e 1676 unsigned n = 0;
60918275
LP
1677
1678 assert(m);
1679
223dabab
LP
1680 /* Make sure we are not run recursively */
1681 if (m->dispatching_load_queue)
c1e1601e 1682 return 0;
223dabab
LP
1683
1684 m->dispatching_load_queue = true;
1685
87f0e418 1686 /* Dispatches the load queue. Takes a unit from the queue and
60918275
LP
1687 * tries to load its data until the queue is empty */
1688
595ed347
MS
1689 while ((u = m->load_queue)) {
1690 assert(u->in_load_queue);
034c6ed7 1691
595ed347 1692 unit_load(u);
c1e1601e 1693 n++;
60918275
LP
1694 }
1695
223dabab 1696 m->dispatching_load_queue = false;
c1e1601e 1697 return n;
60918275
LP
1698}
1699
c2756a68
LP
1700int manager_load_unit_prepare(
1701 Manager *m,
1702 const char *name,
1703 const char *path,
718db961 1704 sd_bus_error *e,
c2756a68
LP
1705 Unit **_ret) {
1706
dc409696 1707 _cleanup_(unit_freep) Unit *cleanup_ret = NULL;
87f0e418 1708 Unit *ret;
7d17cfbc 1709 UnitType t;
60918275
LP
1710 int r;
1711
1712 assert(m);
9e2f7c11 1713 assert(name || path);
7a6a095a 1714 assert(_ret);
60918275 1715
db06e3b6
LP
1716 /* This will prepare the unit for loading, but not actually
1717 * load anything from disk. */
0301abf4 1718
718db961
LP
1719 if (path && !is_path(path))
1720 return sd_bus_error_setf(e, SD_BUS_ERROR_INVALID_ARGS, "Path %s is not absolute.", path);
9e2f7c11
LP
1721
1722 if (!name)
2b6bf07d 1723 name = basename(path);
9e2f7c11 1724
7d17cfbc
MS
1725 t = unit_name_to_type(name);
1726
5d512d54
LN
1727 if (t == _UNIT_TYPE_INVALID || !unit_name_is_valid(name, UNIT_NAME_PLAIN|UNIT_NAME_INSTANCE)) {
1728 if (unit_name_is_valid(name, UNIT_NAME_TEMPLATE))
1729 return sd_bus_error_setf(e, SD_BUS_ERROR_INVALID_ARGS, "Unit name %s is missing the instance name.", name);
1730
718db961 1731 return sd_bus_error_setf(e, SD_BUS_ERROR_INVALID_ARGS, "Unit name %s is not valid.", name);
5d512d54 1732 }
60918275 1733
7d17cfbc
MS
1734 ret = manager_get_unit(m, name);
1735 if (ret) {
034c6ed7 1736 *_ret = ret;
413d6313 1737 return 1;
034c6ed7 1738 }
60918275 1739
dc409696 1740 ret = cleanup_ret = unit_new(m, unit_vtable[t]->object_size);
7d17cfbc 1741 if (!ret)
60918275
LP
1742 return -ENOMEM;
1743
7d17cfbc 1744 if (path) {
ac155bb8 1745 ret->fragment_path = strdup(path);
dc409696 1746 if (!ret->fragment_path)
0301abf4 1747 return -ENOMEM;
7d17cfbc 1748 }
0301abf4 1749
1058cbf2 1750 r = unit_add_name(ret, name);
dc409696 1751 if (r < 0)
1ffba6fe 1752 return r;
60918275 1753
87f0e418 1754 unit_add_to_load_queue(ret);
c1e1601e 1755 unit_add_to_dbus_queue(ret);
949061f0 1756 unit_add_to_gc_queue(ret);
c1e1601e 1757
7a6a095a 1758 *_ret = ret;
dc409696 1759 cleanup_ret = NULL;
db06e3b6
LP
1760
1761 return 0;
1762}
1763
c2756a68
LP
1764int manager_load_unit(
1765 Manager *m,
1766 const char *name,
1767 const char *path,
718db961 1768 sd_bus_error *e,
c2756a68
LP
1769 Unit **_ret) {
1770
db06e3b6
LP
1771 int r;
1772
1773 assert(m);
7a6a095a 1774 assert(_ret);
db06e3b6
LP
1775
1776 /* This will load the service information files, but not actually
1777 * start any services or anything. */
1778
c3090674
LP
1779 r = manager_load_unit_prepare(m, name, path, e, _ret);
1780 if (r != 0)
db06e3b6
LP
1781 return r;
1782
f50e0a01 1783 manager_dispatch_load_queue(m);
60918275 1784
7a6a095a 1785 *_ret = unit_follow_merge(*_ret);
9e2f7c11 1786
60918275
LP
1787 return 0;
1788}
a66d02c3 1789
cea8e32e 1790void manager_dump_jobs(Manager *s, FILE *f, const char *prefix) {
034c6ed7 1791 Iterator i;
a66d02c3
LP
1792 Job *j;
1793
1794 assert(s);
1795 assert(f);
1796
034c6ed7 1797 HASHMAP_FOREACH(j, s->jobs, i)
cea8e32e 1798 job_dump(j, f, prefix);
a66d02c3
LP
1799}
1800
87f0e418 1801void manager_dump_units(Manager *s, FILE *f, const char *prefix) {
034c6ed7 1802 Iterator i;
87f0e418 1803 Unit *u;
11dd41ce 1804 const char *t;
a66d02c3
LP
1805
1806 assert(s);
1807 assert(f);
1808
87f0e418 1809 HASHMAP_FOREACH_KEY(u, t, s->units, i)
ac155bb8 1810 if (u->id == t)
87f0e418 1811 unit_dump(u, f, prefix);
a66d02c3 1812}
7fad411c 1813
ad75b9e7
LP
1814void manager_dump(Manager *m, FILE *f, const char *prefix) {
1815 ManagerTimestamp q;
1816
1817 assert(m);
1818 assert(f);
1819
1820 for (q = 0; q < _MANAGER_TIMESTAMP_MAX; q++) {
1821 char buf[FORMAT_TIMESTAMP_MAX];
1822
1823 if (dual_timestamp_is_set(m->timestamps + q))
1824 fprintf(f, "%sTimestamp %s: %s\n",
1825 strempty(prefix),
1826 manager_timestamp_to_string(q),
1827 format_timestamp(buf, sizeof(buf), m->timestamps[q].realtime));
1828 }
1829
1830 manager_dump_units(m, f, prefix);
1831 manager_dump_jobs(m, f, prefix);
1832}
1833
713f6f90
LP
1834int manager_get_dump_string(Manager *m, char **ret) {
1835 _cleanup_free_ char *dump = NULL;
1836 _cleanup_fclose_ FILE *f = NULL;
1837 size_t size;
1838 int r;
1839
1840 assert(m);
1841 assert(ret);
1842
1843 f = open_memstream(&dump, &size);
1844 if (!f)
1845 return -errno;
1846
0d536673 1847 (void) __fsetlocking(f, FSETLOCKING_BYCALLER);
713f6f90
LP
1848
1849 manager_dump(m, f, NULL);
1850
1851 r = fflush_and_check(f);
1852 if (r < 0)
1853 return r;
1854
1855 f = safe_fclose(f);
1856
1857 *ret = dump;
1858 dump = NULL;
1859
1860 return 0;
1861}
1862
7fad411c
LP
1863void manager_clear_jobs(Manager *m) {
1864 Job *j;
1865
1866 assert(m);
1867
7fad411c 1868 while ((j = hashmap_first(m->jobs)))
5273510e 1869 /* No need to recurse. We're cancelling all jobs. */
833f92ad 1870 job_finish_and_invalidate(j, JOB_CANCELED, false, false);
7fad411c 1871}
83c60c9f 1872
752b5905
LP
1873static int manager_dispatch_run_queue(sd_event_source *source, void *userdata) {
1874 Manager *m = userdata;
83c60c9f 1875 Job *j;
034c6ed7 1876
752b5905
LP
1877 assert(source);
1878 assert(m);
9152c765 1879
034c6ed7 1880 while ((j = m->run_queue)) {
ac1135be 1881 assert(j->installed);
034c6ed7
LP
1882 assert(j->in_run_queue);
1883
1884 job_run_and_invalidate(j);
9152c765 1885 }
034c6ed7 1886
a0b64226 1887 if (m->n_running_jobs > 0)
03b717a3
MS
1888 manager_watch_jobs_in_progress(m);
1889
31a7eb86
ZJS
1890 if (m->n_on_console > 0)
1891 manager_watch_idle_pipe(m);
1892
752b5905 1893 return 1;
c1e1601e
LP
1894}
1895
9588bc32 1896static unsigned manager_dispatch_dbus_queue(Manager *m) {
e0a08581 1897 unsigned n = 0, budget;
595ed347 1898 Unit *u;
e0a08581 1899 Job *j;
c1e1601e
LP
1900
1901 assert(m);
1902
1903 if (m->dispatching_dbus_queue)
1904 return 0;
1905
e0a08581
LP
1906 /* Anything to do at all? */
1907 if (!m->dbus_unit_queue && !m->dbus_job_queue && !m->send_reloading_done && !m->queued_message)
1908 return 0;
1909
1910 /* Do we have overly many messages queued at the moment? If so, let's not enqueue more on top, let's sit this
1911 * cycle out, and process things in a later cycle when the queues got a bit emptier. */
1912 if (manager_bus_n_queued_write(m) > MANAGER_BUS_BUSY_THRESHOLD)
1913 return 0;
1914
1915 /* Only process a certain number of units/jobs per event loop iteration. Even if the bus queue wasn't overly
1916 * full before this call we shouldn't increase it in size too wildly in one step, and we shouldn't monopolize
1917 * CPU time with generating these messages. Note the difference in counting of this "budget" and the
1918 * "threshold" above: the "budget" is decreased only once per generated message, regardless how many
1919 * busses/direct connections it is enqueued on, while the "threshold" is applied to each queued instance of bus
1920 * message, i.e. if the same message is enqueued to five busses/direct connections it will be counted five
1921 * times. This difference in counting ("references" vs. "instances") is primarily a result of the fact that
1922 * it's easier to implement it this way, however it also reflects the thinking that the "threshold" should put
1923 * a limit on used queue memory, i.e. space, while the "budget" should put a limit on time. Also note that
1924 * the "threshold" is currently chosen much higher than the "budget". */
1925 budget = MANAGER_BUS_MESSAGE_BUDGET;
1926
c1e1601e
LP
1927 m->dispatching_dbus_queue = true;
1928
e0a08581
LP
1929 while (budget > 0 && (u = m->dbus_unit_queue)) {
1930
595ed347 1931 assert(u->in_dbus_queue);
c1e1601e 1932
595ed347 1933 bus_unit_send_change_signal(u);
e0a08581 1934 n++, budget--;
c1e1601e
LP
1935 }
1936
e0a08581 1937 while (budget > 0 && (j = m->dbus_job_queue)) {
c1e1601e
LP
1938 assert(j->in_dbus_queue);
1939
1940 bus_job_send_change_signal(j);
e0a08581 1941 n++, budget--;
c1e1601e
LP
1942 }
1943
1944 m->dispatching_dbus_queue = false;
71445ae7 1945
e0a08581 1946 if (budget > 0 && m->send_reloading_done) {
71445ae7 1947 m->send_reloading_done = false;
718db961 1948 bus_manager_send_reloading(m, false);
e0a08581 1949 n++, budget--;
71445ae7
LP
1950 }
1951
e0a08581 1952 if (budget > 0 && m->queued_message) {
718db961 1953 bus_send_queued_message(m);
e0a08581
LP
1954 n++;
1955 }
718db961 1956
c1e1601e 1957 return n;
9152c765
LP
1958}
1959
d8fdc620
LP
1960static int manager_dispatch_cgroups_agent_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata) {
1961 Manager *m = userdata;
1962 char buf[PATH_MAX+1];
1963 ssize_t n;
1964
1965 n = recv(fd, buf, sizeof(buf), 0);
1966 if (n < 0)
1967 return log_error_errno(errno, "Failed to read cgroups agent message: %m");
1968 if (n == 0) {
1969 log_error("Got zero-length cgroups agent message, ignoring.");
1970 return 0;
1971 }
1972 if ((size_t) n >= sizeof(buf)) {
1973 log_error("Got overly long cgroups agent message, ignoring.");
1974 return 0;
1975 }
1976
1977 if (memchr(buf, 0, n)) {
1978 log_error("Got cgroups agent message with embedded NUL byte, ignoring.");
1979 return 0;
1980 }
1981 buf[n] = 0;
1982
1983 manager_notify_cgroup_empty(m, buf);
d5f15326 1984 (void) bus_forward_agent_released(m, buf);
d8fdc620
LP
1985
1986 return 0;
1987}
1988
db256aab
LP
1989static void manager_invoke_notify_message(
1990 Manager *m,
1991 Unit *u,
1992 const struct ucred *ucred,
1993 const char *buf,
1994 FDSet *fds) {
1995
5ba6985b
LP
1996 assert(m);
1997 assert(u);
db256aab 1998 assert(ucred);
5ba6985b 1999 assert(buf);
5ba6985b 2000
62a76913 2001 if (u->notifygen == m->notifygen) /* Already invoked on this same unit in this same iteration? */
5ba6985b 2002 return;
62a76913
LP
2003 u->notifygen = m->notifygen;
2004
2005 if (UNIT_VTABLE(u)->notify_message) {
2006 _cleanup_strv_free_ char **tags = NULL;
2007
2008 tags = strv_split(buf, NEWLINE);
2009 if (!tags) {
2010 log_oom();
2011 return;
2012 }
5ba6985b 2013
db256aab 2014 UNIT_VTABLE(u)->notify_message(u, ucred, tags, fds);
62a76913
LP
2015
2016 } else if (DEBUG_LOGGING) {
a86b7675
ZJS
2017 _cleanup_free_ char *x = NULL, *y = NULL;
2018
da5fb861 2019 x = ellipsize(buf, 20, 90);
a86b7675 2020 if (x)
da5fb861
LP
2021 y = cescape(x);
2022
a86b7675
ZJS
2023 log_unit_debug(u, "Got notification message \"%s\", ignoring.", strnull(y));
2024 }
5ba6985b
LP
2025}
2026
718db961 2027static int manager_dispatch_notify_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata) {
3d0b8a55 2028
b215b0ed 2029 _cleanup_fdset_free_ FDSet *fds = NULL;
718db961 2030 Manager *m = userdata;
b215b0ed
DH
2031 char buf[NOTIFY_BUFFER_MAX+1];
2032 struct iovec iovec = {
2033 .iov_base = buf,
2034 .iov_len = sizeof(buf)-1,
2035 };
2036 union {
2037 struct cmsghdr cmsghdr;
2038 uint8_t buf[CMSG_SPACE(sizeof(struct ucred)) +
2039 CMSG_SPACE(sizeof(int) * NOTIFY_FD_MAX)];
2040 } control = {};
2041 struct msghdr msghdr = {
2042 .msg_iov = &iovec,
2043 .msg_iovlen = 1,
2044 .msg_control = &control,
2045 .msg_controllen = sizeof(control),
2046 };
2047
2048 struct cmsghdr *cmsg;
2049 struct ucred *ucred = NULL;
62a76913
LP
2050 _cleanup_free_ Unit **array_copy = NULL;
2051 Unit *u1, *u2, **array;
b215b0ed
DH
2052 int r, *fd_array = NULL;
2053 unsigned n_fds = 0;
62a76913 2054 bool found = false;
8c47c732
LP
2055 ssize_t n;
2056
2057 assert(m);
718db961
LP
2058 assert(m->notify_fd == fd);
2059
2060 if (revents != EPOLLIN) {
2061 log_warning("Got unexpected poll event for notify fd.");
2062 return 0;
2063 }
8c47c732 2064
045a3d59 2065 n = recvmsg(m->notify_fd, &msghdr, MSG_DONTWAIT|MSG_CMSG_CLOEXEC|MSG_TRUNC);
b215b0ed 2066 if (n < 0) {
c55ae51e
LP
2067 if (IN_SET(errno, EAGAIN, EINTR))
2068 return 0; /* Spurious wakeup, try again */
8c47c732 2069
c55ae51e
LP
2070 /* If this is any other, real error, then let's stop processing this socket. This of course means we
2071 * won't take notification messages anymore, but that's still better than busy looping around this:
2072 * being woken up over and over again but being unable to actually read the message off the socket. */
2073 return log_error_errno(errno, "Failed to receive notification message: %m");
b215b0ed 2074 }
a354329f 2075
b215b0ed
DH
2076 CMSG_FOREACH(cmsg, &msghdr) {
2077 if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) {
a354329f 2078
b215b0ed
DH
2079 fd_array = (int*) CMSG_DATA(cmsg);
2080 n_fds = (cmsg->cmsg_len - CMSG_LEN(0)) / sizeof(int);
a354329f 2081
b215b0ed
DH
2082 } else if (cmsg->cmsg_level == SOL_SOCKET &&
2083 cmsg->cmsg_type == SCM_CREDENTIALS &&
2084 cmsg->cmsg_len == CMSG_LEN(sizeof(struct ucred))) {
a354329f 2085
b215b0ed 2086 ucred = (struct ucred*) CMSG_DATA(cmsg);
a354329f 2087 }
b215b0ed 2088 }
a354329f 2089
b215b0ed
DH
2090 if (n_fds > 0) {
2091 assert(fd_array);
a354329f 2092
b215b0ed
DH
2093 r = fdset_new_array(&fds, fd_array, n_fds);
2094 if (r < 0) {
2095 close_many(fd_array, n_fds);
9987750e
FB
2096 log_oom();
2097 return 0;
a354329f 2098 }
b215b0ed 2099 }
8c47c732 2100
15e23e8c 2101 if (!ucred || !pid_is_valid(ucred->pid)) {
b215b0ed
DH
2102 log_warning("Received notify message without valid credentials. Ignoring.");
2103 return 0;
2104 }
8c47c732 2105
045a3d59 2106 if ((size_t) n >= sizeof(buf) || (msghdr.msg_flags & MSG_TRUNC)) {
b215b0ed
DH
2107 log_warning("Received notify message exceeded maximum size. Ignoring.");
2108 return 0;
2109 }
8c47c732 2110
875ca88d
LP
2111 /* As extra safety check, let's make sure the string we get doesn't contain embedded NUL bytes. We permit one
2112 * trailing NUL byte in the message, but don't expect it. */
2113 if (n > 1 && memchr(buf, 0, n-1)) {
2114 log_warning("Received notify message with embedded NUL bytes. Ignoring.");
2115 return 0;
2116 }
2117
2118 /* Make sure it's NUL-terminated. */
b215b0ed 2119 buf[n] = 0;
8c47c732 2120
62a76913
LP
2121 /* Increase the generation counter used for filtering out duplicate unit invocations. */
2122 m->notifygen++;
2123
2124 /* Notify every unit that might be interested, which might be multiple. */
b215b0ed 2125 u1 = manager_get_unit_by_pid_cgroup(m, ucred->pid);
62a76913
LP
2126 u2 = hashmap_get(m->watch_pids, PID_TO_PTR(ucred->pid));
2127 array = hashmap_get(m->watch_pids, PID_TO_PTR(-ucred->pid));
2128 if (array) {
2129 size_t k = 0;
5ba6985b 2130
62a76913
LP
2131 while (array[k])
2132 k++;
5ba6985b 2133
62a76913
LP
2134 array_copy = newdup(Unit*, array, k+1);
2135 if (!array_copy)
2136 log_oom();
2137 }
2138 /* And now invoke the per-unit callbacks. Note that manager_invoke_notify_message() will handle duplicate units
2139 * make sure we only invoke each unit's handler once. */
2140 if (u1) {
2141 manager_invoke_notify_message(m, u1, ucred, buf, fds);
2142 found = true;
2143 }
2144 if (u2) {
2145 manager_invoke_notify_message(m, u2, ucred, buf, fds);
2146 found = true;
2147 }
2148 if (array_copy)
2149 for (size_t i = 0; array_copy[i]; i++) {
2150 manager_invoke_notify_message(m, array_copy[i], ucred, buf, fds);
2151 found = true;
2152 }
8c47c732 2153
62a76913
LP
2154 if (!found)
2155 log_warning("Cannot find unit for notify message of PID "PID_FMT", ignoring.", ucred->pid);
a354329f 2156
b215b0ed 2157 if (fdset_size(fds) > 0)
5fd2c135 2158 log_warning("Got extra auxiliary fds with notification message, closing them.");
8c47c732
LP
2159
2160 return 0;
2161}
2162
62a76913
LP
2163static void manager_invoke_sigchld_event(
2164 Manager *m,
2165 Unit *u,
2166 const siginfo_t *si) {
36f20ae3 2167
5ba6985b
LP
2168 assert(m);
2169 assert(u);
2170 assert(si);
2171
62a76913
LP
2172 /* Already invoked the handler of this unit in this iteration? Then don't process this again */
2173 if (u->sigchldgen == m->sigchldgen)
2174 return;
2175 u->sigchldgen = m->sigchldgen;
5ba6985b 2176
62a76913 2177 log_unit_debug(u, "Child "PID_FMT" belongs to %s.", si->si_pid, u->id);
5ba6985b 2178 unit_unwatch_pid(u, si->si_pid);
e57051f5 2179
62a76913
LP
2180 if (UNIT_VTABLE(u)->sigchld_event)
2181 UNIT_VTABLE(u)->sigchld_event(u, si->si_pid, si->si_code, si->si_status);
5ba6985b
LP
2182}
2183
575b300b
LP
2184static int manager_dispatch_sigchld(sd_event_source *source, void *userdata) {
2185 Manager *m = userdata;
2186 siginfo_t si = {};
2187 int r;
2188
2189 assert(source);
9152c765
LP
2190 assert(m);
2191
575b300b
LP
2192 /* First we call waitd() for a PID and do not reap the zombie. That way we can still access /proc/$PID for it
2193 * while it is a zombie. */
9152c765 2194
575b300b 2195 if (waitid(P_ALL, 0, &si, WEXITED|WNOHANG|WNOWAIT) < 0) {
acbb0225 2196
8afabc50
AJ
2197 if (errno != ECHILD)
2198 log_error_errno(errno, "Failed to peek for child with waitid(), ignoring: %m");
acbb0225 2199
8afabc50 2200 goto turn_off;
575b300b 2201 }
4112df16 2202
575b300b
LP
2203 if (si.si_pid <= 0)
2204 goto turn_off;
2205
2206 if (IN_SET(si.si_code, CLD_EXITED, CLD_KILLED, CLD_DUMPED)) {
62a76913 2207 _cleanup_free_ Unit **array_copy = NULL;
575b300b 2208 _cleanup_free_ char *name = NULL;
62a76913 2209 Unit *u1, *u2, **array;
575b300b
LP
2210
2211 (void) get_process_comm(si.si_pid, &name);
2212
2213 log_debug("Child "PID_FMT" (%s) died (code=%s, status=%i/%s)",
2214 si.si_pid, strna(name),
2215 sigchld_code_to_string(si.si_code),
2216 si.si_status,
2217 strna(si.si_code == CLD_EXITED
2218 ? exit_status_to_string(si.si_status, EXIT_STATUS_FULL)
2219 : signal_to_string(si.si_status)));
2220
62a76913
LP
2221 /* Increase the generation counter used for filtering out duplicate unit invocations */
2222 m->sigchldgen++;
2223
2224 /* And now figure out the unit this belongs to, it might be multiple... */
575b300b 2225 u1 = manager_get_unit_by_pid_cgroup(m, si.si_pid);
62a76913
LP
2226 u2 = hashmap_get(m->watch_pids, PID_TO_PTR(si.si_pid));
2227 array = hashmap_get(m->watch_pids, PID_TO_PTR(-si.si_pid));
2228 if (array) {
2229 size_t n = 0;
2230
2231 /* Cound how many entries the array has */
2232 while (array[n])
2233 n++;
2234
2235 /* Make a copy of the array so that we don't trip up on the array changing beneath us */
2236 array_copy = newdup(Unit*, array, n+1);
2237 if (!array_copy)
2238 log_oom();
2239 }
2240
2241 /* Finally, execute them all. Note that u1, u2 and the array might contain duplicates, but
2242 * that's fine, manager_invoke_sigchld_event() will ensure we only invoke the handlers once for
2243 * each iteration. */
575b300b 2244 if (u1)
62a76913
LP
2245 manager_invoke_sigchld_event(m, u1, &si);
2246 if (u2)
2247 manager_invoke_sigchld_event(m, u2, &si);
2248 if (array_copy)
2249 for (size_t i = 0; array_copy[i]; i++)
2250 manager_invoke_sigchld_event(m, array_copy[i], &si);
575b300b 2251 }
9152c765 2252
575b300b
LP
2253 /* And now, we actually reap the zombie. */
2254 if (waitid(P_PID, si.si_pid, &si, WEXITED) < 0) {
2255 log_error_errno(errno, "Failed to dequeue child, ignoring: %m");
2256 return 0;
2257 }
9152c765 2258
575b300b 2259 return 0;
8c47c732 2260
575b300b
LP
2261turn_off:
2262 /* All children processed for now, turn off event source */
4112df16 2263
575b300b
LP
2264 r = sd_event_source_set_enabled(m->sigchld_event_source, SD_EVENT_OFF);
2265 if (r < 0)
2266 return log_error_errno(r, "Failed to disable SIGCHLD event source: %m");
9152c765
LP
2267
2268 return 0;
2269}
2270
c75fbada 2271static void manager_start_target(Manager *m, const char *name, JobMode mode) {
4afd3348 2272 _cleanup_(sd_bus_error_free) sd_bus_error error = SD_BUS_ERROR_NULL;
28247076 2273 int r;
398ef8ba 2274
f2341e0a 2275 log_debug("Activating special unit %s", name);
1e001f52 2276
4bd29fe5 2277 r = manager_add_job_by_name(m, JOB_START, name, mode, &error, NULL);
bd0af849 2278 if (r < 0)
f2341e0a 2279 log_error("Failed to enqueue %s job: %s", name, bus_error_message(&error, r));
28247076
LP
2280}
2281
24dd31c1
LN
2282static void manager_handle_ctrl_alt_del(Manager *m) {
2283 /* If the user presses C-A-D more than
2284 * 7 times within 2s, we reboot/shutdown immediately,
2285 * unless it was disabled in system.conf */
2286
ae8c7939 2287 if (ratelimit_test(&m->ctrl_alt_del_ratelimit) || m->cad_burst_action == EMERGENCY_ACTION_NONE)
24dd31c1 2288 manager_start_target(m, SPECIAL_CTRL_ALT_DEL_TARGET, JOB_REPLACE_IRREVERSIBLY);
ae8c7939
LN
2289 else
2290 emergency_action(m, m->cad_burst_action, NULL,
2291 "Ctrl-Alt-Del was pressed more than 7 times within 2s");
24dd31c1
LN
2292}
2293
718db961
LP
2294static int manager_dispatch_signal_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata) {
2295 Manager *m = userdata;
9152c765
LP
2296 ssize_t n;
2297 struct signalfd_siginfo sfsi;
dacd6cee 2298 int r;
9152c765
LP
2299
2300 assert(m);
718db961
LP
2301 assert(m->signal_fd == fd);
2302
2303 if (revents != EPOLLIN) {
2304 log_warning("Got unexpected events from signal file descriptor.");
2305 return 0;
2306 }
9152c765 2307
575b300b
LP
2308 n = read(m->signal_fd, &sfsi, sizeof(sfsi));
2309 if (n != sizeof(sfsi)) {
2310 if (n >= 0) {
2311 log_warning("Truncated read from signal fd (%zu bytes), ignoring!", n);
2312 return 0;
2313 }
9152c765 2314
575b300b
LP
2315 if (IN_SET(errno, EINTR, EAGAIN))
2316 return 0;
9152c765 2317
575b300b
LP
2318 /* We return an error here, which will kill this handler,
2319 * to avoid a busy loop on read error. */
2320 return log_error_errno(errno, "Reading from signal fd failed: %m");
2321 }
9152c765 2322
575b300b
LP
2323 log_received_signal(sfsi.ssi_signo == SIGCHLD ||
2324 (sfsi.ssi_signo == SIGTERM && MANAGER_IS_USER(m))
2325 ? LOG_DEBUG : LOG_INFO,
2326 &sfsi);
1e001f52 2327
575b300b 2328 switch (sfsi.ssi_signo) {
b9cd2ec1 2329
575b300b
LP
2330 case SIGCHLD:
2331 r = sd_event_source_set_enabled(m->sigchld_event_source, SD_EVENT_ON);
2332 if (r < 0)
8afabc50 2333 log_warning_errno(r, "Failed to enable SIGCHLD event source, ignoring: %m");
b9cd2ec1 2334
575b300b 2335 break;
84e9af1e 2336
575b300b
LP
2337 case SIGTERM:
2338 if (MANAGER_IS_SYSTEM(m)) {
ba0c7754 2339 /* This is for compatibility with the original sysvinit */
575b300b
LP
2340 r = verify_run_space_and_log("Refusing to reexecute");
2341 if (r >= 0)
2342 m->exit_code = MANAGER_REEXECUTE;
a1b256b0 2343 break;
575b300b 2344 }
84e9af1e 2345
575b300b
LP
2346 _fallthrough_;
2347 case SIGINT:
2348 if (MANAGER_IS_SYSTEM(m))
2349 manager_handle_ctrl_alt_del(m);
2350 else
2351 manager_start_target(m, SPECIAL_EXIT_TARGET,
2352 JOB_REPLACE_IRREVERSIBLY);
2353 break;
84e9af1e 2354
575b300b 2355 case SIGWINCH:
ba0c7754 2356 /* This is a nop on non-init */
575b300b
LP
2357 if (MANAGER_IS_SYSTEM(m))
2358 manager_start_target(m, SPECIAL_KBREQUEST_TARGET, JOB_REPLACE);
84e9af1e 2359
575b300b 2360 break;
84e9af1e 2361
575b300b 2362 case SIGPWR:
ba0c7754 2363 /* This is a nop on non-init */
575b300b
LP
2364 if (MANAGER_IS_SYSTEM(m))
2365 manager_start_target(m, SPECIAL_SIGPWR_TARGET, JOB_REPLACE);
6632c602 2366
575b300b 2367 break;
57ee42ce 2368
8559b3b7 2369 case SIGUSR1:
8559b3b7 2370 if (manager_dbus_is_running(m, false)) {
575b300b 2371 log_info("Trying to reconnect to bus...");
575b300b 2372
8559b3b7
LP
2373 (void) bus_init_api(m);
2374
2375 if (MANAGER_IS_SYSTEM(m))
2376 (void) bus_init_system(m);
2377 } else {
2378 log_info("Starting D-Bus service...");
575b300b
LP
2379 manager_start_target(m, SPECIAL_DBUS_SERVICE, JOB_REPLACE);
2380 }
57ee42ce 2381
575b300b 2382 break;
575b300b
LP
2383
2384 case SIGUSR2: {
2385 _cleanup_free_ char *dump = NULL;
2386
2387 r = manager_get_dump_string(m, &dump);
2388 if (r < 0) {
2389 log_warning_errno(errno, "Failed to acquire manager dump: %m");
57ee42ce
LP
2390 break;
2391 }
2392
575b300b
LP
2393 log_dump(LOG_INFO, dump);
2394 break;
2395 }
2149e37c 2396
575b300b
LP
2397 case SIGHUP:
2398 r = verify_run_space_and_log("Refusing to reload");
2399 if (r >= 0)
2400 m->exit_code = MANAGER_RELOAD;
2401 break;
2402
2403 default: {
2404
2405 /* Starting SIGRTMIN+0 */
2406 static const struct {
2407 const char *target;
2408 JobMode mode;
2409 } target_table[] = {
2410 [0] = { SPECIAL_DEFAULT_TARGET, JOB_ISOLATE },
2411 [1] = { SPECIAL_RESCUE_TARGET, JOB_ISOLATE },
2412 [2] = { SPECIAL_EMERGENCY_TARGET, JOB_ISOLATE },
2413 [3] = { SPECIAL_HALT_TARGET, JOB_REPLACE_IRREVERSIBLY },
2414 [4] = { SPECIAL_POWEROFF_TARGET, JOB_REPLACE_IRREVERSIBLY },
2415 [5] = { SPECIAL_REBOOT_TARGET, JOB_REPLACE_IRREVERSIBLY },
2416 [6] = { SPECIAL_KEXEC_TARGET, JOB_REPLACE_IRREVERSIBLY },
2417 };
2418
2419 /* Starting SIGRTMIN+13, so that target halt and system halt are 10 apart */
2420 static const ManagerExitCode code_table[] = {
2421 [0] = MANAGER_HALT,
2422 [1] = MANAGER_POWEROFF,
2423 [2] = MANAGER_REBOOT,
2424 [3] = MANAGER_KEXEC,
2425 };
b2cdc666 2426
575b300b
LP
2427 if ((int) sfsi.ssi_signo >= SIGRTMIN+0 &&
2428 (int) sfsi.ssi_signo < SIGRTMIN+(int) ELEMENTSOF(target_table)) {
2429 int idx = (int) sfsi.ssi_signo - SIGRTMIN;
2430 manager_start_target(m, target_table[idx].target,
2431 target_table[idx].mode);
1005d14f 2432 break;
2149e37c 2433 }
1005d14f 2434
575b300b
LP
2435 if ((int) sfsi.ssi_signo >= SIGRTMIN+13 &&
2436 (int) sfsi.ssi_signo < SIGRTMIN+13+(int) ELEMENTSOF(code_table)) {
2437 m->exit_code = code_table[sfsi.ssi_signo - SIGRTMIN - 13];
2438 break;
2439 }
2440
2441 switch (sfsi.ssi_signo - SIGRTMIN) {
2442
2443 case 20:
2444 manager_set_show_status(m, SHOW_STATUS_YES);
a16e1123
LP
2445 break;
2446
575b300b
LP
2447 case 21:
2448 manager_set_show_status(m, SHOW_STATUS_NO);
2449 break;
7d793605 2450
575b300b
LP
2451 case 22:
2452 log_set_max_level(LOG_DEBUG);
2453 log_info("Setting log level to debug.");
2454 break;
2455
2456 case 23:
2457 log_set_max_level(LOG_INFO);
2458 log_info("Setting log level to info.");
2459 break;
0003d1ab 2460
575b300b
LP
2461 case 24:
2462 if (MANAGER_IS_USER(m)) {
2463 m->exit_code = MANAGER_EXIT;
2464 return 0;
0658666b 2465 }
9152c765 2466
575b300b
LP
2467 /* This is a nop on init */
2468 break;
2469
2470 case 26:
2471 case 29: /* compatibility: used to be mapped to LOG_TARGET_SYSLOG_OR_KMSG */
2472 log_set_target(LOG_TARGET_JOURNAL_OR_KMSG);
2473 log_notice("Setting log target to journal-or-kmsg.");
2474 break;
2475
2476 case 27:
2477 log_set_target(LOG_TARGET_CONSOLE);
2478 log_notice("Setting log target to console.");
2479 break;
2480
2481 case 28:
2482 log_set_target(LOG_TARGET_KMSG);
2483 log_notice("Setting log target to kmsg.");
2484 break;
2485
2486 default:
2487 log_warning("Got unhandled signal <%s>.", signal_to_string(sfsi.ssi_signo));
2488 }
2489 }}
034c6ed7
LP
2490
2491 return 0;
2492}
2493
718db961
LP
2494static int manager_dispatch_time_change_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata) {
2495 Manager *m = userdata;
2496 Iterator i;
2497 Unit *u;
034c6ed7
LP
2498
2499 assert(m);
718db961 2500 assert(m->time_change_fd == fd);
034c6ed7 2501
a80c1575 2502 log_struct(LOG_DEBUG,
2b044526 2503 "MESSAGE_ID=" SD_MESSAGE_TIME_CHANGE_STR,
e2cc6eca 2504 LOG_MESSAGE("Time has been changed"),
718db961 2505 NULL);
034c6ed7 2506
718db961
LP
2507 /* Restart the watch */
2508 m->time_change_event_source = sd_event_source_unref(m->time_change_event_source);
03e334a1 2509 m->time_change_fd = safe_close(m->time_change_fd);
ef734fd6 2510
718db961 2511 manager_setup_time_change(m);
4e434314 2512
718db961
LP
2513 HASHMAP_FOREACH(u, m->units, i)
2514 if (UNIT_VTABLE(u)->time_change)
2515 UNIT_VTABLE(u)->time_change(u);
ea430986 2516
718db961
LP
2517 return 0;
2518}
ea430986 2519
718db961
LP
2520static int manager_dispatch_idle_pipe_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata) {
2521 Manager *m = userdata;
8742514c 2522
718db961
LP
2523 assert(m);
2524 assert(m->idle_pipe[2] == fd);
8742514c 2525
5a69973f
LP
2526 /* There's at least one Type=idle child that just gave up on us waiting for the boot process to complete. Let's
2527 * now turn off any further console output if there's at least one service that needs console access, so that
2528 * from now on our own output should not spill into that service's output anymore. After all, we support
2529 * Type=idle only to beautify console output and it generally is set on services that want to own the console
2530 * exclusively without our interference. */
718db961 2531 m->no_console_output = m->n_on_console > 0;
03b717a3 2532
5a69973f
LP
2533 /* Acknowledge the child's request, and let all all other children know too that they shouldn't wait any longer
2534 * by closing the pipes towards them, which is what they are waiting for. */
718db961 2535 manager_close_idle_pipe(m);
03b717a3 2536
718db961
LP
2537 return 0;
2538}
31a7eb86 2539
718db961
LP
2540static int manager_dispatch_jobs_in_progress(sd_event_source *source, usec_t usec, void *userdata) {
2541 Manager *m = userdata;
fd08a840
ZJS
2542 int r;
2543 uint64_t next;
31a7eb86 2544
718db961 2545 assert(m);
fd08a840 2546 assert(source);
9152c765 2547
718db961 2548 manager_print_jobs_in_progress(m);
fd08a840
ZJS
2549
2550 next = now(CLOCK_MONOTONIC) + JOBS_IN_PROGRESS_PERIOD_USEC;
2551 r = sd_event_source_set_time(source, next);
2552 if (r < 0)
2553 return r;
2554
2555 return sd_event_source_set_enabled(source, SD_EVENT_ONESHOT);
9152c765
LP
2556}
2557
2558int manager_loop(Manager *m) {
2559 int r;
9152c765 2560
fac9f8df 2561 RATELIMIT_DEFINE(rl, 1*USEC_PER_SEC, 50000);
ea430986 2562
9152c765 2563 assert(m);
f755e3b7 2564 m->exit_code = MANAGER_OK;
9152c765 2565
fe51822e 2566 /* Release the path cache */
97044145 2567 m->unit_path_cache = set_free_free(m->unit_path_cache);
fe51822e 2568
b0c918b9
LP
2569 manager_check_finished(m);
2570
575b300b
LP
2571 /* There might still be some zombies hanging around from before we were exec()'ed. Let's reap them. */
2572 r = sd_event_source_set_enabled(m->sigchld_event_source, SD_EVENT_ON);
e96d6be7 2573 if (r < 0)
575b300b 2574 return log_error_errno(r, "Failed to enable SIGCHLD event source: %m");
a4312405 2575
f755e3b7 2576 while (m->exit_code == MANAGER_OK) {
718db961 2577 usec_t wait_usec;
9152c765 2578
463d0d15 2579 if (m->runtime_watchdog > 0 && m->runtime_watchdog != USEC_INFINITY && MANAGER_IS_SYSTEM(m))
e96d6be7
LP
2580 watchdog_ping();
2581
ea430986
LP
2582 if (!ratelimit_test(&rl)) {
2583 /* Yay, something is going seriously wrong, pause a little */
2584 log_warning("Looping too fast. Throttling execution a little.");
2585 sleep(1);
2586 }
2587
37a8e683 2588 if (manager_dispatch_load_queue(m) > 0)
23a177ef
LP
2589 continue;
2590
c5a97ed1
LP
2591 if (manager_dispatch_gc_job_queue(m) > 0)
2592 continue;
2593
2594 if (manager_dispatch_gc_unit_queue(m) > 0)
701cc384
LP
2595 continue;
2596
cf1265e1 2597 if (manager_dispatch_cleanup_queue(m) > 0)
c1e1601e 2598 continue;
034c6ed7 2599
91a6073e 2600 if (manager_dispatch_cgroup_realize_queue(m) > 0)
c1e1601e
LP
2601 continue;
2602
c1e1601e 2603 if (manager_dispatch_dbus_queue(m) > 0)
ea430986 2604 continue;
ea430986 2605
c757a65b 2606 /* Sleep for half the watchdog time */
463d0d15 2607 if (m->runtime_watchdog > 0 && m->runtime_watchdog != USEC_INFINITY && MANAGER_IS_SYSTEM(m)) {
718db961
LP
2608 wait_usec = m->runtime_watchdog / 2;
2609 if (wait_usec <= 0)
2610 wait_usec = 1;
c757a65b 2611 } else
3a43da28 2612 wait_usec = USEC_INFINITY;
9152c765 2613
718db961 2614 r = sd_event_run(m->event, wait_usec);
23bbb0de
MS
2615 if (r < 0)
2616 return log_error_errno(r, "Failed to run event loop: %m");
a16e1123 2617 }
957ca890 2618
a16e1123 2619 return m->exit_code;
83c60c9f 2620}
ea430986 2621
718db961 2622int manager_load_unit_from_dbus_path(Manager *m, const char *s, sd_bus_error *e, Unit **_u) {
ede3a796 2623 _cleanup_free_ char *n = NULL;
4b58153d 2624 sd_id128_t invocation_id;
ea430986 2625 Unit *u;
80fbf05e 2626 int r;
ea430986
LP
2627
2628 assert(m);
2629 assert(s);
2630 assert(_u);
2631
ede3a796
LP
2632 r = unit_name_from_dbus_path(s, &n);
2633 if (r < 0)
2634 return r;
ea430986 2635
4b58153d
LP
2636 /* Permit addressing units by invocation ID: if the passed bus path is suffixed by a 128bit ID then we use it
2637 * as invocation ID. */
2638 r = sd_id128_from_string(n, &invocation_id);
2639 if (r >= 0) {
2640 u = hashmap_get(m->units_by_invocation_id, &invocation_id);
2641 if (u) {
2642 *_u = u;
2643 return 0;
2644 }
2645
2646 return sd_bus_error_setf(e, BUS_ERROR_NO_UNIT_FOR_INVOCATION_ID, "No unit with the specified invocation ID " SD_ID128_FORMAT_STR " known.", SD_ID128_FORMAT_VAL(invocation_id));
2647 }
2648
00c83b43
LP
2649 /* If this didn't work, we check if this is a unit name */
2650 if (!unit_name_is_valid(n, UNIT_NAME_PLAIN|UNIT_NAME_INSTANCE))
2651 return sd_bus_error_setf(e, SD_BUS_ERROR_INVALID_ARGS, "Unit name %s is neither a valid invocation ID nor unit name.", n);
2652
80fbf05e 2653 r = manager_load_unit(m, n, NULL, e, &u);
80fbf05e
MS
2654 if (r < 0)
2655 return r;
ea430986
LP
2656
2657 *_u = u;
ea430986
LP
2658 return 0;
2659}
86fbf370
LP
2660
2661int manager_get_job_from_dbus_path(Manager *m, const char *s, Job **_j) {
718db961 2662 const char *p;
86fbf370 2663 unsigned id;
718db961 2664 Job *j;
86fbf370
LP
2665 int r;
2666
2667 assert(m);
2668 assert(s);
2669 assert(_j);
2670
718db961
LP
2671 p = startswith(s, "/org/freedesktop/systemd1/job/");
2672 if (!p)
86fbf370
LP
2673 return -EINVAL;
2674
718db961 2675 r = safe_atou(p, &id);
8742514c 2676 if (r < 0)
86fbf370
LP
2677 return r;
2678
8742514c
LP
2679 j = manager_get_job(m, id);
2680 if (!j)
86fbf370
LP
2681 return -ENOENT;
2682
2683 *_j = j;
2684
2685 return 0;
2686}
dfcd764e 2687
4927fcae 2688void manager_send_unit_audit(Manager *m, Unit *u, int type, bool success) {
e537352b 2689
349cc4a5 2690#if HAVE_AUDIT
2ba11090 2691 _cleanup_free_ char *p = NULL;
0aa281df 2692 const char *msg;
7410616c 2693 int audit_fd, r;
e537352b 2694
463d0d15 2695 if (!MANAGER_IS_SYSTEM(m))
a1a078ee
LP
2696 return;
2697
c1165f82
LP
2698 audit_fd = get_audit_fd();
2699 if (audit_fd < 0)
e537352b
LP
2700 return;
2701
bbd3a7ba
LP
2702 /* Don't generate audit events if the service was already
2703 * started and we're just deserializing */
2c289ea8 2704 if (MANAGER_IS_RELOADING(m))
bbd3a7ba
LP
2705 return;
2706
ac155bb8 2707 if (u->type != UNIT_SERVICE)
f1dd0c3f
LP
2708 return;
2709
7410616c
LP
2710 r = unit_name_to_prefix_and_instance(u->id, &p);
2711 if (r < 0) {
2712 log_error_errno(r, "Failed to extract prefix and instance of unit name: %m");
e537352b
LP
2713 return;
2714 }
2715
63c372cb 2716 msg = strjoina("unit=", p);
0aa281df
LP
2717 if (audit_log_user_comm_message(audit_fd, type, msg, "systemd", NULL, NULL, NULL, success) < 0) {
2718 if (errno == EPERM)
391ade86 2719 /* We aren't allowed to send audit messages?
44785992 2720 * Then let's not retry again. */
c1165f82 2721 close_audit_fd();
0aa281df 2722 else
56f64d95 2723 log_warning_errno(errno, "Failed to send audit message: %m");
391ade86 2724 }
4927fcae 2725#endif
e537352b 2726
e537352b
LP
2727}
2728
e983b760 2729void manager_send_unit_plymouth(Manager *m, Unit *u) {
fc2fffe7 2730 static const union sockaddr_union sa = PLYMOUTH_SOCKET;
2ba11090
ZJS
2731 _cleanup_free_ char *message = NULL;
2732 _cleanup_close_ int fd = -1;
fc2fffe7 2733 int n = 0;
e983b760
LP
2734
2735 /* Don't generate plymouth events if the service was already
2736 * started and we're just deserializing */
2c289ea8 2737 if (MANAGER_IS_RELOADING(m))
e983b760
LP
2738 return;
2739
463d0d15 2740 if (!MANAGER_IS_SYSTEM(m))
e983b760
LP
2741 return;
2742
75f86906 2743 if (detect_container() > 0)
3772995a
LP
2744 return;
2745
ec2ce0c5 2746 if (!IN_SET(u->type, UNIT_SERVICE, UNIT_MOUNT, UNIT_SWAP))
e983b760
LP
2747 return;
2748
2749 /* We set SOCK_NONBLOCK here so that we rather drop the
2750 * message then wait for plymouth */
e62d8c39
ZJS
2751 fd = socket(AF_UNIX, SOCK_STREAM|SOCK_CLOEXEC|SOCK_NONBLOCK, 0);
2752 if (fd < 0) {
56f64d95 2753 log_error_errno(errno, "socket() failed: %m");
e983b760
LP
2754 return;
2755 }
2756
fc2fffe7 2757 if (connect(fd, &sa.sa, SOCKADDR_UN_LEN(sa.un)) < 0) {
2ba11090 2758 if (!IN_SET(errno, EPIPE, EAGAIN, ENOENT, ECONNREFUSED, ECONNRESET, ECONNABORTED))
56f64d95 2759 log_error_errno(errno, "connect() failed: %m");
2ba11090 2760 return;
e983b760
LP
2761 }
2762
ac155bb8 2763 if (asprintf(&message, "U\002%c%s%n", (int) (strlen(u->id) + 1), u->id, &n) < 0) {
0d0f0c50 2764 log_oom();
2ba11090 2765 return;
e983b760
LP
2766 }
2767
2768 errno = 0;
2ba11090
ZJS
2769 if (write(fd, message, n + 1) != n + 1)
2770 if (!IN_SET(errno, EPIPE, EAGAIN, ENOENT, ECONNREFUSED, ECONNRESET, ECONNABORTED))
56f64d95 2771 log_error_errno(errno, "Failed to write Plymouth message: %m");
e983b760
LP
2772}
2773
d8d5ab98 2774int manager_open_serialization(Manager *m, FILE **_f) {
504afd7c 2775 int fd;
a16e1123
LP
2776 FILE *f;
2777
2778 assert(_f);
2779
504afd7c
ZJS
2780 fd = open_serialization_fd("systemd-state");
2781 if (fd < 0)
2782 return fd;
a16e1123 2783
01e10de3 2784 f = fdopen(fd, "w+");
d86f9d52 2785 if (!f) {
03e334a1 2786 safe_close(fd);
a16e1123 2787 return -errno;
d86f9d52 2788 }
a16e1123
LP
2789
2790 *_f = f;
a16e1123
LP
2791 return 0;
2792}
2793
b3680f49 2794int manager_serialize(Manager *m, FILE *f, FDSet *fds, bool switching_root) {
9f9f0342
LP
2795 ManagerTimestamp q;
2796 const char *t;
a16e1123
LP
2797 Iterator i;
2798 Unit *u;
a16e1123
LP
2799 int r;
2800
2801 assert(m);
2802 assert(f);
2803 assert(fds);
2804
313cefa1 2805 m->n_reloading++;
38c52d46 2806
1fa2f38f 2807 fprintf(f, "current-job-id=%"PRIu32"\n", m->current_job_id);
33c5fae9
LP
2808 fprintf(f, "n-installed-jobs=%u\n", m->n_installed_jobs);
2809 fprintf(f, "n-failed-jobs=%u\n", m->n_failed_jobs);
0c2826c6
ZJS
2810 fprintf(f, "taint-usr=%s\n", yes_no(m->taint_usr));
2811 fprintf(f, "ready-sent=%s\n", yes_no(m->ready_sent));
d8eb10d6 2812 fprintf(f, "taint-logged=%s\n", yes_no(m->taint_logged));
2a12e32e 2813 fprintf(f, "service-watchdogs=%s\n", yes_no(m->service_watchdogs));
01d67b43 2814
9f9f0342
LP
2815 for (q = 0; q < _MANAGER_TIMESTAMP_MAX; q++) {
2816 /* The userspace and finish timestamps only apply to the host system, hence only serialize them there */
2817 if (in_initrd() && IN_SET(q, MANAGER_TIMESTAMP_USERSPACE, MANAGER_TIMESTAMP_FINISH))
2818 continue;
f38ed060 2819
9f9f0342
LP
2820 t = manager_timestamp_to_string(q);
2821 {
fbd0b64f 2822 char field[strlen(t) + STRLEN("-timestamp") + 1];
9f9f0342
LP
2823 strcpy(stpcpy(field, t), "-timestamp");
2824 dual_timestamp_serialize(f, field, m->timestamps + q);
2825 }
f38ed060 2826 }
47a483a1 2827
fe902fa4
ZJS
2828 if (!switching_root)
2829 (void) serialize_environment(f, m->environment);
4a9fd066 2830
d86f9d52
LP
2831 if (m->notify_fd >= 0) {
2832 int copy;
2833
2834 copy = fdset_put_dup(fds, m->notify_fd);
2835 if (copy < 0)
2836 return copy;
2837
2838 fprintf(f, "notify-fd=%i\n", copy);
2839 fprintf(f, "notify-socket=%s\n", m->notify_socket);
2840 }
2841
d8fdc620
LP
2842 if (m->cgroups_agent_fd >= 0) {
2843 int copy;
2844
2845 copy = fdset_put_dup(fds, m->cgroups_agent_fd);
2846 if (copy < 0)
2847 return copy;
2848
2849 fprintf(f, "cgroups-agent-fd=%i\n", copy);
2850 }
2851
00d9ef85
LP
2852 if (m->user_lookup_fds[0] >= 0) {
2853 int copy0, copy1;
2854
2855 copy0 = fdset_put_dup(fds, m->user_lookup_fds[0]);
2856 if (copy0 < 0)
2857 return copy0;
2858
2859 copy1 = fdset_put_dup(fds, m->user_lookup_fds[1]);
2860 if (copy1 < 0)
2861 return copy1;
2862
2863 fprintf(f, "user-lookup=%i %i\n", copy0, copy1);
2864 }
2865
05a98afd 2866 bus_track_serialize(m->subscribed, f, "subscribed");
6fa48533 2867
29206d46
LP
2868 r = dynamic_user_serialize(m, f, fds);
2869 if (r < 0)
2870 return r;
2871
00d9ef85
LP
2872 manager_serialize_uid_refs(m, f);
2873 manager_serialize_gid_refs(m, f);
2874
e8a565cb
YW
2875 r = exec_runtime_serialize(m, f, fds);
2876 if (r < 0)
2877 return r;
2878
0d536673 2879 (void) fputc('\n', f);
f2382a94 2880
a16e1123 2881 HASHMAP_FOREACH_KEY(u, t, m->units, i) {
ac155bb8 2882 if (u->id != t)
a16e1123
LP
2883 continue;
2884
a16e1123 2885 /* Start marker */
0d536673
LP
2886 fputs(u->id, f);
2887 fputc('\n', f);
a16e1123 2888
6fa48533
LP
2889 r = unit_serialize(u, f, fds, !switching_root);
2890 if (r < 0) {
313cefa1 2891 m->n_reloading--;
a16e1123 2892 return r;
38c52d46 2893 }
a16e1123
LP
2894 }
2895
a7556052 2896 assert(m->n_reloading > 0);
313cefa1 2897 m->n_reloading--;
38c52d46 2898
a16e1123
LP
2899 if (ferror(f))
2900 return -EIO;
2901
b23de6af
LP
2902 r = bus_fdset_add_all(m, fds);
2903 if (r < 0)
2904 return r;
2905
a16e1123
LP
2906 return 0;
2907}
2908
2909int manager_deserialize(Manager *m, FILE *f, FDSet *fds) {
2910 int r = 0;
2911
2912 assert(m);
2913 assert(f);
2914
2915 log_debug("Deserializing state...");
2916
313cefa1 2917 m->n_reloading++;
82c64bf5 2918
10f8e83c 2919 for (;;) {
d233c99a
ZJS
2920 char line[LINE_MAX];
2921 const char *val, *l;
10f8e83c
LP
2922
2923 if (!fgets(line, sizeof(line), f)) {
2924 if (feof(f))
2925 r = 0;
2926 else
2927 r = -errno;
2928
2929 goto finish;
2930 }
2931
2932 char_array_0(line);
2933 l = strstrip(line);
2934
2935 if (l[0] == 0)
2936 break;
2937
fb4650aa 2938 if ((val = startswith(l, "current-job-id="))) {
01d67b43
LP
2939 uint32_t id;
2940
fb4650aa 2941 if (safe_atou32(val, &id) < 0)
62c460c6 2942 log_notice("Failed to parse current job id value %s", val);
01d67b43
LP
2943 else
2944 m->current_job_id = MAX(m->current_job_id, id);
718db961 2945
fb4650aa 2946 } else if ((val = startswith(l, "n-installed-jobs="))) {
33c5fae9
LP
2947 uint32_t n;
2948
fb4650aa 2949 if (safe_atou32(val, &n) < 0)
62c460c6 2950 log_notice("Failed to parse installed jobs counter %s", val);
33c5fae9
LP
2951 else
2952 m->n_installed_jobs += n;
718db961 2953
fb4650aa 2954 } else if ((val = startswith(l, "n-failed-jobs="))) {
33c5fae9
LP
2955 uint32_t n;
2956
fb4650aa 2957 if (safe_atou32(val, &n) < 0)
62c460c6 2958 log_notice("Failed to parse failed jobs counter %s", val);
33c5fae9
LP
2959 else
2960 m->n_failed_jobs += n;
718db961 2961
fb4650aa 2962 } else if ((val = startswith(l, "taint-usr="))) {
01d67b43
LP
2963 int b;
2964
fb4650aa 2965 b = parse_boolean(val);
e3dd987c 2966 if (b < 0)
62c460c6 2967 log_notice("Failed to parse taint /usr flag %s", val);
01d67b43
LP
2968 else
2969 m->taint_usr = m->taint_usr || b;
718db961 2970
0c2826c6
ZJS
2971 } else if ((val = startswith(l, "ready-sent="))) {
2972 int b;
2973
2974 b = parse_boolean(val);
2975 if (b < 0)
2976 log_notice("Failed to parse ready-sent flag %s", val);
2977 else
2978 m->ready_sent = m->ready_sent || b;
2979
d8eb10d6
ZJS
2980 } else if ((val = startswith(l, "taint-logged="))) {
2981 int b;
2982
2983 b = parse_boolean(val);
2984 if (b < 0)
2985 log_notice("Failed to parse taint-logged flag %s", val);
2986 else
2987 m->taint_logged = m->taint_logged || b;
2988
2a12e32e
JK
2989 } else if ((val = startswith(l, "service-watchdogs="))) {
2990 int b;
2991
2992 b = parse_boolean(val);
2993 if (b < 0)
2994 log_notice("Failed to parse service-watchdogs flag %s", val);
2995 else
2996 m->service_watchdogs = b;
2997
9f9f0342 2998 } else if (startswith(l, "env=")) {
fe902fa4 2999 r = deserialize_environment(&m->environment, l);
d233c99a
ZJS
3000 if (r == -ENOMEM)
3001 goto finish;
527b7a42 3002 if (r < 0)
d233c99a 3003 log_notice_errno(r, "Failed to parse environment entry: \"%s\": %m", l);
e3dd987c 3004
fb4650aa 3005 } else if ((val = startswith(l, "notify-fd="))) {
d86f9d52
LP
3006 int fd;
3007
fb4650aa 3008 if (safe_atoi(val, &fd) < 0 || fd < 0 || !fdset_contains(fds, fd))
62c460c6 3009 log_notice("Failed to parse notify fd: \"%s\"", val);
d86f9d52 3010 else {
03e334a1
LP
3011 m->notify_event_source = sd_event_source_unref(m->notify_event_source);
3012 safe_close(m->notify_fd);
d86f9d52
LP
3013 m->notify_fd = fdset_remove(fds, fd);
3014 }
3015
fb4650aa 3016 } else if ((val = startswith(l, "notify-socket="))) {
d86f9d52
LP
3017 char *n;
3018
fb4650aa 3019 n = strdup(val);
d86f9d52
LP
3020 if (!n) {
3021 r = -ENOMEM;
3022 goto finish;
3023 }
3024
3025 free(m->notify_socket);
3026 m->notify_socket = n;
3027
fb4650aa 3028 } else if ((val = startswith(l, "cgroups-agent-fd="))) {
d8fdc620
LP
3029 int fd;
3030
fb4650aa 3031 if (safe_atoi(val, &fd) < 0 || fd < 0 || !fdset_contains(fds, fd))
62c460c6 3032 log_notice("Failed to parse cgroups agent fd: %s", val);
d8fdc620
LP
3033 else {
3034 m->cgroups_agent_event_source = sd_event_source_unref(m->cgroups_agent_event_source);
3035 safe_close(m->cgroups_agent_fd);
3036 m->cgroups_agent_fd = fdset_remove(fds, fd);
3037 }
3038
fb4650aa 3039 } else if ((val = startswith(l, "user-lookup="))) {
00d9ef85
LP
3040 int fd0, fd1;
3041
fb4650aa 3042 if (sscanf(val, "%i %i", &fd0, &fd1) != 2 || fd0 < 0 || fd1 < 0 || fd0 == fd1 || !fdset_contains(fds, fd0) || !fdset_contains(fds, fd1))
62c460c6 3043 log_notice("Failed to parse user lookup fd: %s", val);
00d9ef85
LP
3044 else {
3045 m->user_lookup_event_source = sd_event_source_unref(m->user_lookup_event_source);
3046 safe_close_pair(m->user_lookup_fds);
3047 m->user_lookup_fds[0] = fdset_remove(fds, fd0);
3048 m->user_lookup_fds[1] = fdset_remove(fds, fd1);
3049 }
3050
fb4650aa
ZJS
3051 } else if ((val = startswith(l, "dynamic-user=")))
3052 dynamic_user_deserialize_one(m, val, fds);
3053 else if ((val = startswith(l, "destroy-ipc-uid=")))
3054 manager_deserialize_uid_refs_one(m, val);
3055 else if ((val = startswith(l, "destroy-ipc-gid=")))
3056 manager_deserialize_gid_refs_one(m, val);
e8a565cb
YW
3057 else if ((val = startswith(l, "exec-runtime=")))
3058 exec_runtime_deserialize_one(m, val, fds);
fb4650aa 3059 else if ((val = startswith(l, "subscribed="))) {
05a98afd 3060
fb4650aa 3061 if (strv_extend(&m->deserialized_subscribed, val) < 0)
05a98afd 3062 log_oom();
9f9f0342
LP
3063 } else {
3064 ManagerTimestamp q;
3065
3066 for (q = 0; q < _MANAGER_TIMESTAMP_MAX; q++) {
3067 val = startswith(l, manager_timestamp_to_string(q));
3068 if (!val)
3069 continue;
05a98afd 3070
9f9f0342
LP
3071 val = startswith(val, "-timestamp=");
3072 if (val)
3073 break;
3074 }
05a98afd 3075
9f9f0342
LP
3076 if (q < _MANAGER_TIMESTAMP_MAX) /* found it */
3077 dual_timestamp_deserialize(val, m->timestamps + q);
3078 else if (!startswith(l, "kdbus-fd=")) /* ignore kdbus */
3079 log_notice("Unknown serialization item '%s'", l);
3080 }
10f8e83c
LP
3081 }
3082
a16e1123
LP
3083 for (;;) {
3084 Unit *u;
3085 char name[UNIT_NAME_MAX+2];
07429866 3086 const char* unit_name;
a16e1123
LP
3087
3088 /* Start marker */
3089 if (!fgets(name, sizeof(name), f)) {
3090 if (feof(f))
10f8e83c
LP
3091 r = 0;
3092 else
3093 r = -errno;
a16e1123 3094
82c64bf5 3095 goto finish;
a16e1123
LP
3096 }
3097
3098 char_array_0(name);
07429866 3099 unit_name = strstrip(name);
a16e1123 3100
07429866
ZJS
3101 r = manager_load_unit(m, unit_name, NULL, NULL, &u);
3102 if (r < 0) {
3103 log_notice_errno(r, "Failed to load unit \"%s\", skipping deserialization: %m", unit_name);
3104 if (r == -ENOMEM)
3105 goto finish;
3106 unit_deserialize_skip(f);
3107 continue;
3108 }
a16e1123 3109
01e10de3 3110 r = unit_deserialize(u, f, fds);
07429866
ZJS
3111 if (r < 0) {
3112 log_notice_errno(r, "Failed to deserialize unit \"%s\": %m", unit_name);
3113 if (r == -ENOMEM)
3114 goto finish;
3115 }
a16e1123
LP
3116 }
3117
10f8e83c 3118finish:
145b1f79 3119 if (ferror(f))
82c64bf5 3120 r = -EIO;
a16e1123 3121
a7556052 3122 assert(m->n_reloading > 0);
313cefa1 3123 m->n_reloading--;
82c64bf5
LP
3124
3125 return r;
a16e1123
LP
3126}
3127
3128int manager_reload(Manager *m) {
3129 int r, q;
51d122af
ZJS
3130 _cleanup_fclose_ FILE *f = NULL;
3131 _cleanup_fdset_free_ FDSet *fds = NULL;
a16e1123
LP
3132
3133 assert(m);
3134
07719a21
LP
3135 r = manager_open_serialization(m, &f);
3136 if (r < 0)
a16e1123
LP
3137 return r;
3138
313cefa1 3139 m->n_reloading++;
718db961 3140 bus_manager_send_reloading(m, true);
38c52d46 3141
07719a21
LP
3142 fds = fdset_new();
3143 if (!fds) {
313cefa1 3144 m->n_reloading--;
51d122af 3145 return -ENOMEM;
a16e1123
LP
3146 }
3147
b3680f49 3148 r = manager_serialize(m, f, fds, false);
07719a21 3149 if (r < 0) {
313cefa1 3150 m->n_reloading--;
51d122af 3151 return r;
38c52d46 3152 }
a16e1123
LP
3153
3154 if (fseeko(f, 0, SEEK_SET) < 0) {
313cefa1 3155 m->n_reloading--;
51d122af 3156 return -errno;
a16e1123
LP
3157 }
3158
3159 /* From here on there is no way back. */
3160 manager_clear_jobs_and_units(m);
07a78643 3161 lookup_paths_flush_generator(&m->lookup_paths);
84e3543e 3162 lookup_paths_free(&m->lookup_paths);
e8a565cb 3163 exec_runtime_vacuum(m);
29206d46 3164 dynamic_user_vacuum(m, false);
00d9ef85
LP
3165 m->uid_refs = hashmap_free(m->uid_refs);
3166 m->gid_refs = hashmap_free(m->gid_refs);
2ded0c04 3167
4943d143 3168 q = lookup_paths_init(&m->lookup_paths, m->unit_file_scope, 0, NULL);
e801700e
ZJS
3169 if (q < 0 && r >= 0)
3170 r = q;
5a1e9937 3171
64691d20
ZJS
3172 q = manager_run_environment_generators(m);
3173 if (q < 0 && r >= 0)
3174 r = q;
3175
a3c4eb07
LP
3176 /* Find new unit paths */
3177 q = manager_run_generators(m);
e801700e 3178 if (q < 0 && r >= 0)
07719a21
LP
3179 r = q;
3180
a1453343 3181 lookup_paths_reduce(&m->lookup_paths);
5a1e9937
LP
3182 manager_build_unit_path_cache(m);
3183
a16e1123 3184 /* First, enumerate what we can from all config files */
ba64af90 3185 manager_enumerate(m);
a16e1123
LP
3186
3187 /* Second, deserialize our stored data */
07719a21 3188 q = manager_deserialize(m, f, fds);
07429866
ZJS
3189 if (q < 0) {
3190 log_error_errno(q, "Deserialization failed: %m");
3191
3192 if (r >= 0)
3193 r = q;
3194 }
a16e1123
LP
3195
3196 fclose(f);
3197 f = NULL;
3198
a2cc4a6c
ZJS
3199 /* Re-register notify_fd as event source */
3200 q = manager_setup_notify(m);
e801700e 3201 if (q < 0 && r >= 0)
a2cc4a6c
ZJS
3202 r = q;
3203
d8fdc620
LP
3204 q = manager_setup_cgroups_agent(m);
3205 if (q < 0 && r >= 0)
3206 r = q;
3207
00d9ef85
LP
3208 q = manager_setup_user_lookup_fd(m);
3209 if (q < 0 && r >= 0)
3210 r = q;
3211
a16e1123 3212 /* Third, fire things up! */
007c6337 3213 manager_coldplug(m);
a16e1123 3214
29206d46
LP
3215 /* Release any dynamic users no longer referenced */
3216 dynamic_user_vacuum(m, true);
3217
00d9ef85
LP
3218 /* Release any references to UIDs/GIDs no longer referenced, and destroy any IPC owned by them */
3219 manager_vacuum_uid_refs(m);
3220 manager_vacuum_gid_refs(m);
3221
e8a565cb
YW
3222 exec_runtime_vacuum(m);
3223
31dc1ca3
LP
3224 assert(m->n_reloading > 0);
3225 m->n_reloading--;
3226
8559b3b7 3227 /* It might be safe to log to the journal now and connect to dbus */
d075092f 3228 manager_recheck_journal(m);
8559b3b7 3229 manager_recheck_dbus(m);
d075092f 3230
8936a5e3 3231 /* Sync current state of bus names with our set of listening units */
5f109056
LP
3232 q = manager_enqueue_sync_bus_names(m);
3233 if (q < 0 && r >= 0)
3234 r = q;
8936a5e3 3235
71445ae7
LP
3236 m->send_reloading_done = true;
3237
a16e1123
LP
3238 return r;
3239}
3240
fdf20a31 3241void manager_reset_failed(Manager *m) {
5632e374
LP
3242 Unit *u;
3243 Iterator i;
3244
3245 assert(m);
3246
3247 HASHMAP_FOREACH(u, m->units, i)
fdf20a31 3248 unit_reset_failed(u);
5632e374
LP
3249}
3250
31afa0a4 3251bool manager_unit_inactive_or_pending(Manager *m, const char *name) {
8f6df3fa
LP
3252 Unit *u;
3253
3254 assert(m);
3255 assert(name);
3256
3257 /* Returns true if the unit is inactive or going down */
bd0af849
ZJS
3258 u = manager_get_unit(m, name);
3259 if (!u)
8f6df3fa
LP
3260 return true;
3261
31afa0a4 3262 return unit_inactive_or_pending(u);
8f6df3fa
LP
3263}
3264
d8eb10d6
ZJS
3265static void log_taint_string(Manager *m) {
3266 _cleanup_free_ char *taint = NULL;
3267
3268 assert(m);
3269
3270 if (MANAGER_IS_USER(m) || m->taint_logged)
3271 return;
3272
3273 m->taint_logged = true; /* only check for taint once */
3274
3275 taint = manager_taint_string(m);
3276 if (isempty(taint))
3277 return;
3278
3279 log_struct(LOG_NOTICE,
3280 LOG_MESSAGE("System is tainted: %s", taint),
3281 "TAINT=%s", taint,
3282 "MESSAGE_ID=" SD_MESSAGE_TAINTED_STR,
3283 NULL);
3284}
3285
56dacdbc 3286static void manager_notify_finished(Manager *m) {
7ceba241 3287 char userspace[FORMAT_TIMESPAN_MAX], initrd[FORMAT_TIMESPAN_MAX], kernel[FORMAT_TIMESPAN_MAX], sum[FORMAT_TIMESPAN_MAX];
915b3753 3288 usec_t firmware_usec, loader_usec, kernel_usec, initrd_usec, userspace_usec, total_usec;
b0c918b9 3289
e0a3da1f 3290 if (m->test_run_flags)
b0c918b9
LP
3291 return;
3292
463d0d15 3293 if (MANAGER_IS_SYSTEM(m) && detect_container() <= 0) {
dd1db3c2 3294 char ts[FORMAT_TIMESPAN_MAX];
dc3c9f5e
ZJS
3295 char buf[FORMAT_TIMESPAN_MAX + STRLEN(" (firmware) + ") + FORMAT_TIMESPAN_MAX + STRLEN(" (loader) + ")]
3296 = {};
3297 char *p = buf;
3298 size_t size = sizeof buf;
e03ae661 3299
9f9f0342
LP
3300 /* Note that MANAGER_TIMESTAMP_KERNEL's monotonic value is always at 0, and
3301 * MANAGER_TIMESTAMP_FIRMWARE's and MANAGER_TIMESTAMP_LOADER's monotonic value should be considered
915b3753
LP
3302 * negative values. */
3303
9f9f0342
LP
3304 firmware_usec = m->timestamps[MANAGER_TIMESTAMP_FIRMWARE].monotonic - m->timestamps[MANAGER_TIMESTAMP_LOADER].monotonic;
3305 loader_usec = m->timestamps[MANAGER_TIMESTAMP_LOADER].monotonic - m->timestamps[MANAGER_TIMESTAMP_KERNEL].monotonic;
3306 userspace_usec = m->timestamps[MANAGER_TIMESTAMP_FINISH].monotonic - m->timestamps[MANAGER_TIMESTAMP_USERSPACE].monotonic;
3307 total_usec = m->timestamps[MANAGER_TIMESTAMP_FIRMWARE].monotonic + m->timestamps[MANAGER_TIMESTAMP_FINISH].monotonic;
18fa6b27 3308
dd1db3c2
YW
3309 if (firmware_usec > 0)
3310 size = strpcpyf(&p, size, "%s (firmware) + ", format_timespan(ts, sizeof(ts), firmware_usec, USEC_PER_MSEC));
3311 if (loader_usec > 0)
3312 size = strpcpyf(&p, size, "%s (loader) + ", format_timespan(ts, sizeof(ts), loader_usec, USEC_PER_MSEC));
3313
9f9f0342 3314 if (dual_timestamp_is_set(&m->timestamps[MANAGER_TIMESTAMP_INITRD])) {
18fa6b27 3315
9f9f0342
LP
3316 /* The initrd case on bare-metal*/
3317 kernel_usec = m->timestamps[MANAGER_TIMESTAMP_INITRD].monotonic - m->timestamps[MANAGER_TIMESTAMP_KERNEL].monotonic;
3318 initrd_usec = m->timestamps[MANAGER_TIMESTAMP_USERSPACE].monotonic - m->timestamps[MANAGER_TIMESTAMP_INITRD].monotonic;
18fa6b27 3319
e12919e8 3320 log_struct(LOG_INFO,
2b044526 3321 "MESSAGE_ID=" SD_MESSAGE_STARTUP_FINISHED_STR,
e12919e8
LP
3322 "KERNEL_USEC="USEC_FMT, kernel_usec,
3323 "INITRD_USEC="USEC_FMT, initrd_usec,
3324 "USERSPACE_USEC="USEC_FMT, userspace_usec,
dd1db3c2
YW
3325 LOG_MESSAGE("Startup finished in %s%s (kernel) + %s (initrd) + %s (userspace) = %s.",
3326 buf,
e2cc6eca
LP
3327 format_timespan(kernel, sizeof(kernel), kernel_usec, USEC_PER_MSEC),
3328 format_timespan(initrd, sizeof(initrd), initrd_usec, USEC_PER_MSEC),
3329 format_timespan(userspace, sizeof(userspace), userspace_usec, USEC_PER_MSEC),
3330 format_timespan(sum, sizeof(sum), total_usec, USEC_PER_MSEC)),
e12919e8 3331 NULL);
18fa6b27 3332 } else {
9f9f0342
LP
3333 /* The initrd-less case on bare-metal*/
3334
3335 kernel_usec = m->timestamps[MANAGER_TIMESTAMP_USERSPACE].monotonic - m->timestamps[MANAGER_TIMESTAMP_KERNEL].monotonic;
18fa6b27
LP
3336 initrd_usec = 0;
3337
81270860 3338 log_struct(LOG_INFO,
2b044526 3339 "MESSAGE_ID=" SD_MESSAGE_STARTUP_FINISHED_STR,
e12919e8 3340 "KERNEL_USEC="USEC_FMT, kernel_usec,
ccd06097 3341 "USERSPACE_USEC="USEC_FMT, userspace_usec,
dd1db3c2
YW
3342 LOG_MESSAGE("Startup finished in %s%s (kernel) + %s (userspace) = %s.",
3343 buf,
e2cc6eca
LP
3344 format_timespan(kernel, sizeof(kernel), kernel_usec, USEC_PER_MSEC),
3345 format_timespan(userspace, sizeof(userspace), userspace_usec, USEC_PER_MSEC),
3346 format_timespan(sum, sizeof(sum), total_usec, USEC_PER_MSEC)),
81270860 3347 NULL);
e12919e8
LP
3348 }
3349 } else {
4adf314b 3350 /* The container and --user case */
e12919e8 3351 firmware_usec = loader_usec = initrd_usec = kernel_usec = 0;
9f9f0342 3352 total_usec = userspace_usec = m->timestamps[MANAGER_TIMESTAMP_FINISH].monotonic - m->timestamps[MANAGER_TIMESTAMP_USERSPACE].monotonic;
e12919e8
LP
3353
3354 log_struct(LOG_INFO,
2b044526 3355 "MESSAGE_ID=" SD_MESSAGE_USER_STARTUP_FINISHED_STR,
e12919e8 3356 "USERSPACE_USEC="USEC_FMT, userspace_usec,
e2cc6eca
LP
3357 LOG_MESSAGE("Startup finished in %s.",
3358 format_timespan(sum, sizeof(sum), total_usec, USEC_PER_MSEC)),
e12919e8 3359 NULL);
18fa6b27 3360 }
b0c918b9 3361
718db961 3362 bus_manager_send_finished(m, firmware_usec, loader_usec, kernel_usec, initrd_usec, userspace_usec, total_usec);
530345e7
LP
3363
3364 sd_notifyf(false,
0c2826c6
ZJS
3365 m->ready_sent ? "STATUS=Startup finished in %s."
3366 : "READY=1\n"
3367 "STATUS=Startup finished in %s.",
2fa4092c 3368 format_timespan(sum, sizeof(sum), total_usec, USEC_PER_MSEC));
0c2826c6 3369 m->ready_sent = true;
d8eb10d6
ZJS
3370
3371 log_taint_string(m);
b0c918b9
LP
3372}
3373
4adf314b
LP
3374static void manager_send_ready(Manager *m) {
3375 assert(m);
3376
3377 /* We send READY=1 on reaching basic.target only when running in --user mode. */
3378 if (!MANAGER_IS_USER(m) || m->ready_sent)
3379 return;
3380
3381 m->ready_sent = true;
3382
3383 sd_notifyf(false,
3384 "READY=1\n"
3385 "STATUS=Reached " SPECIAL_BASIC_TARGET ".");
3386}
3387
3388static void manager_check_basic_target(Manager *m) {
3389 Unit *u;
3390
3391 assert(m);
3392
3393 /* Small shortcut */
3394 if (m->ready_sent && m->taint_logged)
3395 return;
3396
3397 u = manager_get_unit(m, SPECIAL_BASIC_TARGET);
3398 if (!u || !UNIT_IS_ACTIVE_OR_RELOADING(unit_active_state(u)))
3399 return;
3400
3401 /* For user managers, send out READY=1 as soon as we reach basic.target */
3402 manager_send_ready(m);
3403
3404 /* Log the taint string as soon as we reach basic.target */
3405 log_taint_string(m);
3406}
3407
56dacdbc 3408void manager_check_finished(Manager *m) {
56dacdbc
ZJS
3409 assert(m);
3410
2c289ea8 3411 if (MANAGER_IS_RELOADING(m))
aad1976f
LP
3412 return;
3413
4259d202
LP
3414 /* Verify that we have entered the event loop already, and not left it again. */
3415 if (!MANAGER_IS_RUNNING(m))
9771b62d
LP
3416 return;
3417
4adf314b 3418 manager_check_basic_target(m);
0c2826c6 3419
56dacdbc 3420 if (hashmap_size(m->jobs) > 0) {
56dacdbc 3421 if (m->jobs_in_progress_event_source)
2ae56591 3422 /* Ignore any failure, this is only for feedback */
e7ab4d1a 3423 (void) sd_event_source_set_time(m->jobs_in_progress_event_source, now(CLOCK_MONOTONIC) + JOBS_IN_PROGRESS_WAIT_USEC);
56dacdbc
ZJS
3424
3425 return;
3426 }
3427
3428 manager_flip_auto_status(m, false);
3429
3430 /* Notify Type=idle units that we are done now */
56dacdbc
ZJS
3431 manager_close_idle_pipe(m);
3432
3433 /* Turn off confirm spawn now */
7d5ceb64 3434 m->confirm_spawn = NULL;
56dacdbc
ZJS
3435
3436 /* No need to update ask password status when we're going non-interactive */
3437 manager_close_ask_password(m);
3438
3439 /* This is no longer the first boot */
3440 manager_set_first_boot(m, false);
3441
49d5666c 3442 if (MANAGER_IS_FINISHED(m))
56dacdbc
ZJS
3443 return;
3444
9f9f0342 3445 dual_timestamp_get(m->timestamps + MANAGER_TIMESTAMP_FINISH);
56dacdbc
ZJS
3446
3447 manager_notify_finished(m);
3448
e7ab4d1a 3449 manager_invalidate_startup_units(m);
56dacdbc
ZJS
3450}
3451
64691d20
ZJS
3452static bool generator_path_any(const char* const* paths) {
3453 char **path;
3454 bool found = false;
3455
3456 /* Optimize by skipping the whole process by not creating output directories
3457 * if no generators are found. */
3458 STRV_FOREACH(path, (char**) paths)
3459 if (access(*path, F_OK) == 0)
3460 found = true;
3461 else if (errno != ENOENT)
3462 log_warning_errno(errno, "Failed to open generator directory %s: %m", *path);
3463
3464 return found;
3465}
3466
3467static const char* system_env_generator_binary_paths[] = {
3468 "/run/systemd/system-environment-generators",
3469 "/etc/systemd/system-environment-generators",
3470 "/usr/local/lib/systemd/system-environment-generators",
3471 SYSTEM_ENV_GENERATOR_PATH,
3472 NULL
3473};
3474
3475static const char* user_env_generator_binary_paths[] = {
3476 "/run/systemd/user-environment-generators",
3477 "/etc/systemd/user-environment-generators",
3478 "/usr/local/lib/systemd/user-environment-generators",
3479 USER_ENV_GENERATOR_PATH,
3480 NULL
3481};
3482
3483static int manager_run_environment_generators(Manager *m) {
3484 char **tmp = NULL; /* this is only used in the forked process, no cleanup here */
3485 const char **paths;
3486 void* args[] = {&tmp, &tmp, &m->environment};
3487
e0a3da1f
ZJS
3488 if (m->test_run_flags && !(m->test_run_flags & MANAGER_TEST_RUN_ENV_GENERATORS))
3489 return 0;
3490
64691d20
ZJS
3491 paths = MANAGER_IS_SYSTEM(m) ? system_env_generator_binary_paths : user_env_generator_binary_paths;
3492
3493 if (!generator_path_any(paths))
3494 return 0;
3495
3496 return execute_directories(paths, DEFAULT_TIMEOUT_USEC, gather_environment, args, NULL);
3497}
3498
e801700e 3499static int manager_run_generators(Manager *m) {
f42348ac 3500 _cleanup_strv_free_ char **paths = NULL;
07719a21 3501 const char *argv[5];
07719a21 3502 int r;
5a1e9937
LP
3503
3504 assert(m);
3505
e0a3da1f
ZJS
3506 if (m->test_run_flags && !(m->test_run_flags & MANAGER_TEST_RUN_GENERATORS))
3507 return 0;
3508
9183df70 3509 paths = generator_binary_paths(m->unit_file_scope);
e801700e
ZJS
3510 if (!paths)
3511 return log_oom();
5a1e9937 3512
64691d20
ZJS
3513 if (!generator_path_any((const char* const*) paths))
3514 return 0;
5a1e9937 3515
cd64fd56 3516 r = lookup_paths_mkdir_generator(&m->lookup_paths);
07719a21
LP
3517 if (r < 0)
3518 goto finish;
5a1e9937 3519
83cc030f 3520 argv[0] = NULL; /* Leave this empty, execute_directory() will fill something in */
a3c4eb07
LP
3521 argv[1] = m->lookup_paths.generator;
3522 argv[2] = m->lookup_paths.generator_early;
3523 argv[3] = m->lookup_paths.generator_late;
07719a21 3524 argv[4] = NULL;
5a1e9937 3525
718db961 3526 RUN_WITH_UMASK(0022)
c6e47247
ZJS
3527 execute_directories((const char* const*) paths, DEFAULT_TIMEOUT_USEC,
3528 NULL, NULL, (char**) argv);
5a1e9937 3529
718db961 3530finish:
cd64fd56 3531 lookup_paths_trim_generator(&m->lookup_paths);
e801700e 3532 return r;
5a1e9937
LP
3533}
3534
718db961
LP
3535int manager_environment_add(Manager *m, char **minus, char **plus) {
3536 char **a = NULL, **b = NULL, **l;
97d0e5f8 3537 assert(m);
bcd8e6d1 3538
718db961 3539 l = m->environment;
bcd8e6d1 3540
718db961
LP
3541 if (!strv_isempty(minus)) {
3542 a = strv_env_delete(l, 1, minus);
3543 if (!a)
3544 return -ENOMEM;
3545
3546 l = a;
3547 }
3548
3549 if (!strv_isempty(plus)) {
3550 b = strv_env_merge(2, l, plus);
aa9f8a30
AH
3551 if (!b) {
3552 strv_free(a);
718db961 3553 return -ENOMEM;
aa9f8a30 3554 }
bcd8e6d1 3555
718db961
LP
3556 l = b;
3557 }
3558
3559 if (m->environment != l)
3560 strv_free(m->environment);
3561 if (a != l)
3562 strv_free(a);
3563 if (b != l)
3564 strv_free(b);
3565
f069efb4 3566 m->environment = l;
47cf8ff2 3567 manager_sanitize_environment(m);
f069efb4 3568
97d0e5f8
UTL
3569 return 0;
3570}
3571
c93ff2e9
FC
3572int manager_set_default_rlimits(Manager *m, struct rlimit **default_rlimit) {
3573 int i;
3574
3575 assert(m);
3576
517d56b1 3577 for (i = 0; i < _RLIMIT_MAX; i++) {
d9814c76
EV
3578 m->rlimit[i] = mfree(m->rlimit[i]);
3579
07719a21
LP
3580 if (!default_rlimit[i])
3581 continue;
c93ff2e9 3582
07719a21
LP
3583 m->rlimit[i] = newdup(struct rlimit, default_rlimit[i], 1);
3584 if (!m->rlimit[i])
3ce40911 3585 return log_oom();
c93ff2e9
FC
3586 }
3587
3588 return 0;
3589}
3590
8559b3b7
LP
3591void manager_recheck_dbus(Manager *m) {
3592 assert(m);
3593
3594 /* Connects to the bus if the dbus service and socket are running. If we are running in user mode this is all
3595 * it does. In system mode we'll also connect to the system bus (which will most likely just reuse the
3596 * connection of the API bus). That's because the system bus after all runs as service of the system instance,
3597 * while in the user instance we can assume it's already there. */
3598
31dc1ca3
LP
3599 if (MANAGER_IS_RELOADING(m))
3600 return; /* don't check while we are reloading… */
3601
8559b3b7
LP
3602 if (manager_dbus_is_running(m, false)) {
3603 (void) bus_init_api(m);
3604
3605 if (MANAGER_IS_SYSTEM(m))
3606 (void) bus_init_system(m);
3607 } else {
3608 (void) bus_done_api(m);
3609
3610 if (MANAGER_IS_SYSTEM(m))
3611 (void) bus_done_system(m);
3612 }
3613}
3614
d075092f 3615static bool manager_journal_is_running(Manager *m) {
f1dd0c3f
LP
3616 Unit *u;
3617
3618 assert(m);
3619
7d814a19
LP
3620 if (m->test_run_flags != 0)
3621 return false;
3622
d075092f 3623 /* If we are the user manager we can safely assume that the journal is up */
463d0d15 3624 if (!MANAGER_IS_SYSTEM(m))
d075092f 3625 return true;
f1dd0c3f 3626
d075092f 3627 /* Check that the socket is not only up, but in RUNNING state */
731a676c 3628 u = manager_get_unit(m, SPECIAL_JOURNALD_SOCKET);
d075092f
LP
3629 if (!u)
3630 return false;
3631 if (SOCKET(u)->state != SOCKET_RUNNING)
3632 return false;
f1dd0c3f 3633
d075092f 3634 /* Similar, check if the daemon itself is fully up, too */
731a676c 3635 u = manager_get_unit(m, SPECIAL_JOURNALD_SERVICE);
d075092f
LP
3636 if (!u)
3637 return false;
217677ab 3638 if (!IN_SET(SERVICE(u)->state, SERVICE_RELOAD, SERVICE_RUNNING))
d075092f
LP
3639 return false;
3640
3641 return true;
3642}
3643
3644void manager_recheck_journal(Manager *m) {
3645
3646 assert(m);
3647
3648 /* Don't bother with this unless we are in the special situation of being PID 1 */
3649 if (getpid_cached() != 1)
731a676c 3650 return;
f1dd0c3f 3651
31dc1ca3
LP
3652 /* Don't check this while we are reloading, things might still change */
3653 if (MANAGER_IS_RELOADING(m))
3654 return;
3655
cedf5088
LP
3656 /* The journal is fully and entirely up? If so, let's permit logging to it, if that's configured. If the
3657 * journal is down, don't ever log to it, otherwise we might end up deadlocking ourselves as we might trigger
3658 * an activation ourselves we can't fulfill. */
3659 log_set_prohibit_ipc(!manager_journal_is_running(m));
cc2b9e6b 3660 log_open();
f1dd0c3f
LP
3661}
3662
d450b6f2 3663void manager_set_show_status(Manager *m, ShowStatus mode) {
27d340c7 3664 assert(m);
d450b6f2 3665 assert(IN_SET(mode, SHOW_STATUS_AUTO, SHOW_STATUS_NO, SHOW_STATUS_YES, SHOW_STATUS_TEMPORARY));
27d340c7 3666
463d0d15 3667 if (!MANAGER_IS_SYSTEM(m))
27d340c7
LP
3668 return;
3669
76b6f3f6
ZJS
3670 if (m->show_status != mode)
3671 log_debug("%s showing of status.",
3672 mode == SHOW_STATUS_NO ? "Disabling" : "Enabling");
d450b6f2 3673 m->show_status = mode;
27d340c7 3674
d450b6f2 3675 if (mode > 0)
ac5b0c13 3676 (void) touch("/run/systemd/show-status");
27d340c7 3677 else
ac5b0c13 3678 (void) unlink("/run/systemd/show-status");
27d340c7
LP
3679}
3680
127d5fd1 3681static bool manager_get_show_status(Manager *m, StatusType type) {
27d340c7
LP
3682 assert(m);
3683
463d0d15 3684 if (!MANAGER_IS_SYSTEM(m))
27d340c7
LP
3685 return false;
3686
31a7eb86
ZJS
3687 if (m->no_console_output)
3688 return false;
3689
d81afec1 3690 if (!IN_SET(manager_state(m), MANAGER_INITIALIZING, MANAGER_STARTING, MANAGER_STOPPING))
08510627
LP
3691 return false;
3692
e46b13c8 3693 /* If we cannot find out the status properly, just proceed. */
ebc5788e 3694 if (type != STATUS_TYPE_EMERGENCY && manager_check_ask_password(m) > 0)
e46b13c8
ZJS
3695 return false;
3696
46fb617b 3697 return m->show_status > 0;
27d340c7 3698}
68b29a9f 3699
7d5ceb64
FB
3700const char *manager_get_confirm_spawn(Manager *m) {
3701 static int last_errno = 0;
3702 const char *vc = m->confirm_spawn;
3703 struct stat st;
3704 int r;
3705
3706 /* Here's the deal: we want to test the validity of the console but don't want
3707 * PID1 to go through the whole console process which might block. But we also
3708 * want to warn the user only once if something is wrong with the console so we
3709 * cannot do the sanity checks after spawning our children. So here we simply do
3710 * really basic tests to hopefully trap common errors.
3711 *
3712 * If the console suddenly disappear at the time our children will really it
3713 * then they will simply fail to acquire it and a positive answer will be
3714 * assumed. New children will fallback to /dev/console though.
3715 *
3716 * Note: TTYs are devices that can come and go any time, and frequently aren't
3717 * available yet during early boot (consider a USB rs232 dongle...). If for any
3718 * reason the configured console is not ready, we fallback to the default
3719 * console. */
3720
3721 if (!vc || path_equal(vc, "/dev/console"))
3722 return vc;
3723
3724 r = stat(vc, &st);
3725 if (r < 0)
3726 goto fail;
3727
3728 if (!S_ISCHR(st.st_mode)) {
3729 errno = ENOTTY;
3730 goto fail;
3731 }
3732
3733 last_errno = 0;
3734 return vc;
3735fail:
3736 if (last_errno != errno) {
3737 last_errno = errno;
3738 log_warning_errno(errno, "Failed to open %s: %m, using default console", vc);
3739 }
3740 return "/dev/console";
3741}
3742
e2680723
LP
3743void manager_set_first_boot(Manager *m, bool b) {
3744 assert(m);
3745
463d0d15 3746 if (!MANAGER_IS_SYSTEM(m))
e2680723
LP
3747 return;
3748
ae2a2c53
LP
3749 if (m->first_boot != (int) b) {
3750 if (b)
3751 (void) touch("/run/systemd/first-boot");
3752 else
3753 (void) unlink("/run/systemd/first-boot");
3754 }
e2680723 3755
ae2a2c53 3756 m->first_boot = b;
e2680723
LP
3757}
3758
b0eb2944
FB
3759void manager_disable_confirm_spawn(void) {
3760 (void) touch("/run/systemd/confirm_spawn_disabled");
3761}
3762
3763bool manager_is_confirm_spawn_disabled(Manager *m) {
3764 if (!m->confirm_spawn)
3765 return true;
3766
3767 return access("/run/systemd/confirm_spawn_disabled", F_OK) >= 0;
3768}
3769
127d5fd1 3770void manager_status_printf(Manager *m, StatusType type, const char *status, const char *format, ...) {
25cee550
MS
3771 va_list ap;
3772
cb6531be
ZJS
3773 /* If m is NULL, assume we're after shutdown and let the messages through. */
3774
3775 if (m && !manager_get_show_status(m, type))
25cee550
MS
3776 return;
3777
03b717a3
MS
3778 /* XXX We should totally drop the check for ephemeral here
3779 * and thus effectively make 'Type=idle' pointless. */
cb6531be 3780 if (type == STATUS_TYPE_EPHEMERAL && m && m->n_on_console > 0)
03b717a3
MS
3781 return;
3782
25cee550 3783 va_start(ap, format);
127d5fd1 3784 status_vprintf(status, true, type == STATUS_TYPE_EPHEMERAL, format, ap);
25cee550
MS
3785 va_end(ap);
3786}
3787
a57f7e2c
LP
3788Set *manager_get_units_requiring_mounts_for(Manager *m, const char *path) {
3789 char p[strlen(path)+1];
3790
3791 assert(m);
3792 assert(path);
3793
3794 strcpy(p, path);
3795 path_kill_slashes(p);
3796
3797 return hashmap_get(m->units_requiring_mounts_for, streq(p, "/") ? "" : p);
3798}
e66cf1a3 3799
5269eb6b 3800int manager_update_failed_units(Manager *m, Unit *u, bool failed) {
03455c28 3801 unsigned size;
5269eb6b 3802 int r;
03455c28
LDM
3803
3804 assert(m);
3805 assert(u->manager == m);
3806
3807 size = set_size(m->failed_units);
3808
9fff8981 3809 if (failed) {
5269eb6b
LP
3810 r = set_ensure_allocated(&m->failed_units, NULL);
3811 if (r < 0)
3812 return log_oom();
3813
9fff8981 3814 if (set_put(m->failed_units, u) < 0)
5269eb6b 3815 return log_oom();
9fff8981 3816 } else
5269eb6b 3817 (void) set_remove(m->failed_units, u);
03455c28
LDM
3818
3819 if (set_size(m->failed_units) != size)
3820 bus_manager_send_change_signal(m);
5269eb6b
LP
3821
3822 return 0;
03455c28
LDM
3823}
3824
f755e3b7
LP
3825ManagerState manager_state(Manager *m) {
3826 Unit *u;
3827
3828 assert(m);
3829
3830 /* Did we ever finish booting? If not then we are still starting up */
49d5666c 3831 if (!MANAGER_IS_FINISHED(m)) {
d81afec1
LP
3832
3833 u = manager_get_unit(m, SPECIAL_BASIC_TARGET);
3834 if (!u || !UNIT_IS_ACTIVE_OR_RELOADING(unit_active_state(u)))
3835 return MANAGER_INITIALIZING;
3836
f755e3b7 3837 return MANAGER_STARTING;
d81afec1 3838 }
f755e3b7 3839
e68537f0 3840 /* Is the special shutdown target active or queued? If so, we are in shutdown state */
f755e3b7 3841 u = manager_get_unit(m, SPECIAL_SHUTDOWN_TARGET);
706424c2 3842 if (u && unit_active_or_pending(u))
f755e3b7
LP
3843 return MANAGER_STOPPING;
3844
45a7b16b
LP
3845 if (MANAGER_IS_SYSTEM(m)) {
3846 /* Are the rescue or emergency targets active or queued? If so we are in maintenance state */
3847 u = manager_get_unit(m, SPECIAL_RESCUE_TARGET);
3848 if (u && unit_active_or_pending(u))
3849 return MANAGER_MAINTENANCE;
f755e3b7 3850
45a7b16b
LP
3851 u = manager_get_unit(m, SPECIAL_EMERGENCY_TARGET);
3852 if (u && unit_active_or_pending(u))
3853 return MANAGER_MAINTENANCE;
3854 }
f755e3b7
LP
3855
3856 /* Are there any failed units? If so, we are in degraded mode */
3857 if (set_size(m->failed_units) > 0)
3858 return MANAGER_DEGRADED;
3859
3860 return MANAGER_RUNNING;
3861}
3862
00d9ef85
LP
3863#define DESTROY_IPC_FLAG (UINT32_C(1) << 31)
3864
3865static void manager_unref_uid_internal(
3866 Manager *m,
3867 Hashmap **uid_refs,
3868 uid_t uid,
3869 bool destroy_now,
3870 int (*_clean_ipc)(uid_t uid)) {
3871
3872 uint32_t c, n;
3873
3874 assert(m);
3875 assert(uid_refs);
3876 assert(uid_is_valid(uid));
3877 assert(_clean_ipc);
3878
3879 /* A generic implementation, covering both manager_unref_uid() and manager_unref_gid(), under the assumption
3880 * that uid_t and gid_t are actually defined the same way, with the same validity rules.
3881 *
3882 * We store a hashmap where the UID/GID is they key and the value is a 32bit reference counter, whose highest
3883 * bit is used as flag for marking UIDs/GIDs whose IPC objects to remove when the last reference to the UID/GID
3884 * is dropped. The flag is set to on, once at least one reference from a unit where RemoveIPC= is set is added
3885 * on a UID/GID. It is reset when the UID's/GID's reference counter drops to 0 again. */
3886
3887 assert_cc(sizeof(uid_t) == sizeof(gid_t));
3888 assert_cc(UID_INVALID == (uid_t) GID_INVALID);
3889
3890 if (uid == 0) /* We don't keep track of root, and will never destroy it */
3891 return;
3892
3893 c = PTR_TO_UINT32(hashmap_get(*uid_refs, UID_TO_PTR(uid)));
3894
3895 n = c & ~DESTROY_IPC_FLAG;
3896 assert(n > 0);
3897 n--;
3898
3899 if (destroy_now && n == 0) {
3900 hashmap_remove(*uid_refs, UID_TO_PTR(uid));
3901
3902 if (c & DESTROY_IPC_FLAG) {
3903 log_debug("%s " UID_FMT " is no longer referenced, cleaning up its IPC.",
3904 _clean_ipc == clean_ipc_by_uid ? "UID" : "GID",
3905 uid);
3906 (void) _clean_ipc(uid);
3907 }
3908 } else {
3909 c = n | (c & DESTROY_IPC_FLAG);
3910 assert_se(hashmap_update(*uid_refs, UID_TO_PTR(uid), UINT32_TO_PTR(c)) >= 0);
3911 }
3912}
3913
3914void manager_unref_uid(Manager *m, uid_t uid, bool destroy_now) {
3915 manager_unref_uid_internal(m, &m->uid_refs, uid, destroy_now, clean_ipc_by_uid);
3916}
3917
3918void manager_unref_gid(Manager *m, gid_t gid, bool destroy_now) {
3919 manager_unref_uid_internal(m, &m->gid_refs, (uid_t) gid, destroy_now, clean_ipc_by_gid);
3920}
3921
3922static int manager_ref_uid_internal(
3923 Manager *m,
3924 Hashmap **uid_refs,
3925 uid_t uid,
3926 bool clean_ipc) {
3927
3928 uint32_t c, n;
3929 int r;
3930
3931 assert(m);
3932 assert(uid_refs);
3933 assert(uid_is_valid(uid));
3934
3935 /* A generic implementation, covering both manager_ref_uid() and manager_ref_gid(), under the assumption
3936 * that uid_t and gid_t are actually defined the same way, with the same validity rules. */
3937
3938 assert_cc(sizeof(uid_t) == sizeof(gid_t));
3939 assert_cc(UID_INVALID == (uid_t) GID_INVALID);
3940
3941 if (uid == 0) /* We don't keep track of root, and will never destroy it */
3942 return 0;
3943
3944 r = hashmap_ensure_allocated(uid_refs, &trivial_hash_ops);
3945 if (r < 0)
3946 return r;
3947
3948 c = PTR_TO_UINT32(hashmap_get(*uid_refs, UID_TO_PTR(uid)));
3949
3950 n = c & ~DESTROY_IPC_FLAG;
3951 n++;
3952
3953 if (n & DESTROY_IPC_FLAG) /* check for overflow */
3954 return -EOVERFLOW;
3955
3956 c = n | (c & DESTROY_IPC_FLAG) | (clean_ipc ? DESTROY_IPC_FLAG : 0);
3957
3958 return hashmap_replace(*uid_refs, UID_TO_PTR(uid), UINT32_TO_PTR(c));
3959}
3960
3961int manager_ref_uid(Manager *m, uid_t uid, bool clean_ipc) {
3962 return manager_ref_uid_internal(m, &m->uid_refs, uid, clean_ipc);
3963}
3964
3965int manager_ref_gid(Manager *m, gid_t gid, bool clean_ipc) {
3966 return manager_ref_uid_internal(m, &m->gid_refs, (uid_t) gid, clean_ipc);
3967}
3968
3969static void manager_vacuum_uid_refs_internal(
3970 Manager *m,
3971 Hashmap **uid_refs,
3972 int (*_clean_ipc)(uid_t uid)) {
3973
3974 Iterator i;
3975 void *p, *k;
3976
3977 assert(m);
3978 assert(uid_refs);
3979 assert(_clean_ipc);
3980
3981 HASHMAP_FOREACH_KEY(p, k, *uid_refs, i) {
3982 uint32_t c, n;
3983 uid_t uid;
3984
3985 uid = PTR_TO_UID(k);
3986 c = PTR_TO_UINT32(p);
3987
3988 n = c & ~DESTROY_IPC_FLAG;
3989 if (n > 0)
3990 continue;
3991
3992 if (c & DESTROY_IPC_FLAG) {
3993 log_debug("Found unreferenced %s " UID_FMT " after reload/reexec. Cleaning up.",
3994 _clean_ipc == clean_ipc_by_uid ? "UID" : "GID",
3995 uid);
3996 (void) _clean_ipc(uid);
3997 }
3998
3999 assert_se(hashmap_remove(*uid_refs, k) == p);
4000 }
4001}
4002
4003void manager_vacuum_uid_refs(Manager *m) {
4004 manager_vacuum_uid_refs_internal(m, &m->uid_refs, clean_ipc_by_uid);
4005}
4006
4007void manager_vacuum_gid_refs(Manager *m) {
4008 manager_vacuum_uid_refs_internal(m, &m->gid_refs, clean_ipc_by_gid);
4009}
4010
4011static void manager_serialize_uid_refs_internal(
4012 Manager *m,
4013 FILE *f,
4014 Hashmap **uid_refs,
4015 const char *field_name) {
4016
4017 Iterator i;
4018 void *p, *k;
4019
4020 assert(m);
4021 assert(f);
4022 assert(uid_refs);
4023 assert(field_name);
4024
4025 /* Serialize the UID reference table. Or actually, just the IPC destruction flag of it, as the actual counter
4026 * of it is better rebuild after a reload/reexec. */
4027
4028 HASHMAP_FOREACH_KEY(p, k, *uid_refs, i) {
4029 uint32_t c;
4030 uid_t uid;
4031
4032 uid = PTR_TO_UID(k);
4033 c = PTR_TO_UINT32(p);
4034
4035 if (!(c & DESTROY_IPC_FLAG))
4036 continue;
4037
4038 fprintf(f, "%s=" UID_FMT "\n", field_name, uid);
4039 }
4040}
4041
4042void manager_serialize_uid_refs(Manager *m, FILE *f) {
4043 manager_serialize_uid_refs_internal(m, f, &m->uid_refs, "destroy-ipc-uid");
4044}
4045
4046void manager_serialize_gid_refs(Manager *m, FILE *f) {
4047 manager_serialize_uid_refs_internal(m, f, &m->gid_refs, "destroy-ipc-gid");
4048}
4049
4050static void manager_deserialize_uid_refs_one_internal(
4051 Manager *m,
4052 Hashmap** uid_refs,
4053 const char *value) {
4054
4055 uid_t uid;
4056 uint32_t c;
4057 int r;
4058
4059 assert(m);
4060 assert(uid_refs);
4061 assert(value);
4062
4063 r = parse_uid(value, &uid);
4064 if (r < 0 || uid == 0) {
4065 log_debug("Unable to parse UID reference serialization");
4066 return;
4067 }
4068
4069 r = hashmap_ensure_allocated(uid_refs, &trivial_hash_ops);
4070 if (r < 0) {
4071 log_oom();
4072 return;
4073 }
4074
4075 c = PTR_TO_UINT32(hashmap_get(*uid_refs, UID_TO_PTR(uid)));
4076 if (c & DESTROY_IPC_FLAG)
4077 return;
4078
4079 c |= DESTROY_IPC_FLAG;
4080
4081 r = hashmap_replace(*uid_refs, UID_TO_PTR(uid), UINT32_TO_PTR(c));
4082 if (r < 0) {
4083 log_debug("Failed to add UID reference entry");
4084 return;
4085 }
4086}
4087
4088void manager_deserialize_uid_refs_one(Manager *m, const char *value) {
4089 manager_deserialize_uid_refs_one_internal(m, &m->uid_refs, value);
4090}
4091
4092void manager_deserialize_gid_refs_one(Manager *m, const char *value) {
4093 manager_deserialize_uid_refs_one_internal(m, &m->gid_refs, value);
4094}
4095
4096int manager_dispatch_user_lookup_fd(sd_event_source *source, int fd, uint32_t revents, void *userdata) {
4097 struct buffer {
4098 uid_t uid;
4099 gid_t gid;
4100 char unit_name[UNIT_NAME_MAX+1];
4101 } _packed_ buffer;
4102
4103 Manager *m = userdata;
4104 ssize_t l;
4105 size_t n;
4106 Unit *u;
4107
4108 assert_se(source);
4109 assert_se(m);
4110
4111 /* Invoked whenever a child process succeeded resolving its user/group to use and sent us the resulting UID/GID
4112 * in a datagram. We parse the datagram here and pass it off to the unit, so that it can add a reference to the
4113 * UID/GID so that it can destroy the UID/GID's IPC objects when the reference counter drops to 0. */
4114
4115 l = recv(fd, &buffer, sizeof(buffer), MSG_DONTWAIT);
4116 if (l < 0) {
4c701096 4117 if (IN_SET(errno, EINTR, EAGAIN))
00d9ef85
LP
4118 return 0;
4119
4120 return log_error_errno(errno, "Failed to read from user lookup fd: %m");
4121 }
4122
4123 if ((size_t) l <= offsetof(struct buffer, unit_name)) {
4124 log_warning("Received too short user lookup message, ignoring.");
4125 return 0;
4126 }
4127
4128 if ((size_t) l > offsetof(struct buffer, unit_name) + UNIT_NAME_MAX) {
4129 log_warning("Received too long user lookup message, ignoring.");
4130 return 0;
4131 }
4132
4133 if (!uid_is_valid(buffer.uid) && !gid_is_valid(buffer.gid)) {
4134 log_warning("Got user lookup message with invalid UID/GID pair, ignoring.");
4135 return 0;
4136 }
4137
4138 n = (size_t) l - offsetof(struct buffer, unit_name);
4139 if (memchr(buffer.unit_name, 0, n)) {
4140 log_warning("Received lookup message with embedded NUL character, ignoring.");
4141 return 0;
4142 }
4143
4144 buffer.unit_name[n] = 0;
4145 u = manager_get_unit(m, buffer.unit_name);
4146 if (!u) {
4147 log_debug("Got user lookup message but unit doesn't exist, ignoring.");
4148 return 0;
4149 }
4150
4151 log_unit_debug(u, "User lookup succeeded: uid=" UID_FMT " gid=" GID_FMT, buffer.uid, buffer.gid);
4152
4153 unit_notify_user_lookup(u, buffer.uid, buffer.gid);
4154 return 0;
4155}
4156
af6b0ecc 4157char *manager_taint_string(Manager *m) {
90d7464d 4158 _cleanup_free_ char *destination = NULL, *overflowuid = NULL, *overflowgid = NULL;
af6b0ecc
LP
4159 char *buf, *e;
4160 int r;
4161
198ce932
ZJS
4162 /* Returns a "taint string", e.g. "local-hwclock:var-run-bad".
4163 * Only things that are detected at runtime should be tagged
4164 * here. For stuff that is set during compilation, emit a warning
4165 * in the configuration phase. */
4166
af6b0ecc
LP
4167 assert(m);
4168
4169 buf = new(char, sizeof("split-usr:"
4170 "cgroups-missing:"
4171 "local-hwclock:"
4172 "var-run-bad:"
90d7464d
LP
4173 "overflowuid-not-65534:"
4174 "overflowgid-not-65534:"));
af6b0ecc
LP
4175 if (!buf)
4176 return NULL;
4177
4178 e = buf;
0fd402b0 4179 buf[0] = 0;
af6b0ecc
LP
4180
4181 if (m->taint_usr)
4182 e = stpcpy(e, "split-usr:");
4183
4184 if (access("/proc/cgroups", F_OK) < 0)
4185 e = stpcpy(e, "cgroups-missing:");
4186
4187 if (clock_is_localtime(NULL) > 0)
4188 e = stpcpy(e, "local-hwclock:");
4189
4190 r = readlink_malloc("/var/run", &destination);
4191 if (r < 0 || !PATH_IN_SET(destination, "../run", "/run"))
4192 e = stpcpy(e, "var-run-bad:");
4193
90d7464d
LP
4194 r = read_one_line_file("/proc/sys/kernel/overflowuid", &overflowuid);
4195 if (r >= 0 && !streq(overflowuid, "65534"))
4196 e = stpcpy(e, "overflowuid-not-65534:");
4197
4198 r = read_one_line_file("/proc/sys/kernel/overflowgid", &overflowgid);
4199 if (r >= 0 && !streq(overflowgid, "65534"))
4200 e = stpcpy(e, "overflowgid-not-65534:");
4201
af6b0ecc
LP
4202 /* remove the last ':' */
4203 if (e != buf)
4204 e[-1] = 0;
4205
4206 return buf;
4207}
4208
adefcf28
LP
4209void manager_ref_console(Manager *m) {
4210 assert(m);
4211
4212 m->n_on_console++;
4213}
4214
4215void manager_unref_console(Manager *m) {
4216
4217 assert(m->n_on_console > 0);
4218 m->n_on_console--;
4219
4220 if (m->n_on_console == 0)
4221 m->no_console_output = false; /* unset no_console_output flag, since the console is definitely free now */
4222}
4223
f755e3b7 4224static const char *const manager_state_table[_MANAGER_STATE_MAX] = {
d81afec1 4225 [MANAGER_INITIALIZING] = "initializing",
f755e3b7
LP
4226 [MANAGER_STARTING] = "starting",
4227 [MANAGER_RUNNING] = "running",
4228 [MANAGER_DEGRADED] = "degraded",
4229 [MANAGER_MAINTENANCE] = "maintenance",
4230 [MANAGER_STOPPING] = "stopping",
4231};
4232
4233DEFINE_STRING_TABLE_LOOKUP(manager_state, ManagerState);
9f9f0342
LP
4234
4235static const char *const manager_timestamp_table[_MANAGER_TIMESTAMP_MAX] = {
4236 [MANAGER_TIMESTAMP_FIRMWARE] = "firmware",
4237 [MANAGER_TIMESTAMP_LOADER] = "loader",
4238 [MANAGER_TIMESTAMP_KERNEL] = "kernel",
4239 [MANAGER_TIMESTAMP_INITRD] = "initrd",
4240 [MANAGER_TIMESTAMP_USERSPACE] = "userspace",
4241 [MANAGER_TIMESTAMP_FINISH] = "finish",
4242 [MANAGER_TIMESTAMP_SECURITY_START] = "security-start",
4243 [MANAGER_TIMESTAMP_SECURITY_FINISH] = "security-finish",
4244 [MANAGER_TIMESTAMP_GENERATORS_START] = "generators-start",
4245 [MANAGER_TIMESTAMP_GENERATORS_FINISH] = "generators-finish",
4246 [MANAGER_TIMESTAMP_UNITS_LOAD_START] = "units-load-start",
4247 [MANAGER_TIMESTAMP_UNITS_LOAD_FINISH] = "units-load-finish",
4248};
4249
4250DEFINE_STRING_TABLE_LOOKUP(manager_timestamp, ManagerTimestamp);