git.ipfire.org Git - thirdparty/systemd.git/blob - src/core/socket.c
Merge pull request #10262 from keszybz/hibres-disable
[thirdparty/systemd.git] / src / core / socket.c
1 /* SPDX-License-Identifier: LGPL-2.1+ */
2
3 #include <arpa/inet.h>
4 #include <errno.h>
5 #include <fcntl.h>
6 #include <mqueue.h>
7 #include <netinet/tcp.h>
8 #include <signal.h>
9 #include <sys/epoll.h>
10 #include <sys/stat.h>
11 #include <unistd.h>
12 #include <linux/sctp.h>
13
14 #include "alloc-util.h"
15 #include "bpf-firewall.h"
16 #include "bus-error.h"
17 #include "bus-util.h"
18 #include "copy.h"
19 #include "dbus-socket.h"
20 #include "def.h"
21 #include "exit-status.h"
22 #include "fd-util.h"
23 #include "format-util.h"
24 #include "fs-util.h"
25 #include "in-addr-util.h"
26 #include "io-util.h"
27 #include "label.h"
28 #include "log.h"
29 #include "missing.h"
30 #include "mkdir.h"
31 #include "parse-util.h"
32 #include "path-util.h"
33 #include "process-util.h"
34 #include "selinux-util.h"
35 #include "signal-util.h"
36 #include "smack-util.h"
37 #include "socket.h"
38 #include "socket-protocol-list.h"
39 #include "special.h"
40 #include "string-table.h"
41 #include "string-util.h"
42 #include "strv.h"
43 #include "unit-name.h"
44 #include "unit.h"
45 #include "user-util.h"
46
47 struct SocketPeer {
48 unsigned n_ref;
49
50 Socket *socket;
51 union sockaddr_union peer;
52 socklen_t peer_salen;
53 };
54
55 static const UnitActiveState state_translation_table[_SOCKET_STATE_MAX] = {
56 [SOCKET_DEAD] = UNIT_INACTIVE,
57 [SOCKET_START_PRE] = UNIT_ACTIVATING,
58 [SOCKET_START_CHOWN] = UNIT_ACTIVATING,
59 [SOCKET_START_POST] = UNIT_ACTIVATING,
60 [SOCKET_LISTENING] = UNIT_ACTIVE,
61 [SOCKET_RUNNING] = UNIT_ACTIVE,
62 [SOCKET_STOP_PRE] = UNIT_DEACTIVATING,
63 [SOCKET_STOP_PRE_SIGTERM] = UNIT_DEACTIVATING,
64 [SOCKET_STOP_PRE_SIGKILL] = UNIT_DEACTIVATING,
65 [SOCKET_STOP_POST] = UNIT_DEACTIVATING,
66 [SOCKET_FINAL_SIGTERM] = UNIT_DEACTIVATING,
67 [SOCKET_FINAL_SIGKILL] = UNIT_DEACTIVATING,
68 [SOCKET_FAILED] = UNIT_FAILED
69 };
70
71 static int socket_dispatch_io(sd_event_source *source, int fd, uint32_t revents, void *userdata);
72 static int socket_dispatch_timer(sd_event_source *source, usec_t usec, void *userdata);
73
74 static void socket_init(Unit *u) {
75 Socket *s = SOCKET(u);
76
77 assert(u);
78 assert(u->load_state == UNIT_STUB);
79
80 s->backlog = SOMAXCONN;
81 s->timeout_usec = u->manager->default_timeout_start_usec;
82 s->directory_mode = 0755;
83 s->socket_mode = 0666;
84
85 s->max_connections = 64;
86
87 s->priority = -1;
88 s->ip_tos = -1;
89 s->ip_ttl = -1;
90 s->mark = -1;
91
92 s->exec_context.std_output = u->manager->default_std_output;
93 s->exec_context.std_error = u->manager->default_std_error;
94
95 s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
96
97 s->trigger_limit.interval = USEC_INFINITY;
98 s->trigger_limit.burst = (unsigned) -1;
99 }
100
101 static void socket_unwatch_control_pid(Socket *s) {
102 assert(s);
103
104 if (s->control_pid <= 0)
105 return;
106
107 unit_unwatch_pid(UNIT(s), s->control_pid);
108 s->control_pid = 0;
109 }
110
111 static void socket_cleanup_fd_list(SocketPort *p) {
112 assert(p);
113
114 close_many(p->auxiliary_fds, p->n_auxiliary_fds);
115 p->auxiliary_fds = mfree(p->auxiliary_fds);
116 p->n_auxiliary_fds = 0;
117 }
118
119 void socket_free_ports(Socket *s) {
120 SocketPort *p;
121
122 assert(s);
123
124 while ((p = s->ports)) {
125 LIST_REMOVE(port, s->ports, p);
126
127 sd_event_source_unref(p->event_source);
128
129 socket_cleanup_fd_list(p);
130 safe_close(p->fd);
131 free(p->path);
132 free(p);
133 }
134 }
135
136 static void socket_done(Unit *u) {
137 Socket *s = SOCKET(u);
138 SocketPeer *p;
139
140 assert(s);
141
142 socket_free_ports(s);
143
144 while ((p = set_steal_first(s->peers_by_address)))
145 p->socket = NULL;
146
147 s->peers_by_address = set_free(s->peers_by_address);
148
149 s->exec_runtime = exec_runtime_unref(s->exec_runtime, false);
150 exec_command_free_array(s->exec_command, _SOCKET_EXEC_COMMAND_MAX);
151 s->control_command = NULL;
152
153 dynamic_creds_unref(&s->dynamic_creds);
154
155 socket_unwatch_control_pid(s);
156
157 unit_ref_unset(&s->service);
158
159 s->tcp_congestion = mfree(s->tcp_congestion);
160 s->bind_to_device = mfree(s->bind_to_device);
161
162 s->smack = mfree(s->smack);
163 s->smack_ip_in = mfree(s->smack_ip_in);
164 s->smack_ip_out = mfree(s->smack_ip_out);
165
166 strv_free(s->symlinks);
167
168 s->user = mfree(s->user);
169 s->group = mfree(s->group);
170
171 s->fdname = mfree(s->fdname);
172
173 s->timer_event_source = sd_event_source_unref(s->timer_event_source);
174 }
175
176 static int socket_arm_timer(Socket *s, usec_t usec) {
177 int r;
178
179 assert(s);
180
181 if (s->timer_event_source) {
182 r = sd_event_source_set_time(s->timer_event_source, usec);
183 if (r < 0)
184 return r;
185
186 return sd_event_source_set_enabled(s->timer_event_source, SD_EVENT_ONESHOT);
187 }
188
189 if (usec == USEC_INFINITY)
190 return 0;
191
192 r = sd_event_add_time(
193 UNIT(s)->manager->event,
194 &s->timer_event_source,
195 CLOCK_MONOTONIC,
196 usec, 0,
197 socket_dispatch_timer, s);
198 if (r < 0)
199 return r;
200
201 (void) sd_event_source_set_description(s->timer_event_source, "socket-timer");
202
203 return 0;
204 }
205
206 int socket_instantiate_service(Socket *s) {
207 _cleanup_free_ char *prefix = NULL, *name = NULL;
208 int r;
209 Unit *u;
210
211 assert(s);
212
213 /* This fills in s->service if it isn't filled in yet. For
214 * Accept=yes sockets we create the next connection service
215 * here. For Accept=no this is mostly a NOP since the service
216 * is figured out at load time anyway. */
217
218 if (UNIT_DEREF(s->service))
219 return 0;
220
221 if (!s->accept)
222 return 0;
223
224 r = unit_name_to_prefix(UNIT(s)->id, &prefix);
225 if (r < 0)
226 return r;
227
228 if (asprintf(&name, "%s@%u.service", prefix, s->n_accepted) < 0)
229 return -ENOMEM;
230
231 r = manager_load_unit(UNIT(s)->manager, name, NULL, NULL, &u);
232 if (r < 0)
233 return r;
234
235 unit_ref_set(&s->service, UNIT(s), u);
236
237 return unit_add_two_dependencies(UNIT(s), UNIT_BEFORE, UNIT_TRIGGERS, u, false, UNIT_DEPENDENCY_IMPLICIT);
238 }
239
240 static bool have_non_accept_socket(Socket *s) {
241 SocketPort *p;
242
243 assert(s);
244
245 if (!s->accept)
246 return true;
247
248 LIST_FOREACH(port, p, s->ports) {
249
250 if (p->type != SOCKET_SOCKET)
251 return true;
252
253 if (!socket_address_can_accept(&p->address))
254 return true;
255 }
256
257 return false;
258 }
259
260 static int socket_add_mount_dependencies(Socket *s) {
261 SocketPort *p;
262 int r;
263
264 assert(s);
265
266 LIST_FOREACH(port, p, s->ports) {
267 const char *path = NULL;
268
269 if (p->type == SOCKET_SOCKET)
270 path = socket_address_get_path(&p->address);
271 else if (IN_SET(p->type, SOCKET_FIFO, SOCKET_SPECIAL, SOCKET_USB_FUNCTION))
272 path = p->path;
273
274 if (!path)
275 continue;
276
277 r = unit_require_mounts_for(UNIT(s), path, UNIT_DEPENDENCY_FILE);
278 if (r < 0)
279 return r;
280 }
281
282 return 0;
283 }
284
285 static int socket_add_device_dependencies(Socket *s) {
286 char *t;
287
288 assert(s);
289
290 if (!s->bind_to_device || streq(s->bind_to_device, "lo"))
291 return 0;
292
293 t = strjoina("/sys/subsystem/net/devices/", s->bind_to_device);
294 return unit_add_node_dependency(UNIT(s), t, false, UNIT_BINDS_TO, UNIT_DEPENDENCY_FILE);
295 }
296
297 static int socket_add_default_dependencies(Socket *s) {
298 int r;
299 assert(s);
300
301 if (!UNIT(s)->default_dependencies)
302 return 0;
303
304 r = unit_add_dependency_by_name(UNIT(s), UNIT_BEFORE, SPECIAL_SOCKETS_TARGET, true, UNIT_DEPENDENCY_DEFAULT);
305 if (r < 0)
306 return r;
307
308 if (MANAGER_IS_SYSTEM(UNIT(s)->manager)) {
309 r = unit_add_two_dependencies_by_name(UNIT(s), UNIT_AFTER, UNIT_REQUIRES, SPECIAL_SYSINIT_TARGET, true, UNIT_DEPENDENCY_DEFAULT);
310 if (r < 0)
311 return r;
312 }
313
314 return unit_add_two_dependencies_by_name(UNIT(s), UNIT_BEFORE, UNIT_CONFLICTS, SPECIAL_SHUTDOWN_TARGET, true, UNIT_DEPENDENCY_DEFAULT);
315 }
316
317 _pure_ static bool socket_has_exec(Socket *s) {
318 unsigned i;
319 assert(s);
320
321 for (i = 0; i < _SOCKET_EXEC_COMMAND_MAX; i++)
322 if (s->exec_command[i])
323 return true;
324
325 return false;
326 }
327
328 static int socket_add_extras(Socket *s) {
329 Unit *u = UNIT(s);
330 int r;
331
332 assert(s);
333
334 /* Pick defaults for the trigger limit, if nothing was explicitly configured. We pick a relatively high limit
335 * in Accept=yes mode, and a lower limit for Accept=no. Reason: in Accept=yes mode we are invoking accept()
336 * ourselves before the trigger limit can hit, thus incoming connections are taken off the socket queue quickly
337 * and reliably. This is different for Accept=no, where the spawned service has to take the incoming traffic
338 * off the queues, which it might not necessarily do. Moreover, while Accept=no services are supposed to
339 * process whatever is queued in one go, and thus should normally never have to be started frequently. This is
340 * different for Accept=yes where each connection is processed by a new service instance, and thus frequent
341 * service starts are typical. */
342
343 if (s->trigger_limit.interval == USEC_INFINITY)
344 s->trigger_limit.interval = 2 * USEC_PER_SEC;
345
346 if (s->trigger_limit.burst == (unsigned) -1) {
347 if (s->accept)
348 s->trigger_limit.burst = 200;
349 else
350 s->trigger_limit.burst = 20;
351 }
352
353 if (have_non_accept_socket(s)) {
354
355 if (!UNIT_DEREF(s->service)) {
356 Unit *x;
357
358 r = unit_load_related_unit(u, ".service", &x);
359 if (r < 0)
360 return r;
361
362 unit_ref_set(&s->service, u, x);
363 }
364
365 r = unit_add_two_dependencies(u, UNIT_BEFORE, UNIT_TRIGGERS, UNIT_DEREF(s->service), true, UNIT_DEPENDENCY_IMPLICIT);
366 if (r < 0)
367 return r;
368 }
369
370 r = socket_add_mount_dependencies(s);
371 if (r < 0)
372 return r;
373
374 r = socket_add_device_dependencies(s);
375 if (r < 0)
376 return r;
377
378 r = unit_patch_contexts(u);
379 if (r < 0)
380 return r;
381
382 if (socket_has_exec(s)) {
383 r = unit_add_exec_dependencies(u, &s->exec_context);
384 if (r < 0)
385 return r;
386 }
387
388 r = unit_set_default_slice(u);
389 if (r < 0)
390 return r;
391
392 r = socket_add_default_dependencies(s);
393 if (r < 0)
394 return r;
395
396 return 0;
397 }
398
399 static const char *socket_find_symlink_target(Socket *s) {
400 const char *found = NULL;
401 SocketPort *p;
402
403 LIST_FOREACH(port, p, s->ports) {
404 const char *f = NULL;
405
406 switch (p->type) {
407
408 case SOCKET_FIFO:
409 f = p->path;
410 break;
411
412 case SOCKET_SOCKET:
413 f = socket_address_get_path(&p->address);
414 break;
415
416 default:
417 break;
418 }
419
420 if (f) {
421 if (found)
422 return NULL;
423
424 found = f;
425 }
426 }
427
428 return found;
429 }
430
431 static int socket_verify(Socket *s) {
432 assert(s);
433
434 if (UNIT(s)->load_state != UNIT_LOADED)
435 return 0;
436
437 if (!s->ports) {
438 log_unit_error(UNIT(s), "Unit has no Listen setting (ListenStream=, ListenDatagram=, ListenFIFO=, ...). Refusing.");
439 return -ENOEXEC;
440 }
441
442 if (s->accept && have_non_accept_socket(s)) {
443 log_unit_error(UNIT(s), "Unit configured for accepting sockets, but sockets are non-accepting. Refusing.");
444 return -ENOEXEC;
445 }
446
447 if (s->accept && s->max_connections <= 0) {
448 log_unit_error(UNIT(s), "MaxConnection= setting too small. Refusing.");
449 return -ENOEXEC;
450 }
451
452 if (s->accept && UNIT_DEREF(s->service)) {
453 log_unit_error(UNIT(s), "Explicit service configuration for accepting socket units not supported. Refusing.");
454 return -ENOEXEC;
455 }
456
457 if (s->exec_context.pam_name && s->kill_context.kill_mode != KILL_CONTROL_GROUP) {
458 log_unit_error(UNIT(s), "Unit has PAM enabled. Kill mode must be set to 'control-group'. Refusing.");
459 return -ENOEXEC;
460 }
461
462 if (!strv_isempty(s->symlinks) && !socket_find_symlink_target(s)) {
463 log_unit_error(UNIT(s), "Unit has symlinks set but none or more than one node in the file system. Refusing.");
464 return -ENOEXEC;
465 }
466
467 return 0;
468 }
469
470 static void peer_address_hash_func(const void *p, struct siphash *state) {
471 const SocketPeer *s = p;
472
473 assert(s);
474
475 if (s->peer.sa.sa_family == AF_INET)
476 siphash24_compress(&s->peer.in.sin_addr, sizeof(s->peer.in.sin_addr), state);
477 else if (s->peer.sa.sa_family == AF_INET6)
478 siphash24_compress(&s->peer.in6.sin6_addr, sizeof(s->peer.in6.sin6_addr), state);
479 else if (s->peer.sa.sa_family == AF_VSOCK)
480 siphash24_compress(&s->peer.vm.svm_cid, sizeof(s->peer.vm.svm_cid), state);
481 else
482 assert_not_reached("Unknown address family.");
483 }
484
485 static int peer_address_compare_func(const void *a, const void *b) {
486 const SocketPeer *x = a, *y = b;
487 int r;
488
489 r = CMP(x->peer.sa.sa_family, y->peer.sa.sa_family);
490 if (r != 0)
491 return r;
492
493 switch(x->peer.sa.sa_family) {
494 case AF_INET:
495 return memcmp(&x->peer.in.sin_addr, &y->peer.in.sin_addr, sizeof(x->peer.in.sin_addr));
496 case AF_INET6:
497 return memcmp(&x->peer.in6.sin6_addr, &y->peer.in6.sin6_addr, sizeof(x->peer.in6.sin6_addr));
498 case AF_VSOCK:
499 if (x->peer.vm.svm_cid < y->peer.vm.svm_cid)
500 return -1;
501 if (x->peer.vm.svm_cid > y->peer.vm.svm_cid)
502 return 1;
503 return 0;
504 }
505 assert_not_reached("Black sheep in the family!");
506 }
507
508 const struct hash_ops peer_address_hash_ops = {
509 .hash = peer_address_hash_func,
510 .compare = peer_address_compare_func
511 };
512
513 static int socket_load(Unit *u) {
514 Socket *s = SOCKET(u);
515 int r;
516
517 assert(u);
518 assert(u->load_state == UNIT_STUB);
519
520 r = set_ensure_allocated(&s->peers_by_address, &peer_address_hash_ops);
521 if (r < 0)
522 return r;
523
524 r = unit_load_fragment_and_dropin(u);
525 if (r < 0)
526 return r;
527
528 if (u->load_state == UNIT_LOADED) {
529 /* This is a new unit? Then let's add in some extras */
530 r = socket_add_extras(s);
531 if (r < 0)
532 return r;
533 }
534
535 return socket_verify(s);
536 }
537
538 static SocketPeer *socket_peer_new(void) {
539 SocketPeer *p;
540
541 p = new0(SocketPeer, 1);
542 if (!p)
543 return NULL;
544
545 p->n_ref = 1;
546
547 return p;
548 }
549
550 static SocketPeer *socket_peer_free(SocketPeer *p) {
551 assert(p);
552
553 if (p->socket)
554 set_remove(p->socket->peers_by_address, p);
555
556 return mfree(p);
557 }
558
559 DEFINE_TRIVIAL_REF_UNREF_FUNC(SocketPeer, socket_peer, socket_peer_free);
560
561 int socket_acquire_peer(Socket *s, int fd, SocketPeer **p) {
562 _cleanup_(socket_peer_unrefp) SocketPeer *remote = NULL;
563 SocketPeer sa = {}, *i;
564 socklen_t salen = sizeof(sa.peer);
565 int r;
566
567 assert(fd >= 0);
568 assert(s);
569
570 r = getpeername(fd, &sa.peer.sa, &salen);
571 if (r < 0)
572 return log_error_errno(errno, "getpeername failed: %m");
573
574 if (!IN_SET(sa.peer.sa.sa_family, AF_INET, AF_INET6, AF_VSOCK)) {
575 *p = NULL;
576 return 0;
577 }
578
579 i = set_get(s->peers_by_address, &sa);
580 if (i) {
581 *p = socket_peer_ref(i);
582 return 1;
583 }
584
585 remote = socket_peer_new();
586 if (!remote)
587 return log_oom();
588
589 remote->peer = sa.peer;
590 remote->peer_salen = salen;
591
592 r = set_put(s->peers_by_address, remote);
593 if (r < 0)
594 return r;
595
596 remote->socket = s;
597
598 *p = TAKE_PTR(remote);
599
600 return 1;
601 }
602
603 _const_ static const char* listen_lookup(int family, int type) {
604
605 if (family == AF_NETLINK)
606 return "ListenNetlink";
607
608 if (type == SOCK_STREAM)
609 return "ListenStream";
610 else if (type == SOCK_DGRAM)
611 return "ListenDatagram";
612 else if (type == SOCK_SEQPACKET)
613 return "ListenSequentialPacket";
614
615 assert_not_reached("Unknown socket type");
616 return NULL;
617 }
618
619 static void socket_dump(Unit *u, FILE *f, const char *prefix) {
620 char time_string[FORMAT_TIMESPAN_MAX];
621 SocketExecCommand c;
622 Socket *s = SOCKET(u);
623 SocketPort *p;
624 const char *prefix2, *str;
625
626 assert(s);
627 assert(f);
628
629 prefix = strempty(prefix);
630 prefix2 = strjoina(prefix, "\t");
631
632 fprintf(f,
633 "%sSocket State: %s\n"
634 "%sResult: %s\n"
635 "%sBindIPv6Only: %s\n"
636 "%sBacklog: %u\n"
637 "%sSocketMode: %04o\n"
638 "%sDirectoryMode: %04o\n"
639 "%sKeepAlive: %s\n"
640 "%sNoDelay: %s\n"
641 "%sFreeBind: %s\n"
642 "%sTransparent: %s\n"
643 "%sBroadcast: %s\n"
644 "%sPassCredentials: %s\n"
645 "%sPassSecurity: %s\n"
646 "%sTCPCongestion: %s\n"
647 "%sRemoveOnStop: %s\n"
648 "%sWritable: %s\n"
649 "%sFileDescriptorName: %s\n"
650 "%sSELinuxContextFromNet: %s\n",
651 prefix, socket_state_to_string(s->state),
652 prefix, socket_result_to_string(s->result),
653 prefix, socket_address_bind_ipv6_only_to_string(s->bind_ipv6_only),
654 prefix, s->backlog,
655 prefix, s->socket_mode,
656 prefix, s->directory_mode,
657 prefix, yes_no(s->keep_alive),
658 prefix, yes_no(s->no_delay),
659 prefix, yes_no(s->free_bind),
660 prefix, yes_no(s->transparent),
661 prefix, yes_no(s->broadcast),
662 prefix, yes_no(s->pass_cred),
663 prefix, yes_no(s->pass_sec),
664 prefix, strna(s->tcp_congestion),
665 prefix, yes_no(s->remove_on_stop),
666 prefix, yes_no(s->writable),
667 prefix, socket_fdname(s),
668 prefix, yes_no(s->selinux_context_from_net));
669
670 if (s->control_pid > 0)
671 fprintf(f,
672 "%sControl PID: "PID_FMT"\n",
673 prefix, s->control_pid);
674
675 if (s->bind_to_device)
676 fprintf(f,
677 "%sBindToDevice: %s\n",
678 prefix, s->bind_to_device);
679
680 if (s->accept)
681 fprintf(f,
682 "%sAccepted: %u\n"
683 "%sNConnections: %u\n"
684 "%sMaxConnections: %u\n"
685 "%sMaxConnectionsPerSource: %u\n",
686 prefix, s->n_accepted,
687 prefix, s->n_connections,
688 prefix, s->max_connections,
689 prefix, s->max_connections_per_source);
690
691 if (s->priority >= 0)
692 fprintf(f,
693 "%sPriority: %i\n",
694 prefix, s->priority);
695
696 if (s->receive_buffer > 0)
697 fprintf(f,
698 "%sReceiveBuffer: %zu\n",
699 prefix, s->receive_buffer);
700
701 if (s->send_buffer > 0)
702 fprintf(f,
703 "%sSendBuffer: %zu\n",
704 prefix, s->send_buffer);
705
706 if (s->ip_tos >= 0)
707 fprintf(f,
708 "%sIPTOS: %i\n",
709 prefix, s->ip_tos);
710
711 if (s->ip_ttl >= 0)
712 fprintf(f,
713 "%sIPTTL: %i\n",
714 prefix, s->ip_ttl);
715
716 if (s->pipe_size > 0)
717 fprintf(f,
718 "%sPipeSize: %zu\n",
719 prefix, s->pipe_size);
720
721 if (s->mark >= 0)
722 fprintf(f,
723 "%sMark: %i\n",
724 prefix, s->mark);
725
726 if (s->mq_maxmsg > 0)
727 fprintf(f,
728 "%sMessageQueueMaxMessages: %li\n",
729 prefix, s->mq_maxmsg);
730
731 if (s->mq_msgsize > 0)
732 fprintf(f,
733 "%sMessageQueueMessageSize: %li\n",
734 prefix, s->mq_msgsize);
735
736 if (s->reuse_port)
737 fprintf(f,
738 "%sReusePort: %s\n",
739 prefix, yes_no(s->reuse_port));
740
741 if (s->smack)
742 fprintf(f,
743 "%sSmackLabel: %s\n",
744 prefix, s->smack);
745
746 if (s->smack_ip_in)
747 fprintf(f,
748 "%sSmackLabelIPIn: %s\n",
749 prefix, s->smack_ip_in);
750
751 if (s->smack_ip_out)
752 fprintf(f,
753 "%sSmackLabelIPOut: %s\n",
754 prefix, s->smack_ip_out);
755
756 if (!isempty(s->user) || !isempty(s->group))
757 fprintf(f,
758 "%sSocketUser: %s\n"
759 "%sSocketGroup: %s\n",
760 prefix, strna(s->user),
761 prefix, strna(s->group));
762
763 if (s->keep_alive_time > 0)
764 fprintf(f,
765 "%sKeepAliveTimeSec: %s\n",
766 prefix, format_timespan(time_string, FORMAT_TIMESPAN_MAX, s->keep_alive_time, USEC_PER_SEC));
767
768 if (s->keep_alive_interval > 0)
769 fprintf(f,
770 "%sKeepAliveIntervalSec: %s\n",
771 prefix, format_timespan(time_string, FORMAT_TIMESPAN_MAX, s->keep_alive_interval, USEC_PER_SEC));
772
773 if (s->keep_alive_cnt > 0)
774 fprintf(f,
775 "%sKeepAliveProbes: %u\n",
776 prefix, s->keep_alive_cnt);
777
778 if (s->defer_accept > 0)
779 fprintf(f,
780 "%sDeferAcceptSec: %s\n",
781 prefix, format_timespan(time_string, FORMAT_TIMESPAN_MAX, s->defer_accept, USEC_PER_SEC));
782
783 LIST_FOREACH(port, p, s->ports) {
784
785 switch (p->type) {
786 case SOCKET_SOCKET: {
787 _cleanup_free_ char *k = NULL;
788 const char *t;
789 int r;
790
791 r = socket_address_print(&p->address, &k);
792 if (r < 0)
793 t = strerror(-r);
794 else
795 t = k;
796
797 fprintf(f, "%s%s: %s\n", prefix, listen_lookup(socket_address_family(&p->address), p->address.type), t);
798 break;
799 }
800 case SOCKET_SPECIAL:
801 fprintf(f, "%sListenSpecial: %s\n", prefix, p->path);
802 break;
803 case SOCKET_USB_FUNCTION:
804 fprintf(f, "%sListenUSBFunction: %s\n", prefix, p->path);
805 break;
806 case SOCKET_MQUEUE:
807 fprintf(f, "%sListenMessageQueue: %s\n", prefix, p->path);
808 break;
809 default:
810 fprintf(f, "%sListenFIFO: %s\n", prefix, p->path);
811 }
812 }
813
814 fprintf(f,
815 "%sTriggerLimitIntervalSec: %s\n"
816 "%sTriggerLimitBurst: %u\n",
817 prefix, format_timespan(time_string, FORMAT_TIMESPAN_MAX, s->trigger_limit.interval, USEC_PER_SEC),
818 prefix, s->trigger_limit.burst);
819
820 str = socket_protocol_to_name(s->socket_protocol);
821 if (str)
822 fprintf(f, "%sSocketProtocol: %s\n", prefix, str);
823
824 if (!strv_isempty(s->symlinks)) {
825 char **q;
826
827 fprintf(f, "%sSymlinks:", prefix);
828 STRV_FOREACH(q, s->symlinks)
829 fprintf(f, " %s", *q);
830
831 fprintf(f, "\n");
832 }
833
834 fprintf(f,
835 "%sTimeoutSec: %s\n",
836 prefix, format_timespan(time_string, FORMAT_TIMESPAN_MAX, s->timeout_usec, USEC_PER_SEC));
837
838 exec_context_dump(&s->exec_context, f, prefix);
839 kill_context_dump(&s->kill_context, f, prefix);
840
841 for (c = 0; c < _SOCKET_EXEC_COMMAND_MAX; c++) {
842 if (!s->exec_command[c])
843 continue;
844
845 fprintf(f, "%s-> %s:\n",
846 prefix, socket_exec_command_to_string(c));
847
848 exec_command_dump_list(s->exec_command[c], f, prefix2);
849 }
850
851 cgroup_context_dump(&s->cgroup_context, f, prefix);
852 }
853
854 static int instance_from_socket(int fd, unsigned nr, char **instance) {
855 socklen_t l;
856 char *r;
857 union sockaddr_union local, remote;
858
859 assert(fd >= 0);
860 assert(instance);
861
862 l = sizeof(local);
863 if (getsockname(fd, &local.sa, &l) < 0)
864 return -errno;
865
866 l = sizeof(remote);
867 if (getpeername(fd, &remote.sa, &l) < 0)
868 return -errno;
869
870 switch (local.sa.sa_family) {
871
872 case AF_INET: {
873 uint32_t
874 a = be32toh(local.in.sin_addr.s_addr),
875 b = be32toh(remote.in.sin_addr.s_addr);
876
877 if (asprintf(&r,
878 "%u-%u.%u.%u.%u:%u-%u.%u.%u.%u:%u",
879 nr,
880 a >> 24, (a >> 16) & 0xFF, (a >> 8) & 0xFF, a & 0xFF,
881 be16toh(local.in.sin_port),
882 b >> 24, (b >> 16) & 0xFF, (b >> 8) & 0xFF, b & 0xFF,
883 be16toh(remote.in.sin_port)) < 0)
884 return -ENOMEM;
885
886 break;
887 }
888
889 case AF_INET6: {
890 static const unsigned char ipv4_prefix[] = {
891 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0xFF, 0xFF
892 };
893
894 if (memcmp(&local.in6.sin6_addr, ipv4_prefix, sizeof(ipv4_prefix)) == 0 &&
895 memcmp(&remote.in6.sin6_addr, ipv4_prefix, sizeof(ipv4_prefix)) == 0) {
896 const uint8_t
897 *a = local.in6.sin6_addr.s6_addr+12,
898 *b = remote.in6.sin6_addr.s6_addr+12;
899
900 if (asprintf(&r,
901 "%u-%u.%u.%u.%u:%u-%u.%u.%u.%u:%u",
902 nr,
903 a[0], a[1], a[2], a[3],
904 be16toh(local.in6.sin6_port),
905 b[0], b[1], b[2], b[3],
906 be16toh(remote.in6.sin6_port)) < 0)
907 return -ENOMEM;
908 } else {
909 char a[INET6_ADDRSTRLEN], b[INET6_ADDRSTRLEN];
910
911 if (asprintf(&r,
912 "%u-%s:%u-%s:%u",
913 nr,
914 inet_ntop(AF_INET6, &local.in6.sin6_addr, a, sizeof(a)),
915 be16toh(local.in6.sin6_port),
916 inet_ntop(AF_INET6, &remote.in6.sin6_addr, b, sizeof(b)),
917 be16toh(remote.in6.sin6_port)) < 0)
918 return -ENOMEM;
919 }
920
921 break;
922 }
923
924 case AF_UNIX: {
925 struct ucred ucred;
926 int k;
927
928 k = getpeercred(fd, &ucred);
929 if (k >= 0) {
930 if (asprintf(&r,
931 "%u-"PID_FMT"-"UID_FMT,
932 nr, ucred.pid, ucred.uid) < 0)
933 return -ENOMEM;
934 } else if (k == -ENODATA) {
935 /* This handles the case where somebody is
936 * connecting from another pid/uid namespace
937 * (e.g. from outside of our container). */
938 if (asprintf(&r,
939 "%u-unknown",
940 nr) < 0)
941 return -ENOMEM;
942 } else
943 return k;
944
945 break;
946 }
947
948 case AF_VSOCK:
949 if (asprintf(&r,
950 "%u-%u:%u-%u:%u",
951 nr,
952 local.vm.svm_cid, local.vm.svm_port,
953 remote.vm.svm_cid, remote.vm.svm_port) < 0)
954 return -ENOMEM;
955
956 break;
957
958 default:
959 assert_not_reached("Unhandled socket type.");
960 }
961
962 *instance = r;
963 return 0;
964 }
965
966 static void socket_close_fds(Socket *s) {
967 SocketPort *p;
968 char **i;
969
970 assert(s);
971
972 LIST_FOREACH(port, p, s->ports) {
973 bool was_open;
974
975 was_open = p->fd >= 0;
976
977 p->event_source = sd_event_source_unref(p->event_source);
978 p->fd = safe_close(p->fd);
979 socket_cleanup_fd_list(p);
980
981 /* One little note: we should normally not delete any sockets in the file system here! After all some
982 * other process we spawned might still have a reference of this fd and wants to continue to use
983 * it. Therefore we normally delete sockets in the file system before we create a new one, not after we
984 * stopped using one! That all said, if the user explicitly requested this, we'll delete them here
985 * anyway, but only then. */
986
987 if (!was_open || !s->remove_on_stop)
988 continue;
989
990 switch (p->type) {
991
992 case SOCKET_FIFO:
993 (void) unlink(p->path);
994 break;
995
996 case SOCKET_MQUEUE:
997 (void) mq_unlink(p->path);
998 break;
999
1000 case SOCKET_SOCKET:
1001 (void) socket_address_unlink(&p->address);
1002 break;
1003
1004 default:
1005 break;
1006 }
1007 }
1008
1009 if (s->remove_on_stop)
1010 STRV_FOREACH(i, s->symlinks)
1011 (void) unlink(*i);
1012 }
1013
1014 static void socket_apply_socket_options(Socket *s, int fd) {
1015 int r;
1016
1017 assert(s);
1018 assert(fd >= 0);
1019
1020 if (s->keep_alive) {
1021 int one = 1;
1022 if (setsockopt(fd, SOL_SOCKET, SO_KEEPALIVE, &one, sizeof(one)) < 0)
1023 log_unit_warning_errno(UNIT(s), errno, "SO_KEEPALIVE failed: %m");
1024 }
1025
1026 if (s->keep_alive_time > 0) {
1027 int value = s->keep_alive_time / USEC_PER_SEC;
1028 if (setsockopt(fd, SOL_TCP, TCP_KEEPIDLE, &value, sizeof(value)) < 0)
1029 log_unit_warning_errno(UNIT(s), errno, "TCP_KEEPIDLE failed: %m");
1030 }
1031
1032 if (s->keep_alive_interval > 0) {
1033 int value = s->keep_alive_interval / USEC_PER_SEC;
1034 if (setsockopt(fd, SOL_TCP, TCP_KEEPINTVL, &value, sizeof(value)) < 0)
1035 log_unit_warning_errno(UNIT(s), errno, "TCP_KEEPINTVL failed: %m");
1036 }
1037
1038 if (s->keep_alive_cnt > 0) {
1039 int value = s->keep_alive_cnt;
1040 if (setsockopt(fd, SOL_TCP, TCP_KEEPCNT, &value, sizeof(value)) < 0)
1041 log_unit_warning_errno(UNIT(s), errno, "TCP_KEEPCNT failed: %m");
1042 }
1043
1044 if (s->defer_accept > 0) {
1045 int value = s->defer_accept / USEC_PER_SEC;
1046 if (setsockopt(fd, SOL_TCP, TCP_DEFER_ACCEPT, &value, sizeof(value)) < 0)
1047 log_unit_warning_errno(UNIT(s), errno, "TCP_DEFER_ACCEPT failed: %m");
1048 }
1049
1050 if (s->no_delay) {
1051 int one = 1;
1052
1053 if (s->socket_protocol == IPPROTO_SCTP) {
1054 if (setsockopt(fd, SOL_SCTP, SCTP_NODELAY, &one, sizeof(one)) < 0)
1055 log_unit_warning_errno(UNIT(s), errno, "SCTP_NODELAY failed: %m");
1056 } else {
1057 if (setsockopt(fd, SOL_TCP, TCP_NODELAY, &one, sizeof(one)) < 0)
1058 log_unit_warning_errno(UNIT(s), errno, "TCP_NODELAY failed: %m");
1059 }
1060 }
1061
1062 if (s->broadcast) {
1063 int one = 1;
1064 if (setsockopt(fd, SOL_SOCKET, SO_BROADCAST, &one, sizeof(one)) < 0)
1065 log_unit_warning_errno(UNIT(s), errno, "SO_BROADCAST failed: %m");
1066 }
1067
1068 if (s->pass_cred) {
1069 int one = 1;
1070 if (setsockopt(fd, SOL_SOCKET, SO_PASSCRED, &one, sizeof(one)) < 0)
1071 log_unit_warning_errno(UNIT(s), errno, "SO_PASSCRED failed: %m");
1072 }
1073
1074 if (s->pass_sec) {
1075 int one = 1;
1076 if (setsockopt(fd, SOL_SOCKET, SO_PASSSEC, &one, sizeof(one)) < 0)
1077 log_unit_warning_errno(UNIT(s), errno, "SO_PASSSEC failed: %m");
1078 }
1079
1080 if (s->priority >= 0)
1081 if (setsockopt(fd, SOL_SOCKET, SO_PRIORITY, &s->priority, sizeof(s->priority)) < 0)
1082 log_unit_warning_errno(UNIT(s), errno, "SO_PRIORITY failed: %m");
1083
1084 if (s->receive_buffer > 0) {
1085 int value = (int) s->receive_buffer;
1086
1087 /* We first try with SO_RCVBUFFORCE, in case we have the perms for that */
1088 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
1089 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
1090 log_unit_warning_errno(UNIT(s), errno, "SO_RCVBUF failed: %m");
1091 }
1092
1093 if (s->send_buffer > 0) {
1094 int value = (int) s->send_buffer;
1095 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
1096 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
1097 log_unit_warning_errno(UNIT(s), errno, "SO_SNDBUF failed: %m");
1098 }
1099
1100 if (s->mark >= 0)
1101 if (setsockopt(fd, SOL_SOCKET, SO_MARK, &s->mark, sizeof(s->mark)) < 0)
1102 log_unit_warning_errno(UNIT(s), errno, "SO_MARK failed: %m");
1103
1104 if (s->ip_tos >= 0)
1105 if (setsockopt(fd, IPPROTO_IP, IP_TOS, &s->ip_tos, sizeof(s->ip_tos)) < 0)
1106 log_unit_warning_errno(UNIT(s), errno, "IP_TOS failed: %m");
1107
1108 if (s->ip_ttl >= 0) {
1109 int x;
1110
1111 r = setsockopt(fd, IPPROTO_IP, IP_TTL, &s->ip_ttl, sizeof(s->ip_ttl));
1112
1113 if (socket_ipv6_is_supported())
1114 x = setsockopt(fd, IPPROTO_IPV6, IPV6_UNICAST_HOPS, &s->ip_ttl, sizeof(s->ip_ttl));
1115 else {
1116 x = -1;
1117 errno = EAFNOSUPPORT;
1118 }
1119
1120 if (r < 0 && x < 0)
1121 log_unit_warning_errno(UNIT(s), errno, "IP_TTL/IPV6_UNICAST_HOPS failed: %m");
1122 }
1123
1124 if (s->tcp_congestion)
1125 if (setsockopt(fd, SOL_TCP, TCP_CONGESTION, s->tcp_congestion, strlen(s->tcp_congestion)+1) < 0)
1126 log_unit_warning_errno(UNIT(s), errno, "TCP_CONGESTION failed: %m");
1127
1128 if (s->smack_ip_in) {
1129 r = mac_smack_apply_fd(fd, SMACK_ATTR_IPIN, s->smack_ip_in);
1130 if (r < 0)
1131 log_unit_error_errno(UNIT(s), r, "mac_smack_apply_ip_in_fd: %m");
1132 }
1133
1134 if (s->smack_ip_out) {
1135 r = mac_smack_apply_fd(fd, SMACK_ATTR_IPOUT, s->smack_ip_out);
1136 if (r < 0)
1137 log_unit_error_errno(UNIT(s), r, "mac_smack_apply_ip_out_fd: %m");
1138 }
1139 }
1140
1141 static void socket_apply_fifo_options(Socket *s, int fd) {
1142 int r;
1143
1144 assert(s);
1145 assert(fd >= 0);
1146
1147 if (s->pipe_size > 0)
1148 if (fcntl(fd, F_SETPIPE_SZ, s->pipe_size) < 0)
1149 log_unit_warning_errno(UNIT(s), errno, "Setting pipe size failed, ignoring: %m");
1150
1151 if (s->smack) {
1152 r = mac_smack_apply_fd(fd, SMACK_ATTR_ACCESS, s->smack);
1153 if (r < 0)
1154 log_unit_error_errno(UNIT(s), r, "SMACK relabelling failed, ignoring: %m");
1155 }
1156 }
1157
1158 static int fifo_address_create(
1159 const char *path,
1160 mode_t directory_mode,
1161 mode_t socket_mode) {
1162
1163 _cleanup_close_ int fd = -1;
1164 mode_t old_mask;
1165 struct stat st;
1166 int r;
1167
1168 assert(path);
1169
1170 (void) mkdir_parents_label(path, directory_mode);
1171
1172 r = mac_selinux_create_file_prepare(path, S_IFIFO);
1173 if (r < 0)
1174 return r;
1175
1176 /* Enforce the right access mode for the fifo */
1177 old_mask = umask(~socket_mode);
1178
1179 /* Include the original umask in our mask */
1180 (void) umask(~socket_mode | old_mask);
1181
1182 r = mkfifo(path, socket_mode);
1183 (void) umask(old_mask);
1184
1185 if (r < 0 && errno != EEXIST) {
1186 r = -errno;
1187 goto fail;
1188 }
1189
1190 fd = open(path, O_RDWR | O_CLOEXEC | O_NOCTTY | O_NONBLOCK | O_NOFOLLOW);
1191 if (fd < 0) {
1192 r = -errno;
1193 goto fail;
1194 }
1195
1196 mac_selinux_create_file_clear();
1197
1198 if (fstat(fd, &st) < 0) {
1199 r = -errno;
1200 goto fail;
1201 }
1202
1203 if (!S_ISFIFO(st.st_mode) ||
1204 (st.st_mode & 0777) != (socket_mode & ~old_mask) ||
1205 st.st_uid != getuid() ||
1206 st.st_gid != getgid()) {
1207 r = -EEXIST;
1208 goto fail;
1209 }
1210
1211 return TAKE_FD(fd);
1212
1213 fail:
1214 mac_selinux_create_file_clear();
1215 return r;
1216 }
1217
1218 static int special_address_create(const char *path, bool writable) {
1219 _cleanup_close_ int fd = -1;
1220 struct stat st;
1221
1222 assert(path);
1223
1224 fd = open(path, (writable ? O_RDWR : O_RDONLY)|O_CLOEXEC|O_NOCTTY|O_NONBLOCK|O_NOFOLLOW);
1225 if (fd < 0)
1226 return -errno;
1227
1228 if (fstat(fd, &st) < 0)
1229 return -errno;
1230
1231 /* Check whether this is a /proc, /sys or /dev file or char device */
1232 if (!S_ISREG(st.st_mode) && !S_ISCHR(st.st_mode))
1233 return -EEXIST;
1234
1235 return TAKE_FD(fd);
1236 }
1237
1238 static int usbffs_address_create(const char *path) {
1239 _cleanup_close_ int fd = -1;
1240 struct stat st;
1241
1242 assert(path);
1243
1244 fd = open(path, O_RDWR|O_CLOEXEC|O_NOCTTY|O_NONBLOCK|O_NOFOLLOW);
1245 if (fd < 0)
1246 return -errno;
1247
1248 if (fstat(fd, &st) < 0)
1249 return -errno;
1250
1251 /* Check whether this is a regular file (ffs endpoint) */
1252 if (!S_ISREG(st.st_mode))
1253 return -EEXIST;
1254
1255 return TAKE_FD(fd);
1256 }
1257
1258 static int mq_address_create(
1259 const char *path,
1260 mode_t mq_mode,
1261 long maxmsg,
1262 long msgsize) {
1263
1264 _cleanup_close_ int fd = -1;
1265 struct stat st;
1266 mode_t old_mask;
1267 struct mq_attr _attr, *attr = NULL;
1268
1269 assert(path);
1270
1271 if (maxmsg > 0 && msgsize > 0) {
1272 _attr = (struct mq_attr) {
1273 .mq_flags = O_NONBLOCK,
1274 .mq_maxmsg = maxmsg,
1275 .mq_msgsize = msgsize,
1276 };
1277 attr = &_attr;
1278 }
1279
1280 /* Enforce the right access mode for the mq */
1281 old_mask = umask(~mq_mode);
1282
1283 /* Include the original umask in our mask */
1284 (void) umask(~mq_mode | old_mask);
1285 fd = mq_open(path, O_RDONLY|O_CLOEXEC|O_NONBLOCK|O_CREAT, mq_mode, attr);
1286 (void) umask(old_mask);
1287
1288 if (fd < 0)
1289 return -errno;
1290
1291 if (fstat(fd, &st) < 0)
1292 return -errno;
1293
1294 if ((st.st_mode & 0777) != (mq_mode & ~old_mask) ||
1295 st.st_uid != getuid() ||
1296 st.st_gid != getgid())
1297 return -EEXIST;
1298
1299 return TAKE_FD(fd);
1300 }
1301
1302 static int socket_symlink(Socket *s) {
1303 const char *p;
1304 char **i;
1305 int r;
1306
1307 assert(s);
1308
1309 p = socket_find_symlink_target(s);
1310 if (!p)
1311 return 0;
1312
1313 STRV_FOREACH(i, s->symlinks) {
1314 (void) mkdir_parents_label(*i, s->directory_mode);
1315
1316 r = symlink_idempotent(p, *i, false);
1317
1318 if (r == -EEXIST && s->remove_on_stop) {
1319 /* If there's already something where we want to create the symlink, and the destructive
1320 * RemoveOnStop= mode is set, then we might as well try to remove what already exists and try
1321 * again. */
1322
1323 if (unlink(*i) >= 0)
1324 r = symlink_idempotent(p, *i, false);
1325 }
1326
1327 if (r < 0)
1328 log_unit_warning_errno(UNIT(s), r, "Failed to create symlink %s → %s, ignoring: %m", p, *i);
1329 }
1330
1331 return 0;
1332 }
1333
1334 static int usbffs_write_descs(int fd, Service *s) {
1335 int r;
1336
1337 if (!s->usb_function_descriptors || !s->usb_function_strings)
1338 return -EINVAL;
1339
1340 r = copy_file_fd(s->usb_function_descriptors, fd, 0);
1341 if (r < 0)
1342 return r;
1343
1344 return copy_file_fd(s->usb_function_strings, fd, 0);
1345 }
1346
static int usbffs_select_ep(const struct dirent *d) {
        /* scandir() filter: skip entries starting with a dot, and skip "ep0" */

        if (d->d_name[0] == '.')
                return 0;

        return !streq(d->d_name, "ep0");
}
1350
1351 static int usbffs_dispatch_eps(SocketPort *p) {
1352 _cleanup_free_ struct dirent **ent = NULL;
1353 size_t n, k, i;
1354 int r;
1355
1356 r = scandir(p->path, &ent, usbffs_select_ep, alphasort);
1357 if (r < 0)
1358 return -errno;
1359
1360 n = (size_t) r;
1361 p->auxiliary_fds = new(int, n);
1362 if (!p->auxiliary_fds) {
1363 r = -ENOMEM;
1364 goto clear;
1365 }
1366
1367 p->n_auxiliary_fds = n;
1368
1369 k = 0;
1370 for (i = 0; i < n; ++i) {
1371 _cleanup_free_ char *ep = NULL;
1372
1373 ep = path_make_absolute(ent[i]->d_name, p->path);
1374 if (!ep) {
1375 r = -ENOMEM;
1376 goto fail;
1377 }
1378
1379 path_simplify(ep, false);
1380
1381 r = usbffs_address_create(ep);
1382 if (r < 0)
1383 goto fail;
1384
1385 p->auxiliary_fds[k++] = r;
1386 }
1387
1388 r = 0;
1389 goto clear;
1390
1391 fail:
1392 close_many(p->auxiliary_fds, k);
1393 p->auxiliary_fds = mfree(p->auxiliary_fds);
1394 p->n_auxiliary_fds = 0;
1395
1396 clear:
1397 for (i = 0; i < n; ++i)
1398 free(ent[i]);
1399
1400 return r;
1401 }
1402
1403 static int socket_determine_selinux_label(Socket *s, char **ret) {
1404 Service *service;
1405 ExecCommand *c;
1406 _cleanup_free_ char *path = NULL;
1407 int r;
1408
1409 assert(s);
1410 assert(ret);
1411
1412 if (s->selinux_context_from_net) {
1413 /* If this is requested, get label from the network label */
1414
1415 r = mac_selinux_get_our_label(ret);
1416 if (r == -EOPNOTSUPP)
1417 goto no_label;
1418
1419 } else {
1420 /* Otherwise, get it from the executable we are about to start */
1421 r = socket_instantiate_service(s);
1422 if (r < 0)
1423 return r;
1424
1425 if (!UNIT_ISSET(s->service))
1426 goto no_label;
1427
1428 service = SERVICE(UNIT_DEREF(s->service));
1429 c = service->exec_command[SERVICE_EXEC_START];
1430 if (!c)
1431 goto no_label;
1432
1433 r = chase_symlinks(c->path, service->exec_context.root_directory, CHASE_PREFIX_ROOT, &path);
1434 if (r < 0)
1435 goto no_label;
1436
1437 r = mac_selinux_get_create_label_from_exe(path, ret);
1438 if (IN_SET(r, -EPERM, -EOPNOTSUPP))
1439 goto no_label;
1440 }
1441
1442 return r;
1443
1444 no_label:
1445 *ret = NULL;
1446 return 0;
1447 }
1448
1449 static int socket_address_listen_do(
1450 Socket *s,
1451 const SocketAddress *address,
1452 const char *label) {
1453
1454 assert(s);
1455 assert(address);
1456
1457 return socket_address_listen(
1458 address,
1459 SOCK_CLOEXEC|SOCK_NONBLOCK,
1460 s->backlog,
1461 s->bind_ipv6_only,
1462 s->bind_to_device,
1463 s->reuse_port,
1464 s->free_bind,
1465 s->transparent,
1466 s->directory_mode,
1467 s->socket_mode,
1468 label);
1469 }
1470
1471 static int socket_address_listen_in_cgroup(
1472 Socket *s,
1473 const SocketAddress *address,
1474 const char *label) {
1475
1476 _cleanup_close_pair_ int pair[2] = { -1, -1 };
1477 int fd, r;
1478 pid_t pid;
1479
1480 assert(s);
1481 assert(address);
1482
1483 /* This is a wrapper around socket_address_listen(), that forks off a helper process inside the socket's cgroup
1484 * in which the socket is actually created. This way we ensure the socket is actually properly attached to the
1485 * unit's cgroup for the purpose of BPF filtering and such. */
1486
1487 if (!IN_SET(address->sockaddr.sa.sa_family, AF_INET, AF_INET6))
1488 goto shortcut; /* BPF filtering only applies to IPv4 + IPv6, shortcut things for other protocols */
1489
1490 r = bpf_firewall_supported();
1491 if (r < 0)
1492 return r;
1493 if (r == BPF_FIREWALL_UNSUPPORTED) /* If BPF firewalling isn't supported anyway — there's no point in this forking complexity */
1494 goto shortcut;
1495
1496 if (socketpair(AF_UNIX, SOCK_SEQPACKET|SOCK_CLOEXEC, 0, pair) < 0)
1497 return log_unit_error_errno(UNIT(s), errno, "Failed to create communication channel: %m");
1498
1499 r = unit_fork_helper_process(UNIT(s), "(sd-listen)", &pid);
1500 if (r < 0)
1501 return log_unit_error_errno(UNIT(s), r, "Failed to fork off listener stub process: %m");
1502 if (r == 0) {
1503 /* Child */
1504
1505 pair[0] = safe_close(pair[0]);
1506
1507 fd = socket_address_listen_do(s, address, label);
1508 if (fd < 0) {
1509 log_unit_error_errno(UNIT(s), fd, "Failed to create listening socket: %m");
1510 _exit(EXIT_FAILURE);
1511 }
1512
1513 r = send_one_fd(pair[1], fd, 0);
1514 if (r < 0) {
1515 log_unit_error_errno(UNIT(s), r, "Failed to send listening socket to parent: %m");
1516 _exit(EXIT_FAILURE);
1517 }
1518
1519 _exit(EXIT_SUCCESS);
1520 }
1521
1522 pair[1] = safe_close(pair[1]);
1523 fd = receive_one_fd(pair[0], 0);
1524
1525 /* We synchronously wait for the helper, as it shouldn't be slow */
1526 r = wait_for_terminate_and_check("(sd-listen)", pid, WAIT_LOG_ABNORMAL);
1527 if (r < 0) {
1528 safe_close(fd);
1529 return r;
1530 }
1531
1532 if (fd < 0)
1533 return log_unit_error_errno(UNIT(s), fd, "Failed to receive listening socket: %m");
1534
1535 return fd;
1536
1537 shortcut:
1538 fd = socket_address_listen_do(s, address, label);
1539 if (fd < 0)
1540 return log_error_errno(fd, "Failed to create listening socket: %m");
1541
1542 return fd;
1543 }
1544
1545 static int socket_open_fds(Socket *s) {
1546 _cleanup_(mac_selinux_freep) char *label = NULL;
1547 bool know_label = false;
1548 SocketPort *p;
1549 int r;
1550
1551 assert(s);
1552
1553 LIST_FOREACH(port, p, s->ports) {
1554
1555 if (p->fd >= 0)
1556 continue;
1557
1558 switch (p->type) {
1559
1560 case SOCKET_SOCKET:
1561
1562 if (!know_label) {
1563 /* Figure out label, if we don't it know yet. We do it once, for the first socket where
1564 * we need this and remember it for the rest. */
1565
1566 r = socket_determine_selinux_label(s, &label);
1567 if (r < 0)
1568 goto rollback;
1569
1570 know_label = true;
1571 }
1572
1573 /* Apply the socket protocol */
1574 switch (p->address.type) {
1575
1576 case SOCK_STREAM:
1577 case SOCK_SEQPACKET:
1578 if (s->socket_protocol == IPPROTO_SCTP)
1579 p->address.protocol = s->socket_protocol;
1580 break;
1581
1582 case SOCK_DGRAM:
1583 if (s->socket_protocol == IPPROTO_UDPLITE)
1584 p->address.protocol = s->socket_protocol;
1585 break;
1586 }
1587
1588 r = socket_address_listen_in_cgroup(s, &p->address, label);
1589 if (r < 0)
1590 goto rollback;
1591
1592 p->fd = r;
1593 socket_apply_socket_options(s, p->fd);
1594 socket_symlink(s);
1595 break;
1596
1597 case SOCKET_SPECIAL:
1598
1599 p->fd = special_address_create(p->path, s->writable);
1600 if (p->fd < 0) {
1601 r = p->fd;
1602 goto rollback;
1603 }
1604 break;
1605
1606 case SOCKET_FIFO:
1607
1608 p->fd = fifo_address_create(
1609 p->path,
1610 s->directory_mode,
1611 s->socket_mode);
1612 if (p->fd < 0) {
1613 r = p->fd;
1614 goto rollback;
1615 }
1616
1617 socket_apply_fifo_options(s, p->fd);
1618 socket_symlink(s);
1619 break;
1620
1621 case SOCKET_MQUEUE:
1622
1623 p->fd = mq_address_create(
1624 p->path,
1625 s->socket_mode,
1626 s->mq_maxmsg,
1627 s->mq_msgsize);
1628 if (p->fd < 0) {
1629 r = p->fd;
1630 goto rollback;
1631 }
1632 break;
1633
1634 case SOCKET_USB_FUNCTION: {
1635 _cleanup_free_ char *ep = NULL;
1636
1637 ep = path_make_absolute("ep0", p->path);
1638
1639 p->fd = usbffs_address_create(ep);
1640 if (p->fd < 0) {
1641 r = p->fd;
1642 goto rollback;
1643 }
1644
1645 r = usbffs_write_descs(p->fd, SERVICE(UNIT_DEREF(s->service)));
1646 if (r < 0)
1647 goto rollback;
1648
1649 r = usbffs_dispatch_eps(p);
1650 if (r < 0)
1651 goto rollback;
1652
1653 break;
1654 }
1655 default:
1656 assert_not_reached("Unknown port type");
1657 }
1658 }
1659
1660 return 0;
1661
1662 rollback:
1663 socket_close_fds(s);
1664 return r;
1665 }
1666
1667 static void socket_unwatch_fds(Socket *s) {
1668 SocketPort *p;
1669 int r;
1670
1671 assert(s);
1672
1673 LIST_FOREACH(port, p, s->ports) {
1674 if (p->fd < 0)
1675 continue;
1676
1677 if (!p->event_source)
1678 continue;
1679
1680 r = sd_event_source_set_enabled(p->event_source, SD_EVENT_OFF);
1681 if (r < 0)
1682 log_unit_debug_errno(UNIT(s), r, "Failed to disable event source: %m");
1683 }
1684 }
1685
1686 static int socket_watch_fds(Socket *s) {
1687 SocketPort *p;
1688 int r;
1689
1690 assert(s);
1691
1692 LIST_FOREACH(port, p, s->ports) {
1693 if (p->fd < 0)
1694 continue;
1695
1696 if (p->event_source) {
1697 r = sd_event_source_set_enabled(p->event_source, SD_EVENT_ON);
1698 if (r < 0)
1699 goto fail;
1700 } else {
1701 r = sd_event_add_io(UNIT(s)->manager->event, &p->event_source, p->fd, EPOLLIN, socket_dispatch_io, p);
1702 if (r < 0)
1703 goto fail;
1704
1705 (void) sd_event_source_set_description(p->event_source, "socket-port-io");
1706 }
1707 }
1708
1709 return 0;
1710
1711 fail:
1712 log_unit_warning_errno(UNIT(s), r, "Failed to watch listening fds: %m");
1713 socket_unwatch_fds(s);
1714 return r;
1715 }
1716
/* Result values of socket_check_open() */
enum {
        SOCKET_OPEN_NONE = 0, /* no port has an open fd */
        SOCKET_OPEN_SOME = 1, /* some ports have an open fd, some do not */
        SOCKET_OPEN_ALL  = 2, /* at least one port exists and all of them have an open fd */
};
1722
1723 static int socket_check_open(Socket *s) {
1724 bool have_open = false, have_closed = false;
1725 SocketPort *p;
1726
1727 assert(s);
1728
1729 LIST_FOREACH(port, p, s->ports) {
1730 if (p->fd < 0)
1731 have_closed = true;
1732 else
1733 have_open = true;
1734
1735 if (have_open && have_closed)
1736 return SOCKET_OPEN_SOME;
1737 }
1738
1739 if (have_open)
1740 return SOCKET_OPEN_ALL;
1741
1742 return SOCKET_OPEN_NONE;
1743 }
1744
1745 static void socket_set_state(Socket *s, SocketState state) {
1746 SocketState old_state;
1747 assert(s);
1748
1749 old_state = s->state;
1750 s->state = state;
1751
1752 if (!IN_SET(state,
1753 SOCKET_START_PRE,
1754 SOCKET_START_CHOWN,
1755 SOCKET_START_POST,
1756 SOCKET_STOP_PRE,
1757 SOCKET_STOP_PRE_SIGTERM,
1758 SOCKET_STOP_PRE_SIGKILL,
1759 SOCKET_STOP_POST,
1760 SOCKET_FINAL_SIGTERM,
1761 SOCKET_FINAL_SIGKILL)) {
1762
1763 s->timer_event_source = sd_event_source_unref(s->timer_event_source);
1764 socket_unwatch_control_pid(s);
1765 s->control_command = NULL;
1766 s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
1767 }
1768
1769 if (state != SOCKET_LISTENING)
1770 socket_unwatch_fds(s);
1771
1772 if (!IN_SET(state,
1773 SOCKET_START_CHOWN,
1774 SOCKET_START_POST,
1775 SOCKET_LISTENING,
1776 SOCKET_RUNNING,
1777 SOCKET_STOP_PRE,
1778 SOCKET_STOP_PRE_SIGTERM,
1779 SOCKET_STOP_PRE_SIGKILL))
1780 socket_close_fds(s);
1781
1782 if (state != old_state)
1783 log_unit_debug(UNIT(s), "Changed %s -> %s", socket_state_to_string(old_state), socket_state_to_string(state));
1784
1785 unit_notify(UNIT(s), state_translation_table[old_state], state_translation_table[state], 0);
1786 }
1787
1788 static int socket_coldplug(Unit *u) {
1789 Socket *s = SOCKET(u);
1790 int r;
1791
1792 assert(s);
1793 assert(s->state == SOCKET_DEAD);
1794
1795 if (s->deserialized_state == s->state)
1796 return 0;
1797
1798 if (s->control_pid > 0 &&
1799 pid_is_unwaited(s->control_pid) &&
1800 IN_SET(s->deserialized_state,
1801 SOCKET_START_PRE,
1802 SOCKET_START_CHOWN,
1803 SOCKET_START_POST,
1804 SOCKET_STOP_PRE,
1805 SOCKET_STOP_PRE_SIGTERM,
1806 SOCKET_STOP_PRE_SIGKILL,
1807 SOCKET_STOP_POST,
1808 SOCKET_FINAL_SIGTERM,
1809 SOCKET_FINAL_SIGKILL)) {
1810
1811 r = unit_watch_pid(UNIT(s), s->control_pid);
1812 if (r < 0)
1813 return r;
1814
1815 r = socket_arm_timer(s, usec_add(u->state_change_timestamp.monotonic, s->timeout_usec));
1816 if (r < 0)
1817 return r;
1818 }
1819
1820 if (IN_SET(s->deserialized_state,
1821 SOCKET_START_CHOWN,
1822 SOCKET_START_POST,
1823 SOCKET_LISTENING,
1824 SOCKET_RUNNING)) {
1825
1826 /* Originally, we used to simply reopen all sockets here that we didn't have file descriptors
1827 * for. However, this is problematic, as we won't traverse throught the SOCKET_START_CHOWN state for
1828 * them, and thus the UID/GID wouldn't be right. Hence, instead simply check if we have all fds open,
1829 * and if there's a mismatch, warn loudly. */
1830
1831 r = socket_check_open(s);
1832 if (r == SOCKET_OPEN_NONE)
1833 log_unit_warning(UNIT(s),
1834 "Socket unit configuration has changed while unit has been running, "
1835 "no open socket file descriptor left. "
1836 "The socket unit is not functional until restarted.");
1837 else if (r == SOCKET_OPEN_SOME)
1838 log_unit_warning(UNIT(s),
1839 "Socket unit configuration has changed while unit has been running, "
1840 "and some socket file descriptors have not been opened yet. "
1841 "The socket unit is not fully functional until restarted.");
1842 }
1843
1844 if (s->deserialized_state == SOCKET_LISTENING) {
1845 r = socket_watch_fds(s);
1846 if (r < 0)
1847 return r;
1848 }
1849
1850 if (!IN_SET(s->deserialized_state, SOCKET_DEAD, SOCKET_FAILED)) {
1851 (void) unit_setup_dynamic_creds(u);
1852 (void) unit_setup_exec_runtime(u);
1853 }
1854
1855 socket_set_state(s, s->deserialized_state);
1856 return 0;
1857 }
1858
1859 static int socket_spawn(Socket *s, ExecCommand *c, pid_t *_pid) {
1860
1861 ExecParameters exec_params = {
1862 .flags = EXEC_APPLY_SANDBOXING|EXEC_APPLY_CHROOT|EXEC_APPLY_TTY_STDIN,
1863 .stdin_fd = -1,
1864 .stdout_fd = -1,
1865 .stderr_fd = -1,
1866 .exec_fd = -1,
1867 };
1868 pid_t pid;
1869 int r;
1870
1871 assert(s);
1872 assert(c);
1873 assert(_pid);
1874
1875 r = unit_prepare_exec(UNIT(s));
1876 if (r < 0)
1877 return r;
1878
1879 r = socket_arm_timer(s, usec_add(now(CLOCK_MONOTONIC), s->timeout_usec));
1880 if (r < 0)
1881 return r;
1882
1883 unit_set_exec_params(UNIT(s), &exec_params);
1884
1885 r = exec_spawn(UNIT(s),
1886 c,
1887 &s->exec_context,
1888 &exec_params,
1889 s->exec_runtime,
1890 &s->dynamic_creds,
1891 &pid);
1892 if (r < 0)
1893 return r;
1894
1895 r = unit_watch_pid(UNIT(s), pid);
1896 if (r < 0)
1897 /* FIXME: we need to do something here */
1898 return r;
1899
1900 *_pid = pid;
1901
1902 return 0;
1903 }
1904
1905 static int socket_chown(Socket *s, pid_t *_pid) {
1906 pid_t pid;
1907 int r;
1908
1909 r = socket_arm_timer(s, usec_add(now(CLOCK_MONOTONIC), s->timeout_usec));
1910 if (r < 0)
1911 goto fail;
1912
1913 /* We have to resolve the user names out-of-process, hence
1914 * let's fork here. It's messy, but well, what can we do? */
1915
1916 r = unit_fork_helper_process(UNIT(s), "(sd-chown)", &pid);
1917 if (r < 0)
1918 return r;
1919 if (r == 0) {
1920 uid_t uid = UID_INVALID;
1921 gid_t gid = GID_INVALID;
1922 SocketPort *p;
1923
1924 /* Child */
1925
1926 if (!isempty(s->user)) {
1927 const char *user = s->user;
1928
1929 r = get_user_creds(&user, &uid, &gid, NULL, NULL, 0);
1930 if (r < 0) {
1931 log_unit_error_errno(UNIT(s), r, "Failed to resolve user %s: %m", user);
1932 _exit(EXIT_USER);
1933 }
1934 }
1935
1936 if (!isempty(s->group)) {
1937 const char *group = s->group;
1938
1939 r = get_group_creds(&group, &gid, 0);
1940 if (r < 0) {
1941 log_unit_error_errno(UNIT(s), r, "Failed to resolve group %s: %m", group);
1942 _exit(EXIT_GROUP);
1943 }
1944 }
1945
1946 LIST_FOREACH(port, p, s->ports) {
1947 const char *path = NULL;
1948
1949 if (p->type == SOCKET_SOCKET)
1950 path = socket_address_get_path(&p->address);
1951 else if (p->type == SOCKET_FIFO)
1952 path = p->path;
1953
1954 if (!path)
1955 continue;
1956
1957 if (chown(path, uid, gid) < 0) {
1958 log_unit_error_errno(UNIT(s), errno, "Failed to chown(): %m");
1959 _exit(EXIT_CHOWN);
1960 }
1961 }
1962
1963 _exit(EXIT_SUCCESS);
1964 }
1965
1966 r = unit_watch_pid(UNIT(s), pid);
1967 if (r < 0)
1968 goto fail;
1969
1970 *_pid = pid;
1971 return 0;
1972
1973 fail:
1974 s->timer_event_source = sd_event_source_unref(s->timer_event_source);
1975 return r;
1976 }
1977
1978 static void socket_enter_dead(Socket *s, SocketResult f) {
1979 assert(s);
1980
1981 if (s->result == SOCKET_SUCCESS)
1982 s->result = f;
1983
1984 if (s->result != SOCKET_SUCCESS)
1985 log_unit_warning(UNIT(s), "Failed with result '%s'.", socket_result_to_string(s->result));
1986
1987 socket_set_state(s, s->result != SOCKET_SUCCESS ? SOCKET_FAILED : SOCKET_DEAD);
1988
1989 s->exec_runtime = exec_runtime_unref(s->exec_runtime, true);
1990
1991 exec_context_destroy_runtime_directory(&s->exec_context, UNIT(s)->manager->prefix[EXEC_DIRECTORY_RUNTIME]);
1992
1993 unit_unref_uid_gid(UNIT(s), true);
1994
1995 dynamic_creds_destroy(&s->dynamic_creds);
1996 }
1997
1998 static void socket_enter_signal(Socket *s, SocketState state, SocketResult f);
1999
2000 static void socket_enter_stop_post(Socket *s, SocketResult f) {
2001 int r;
2002 assert(s);
2003
2004 if (s->result == SOCKET_SUCCESS)
2005 s->result = f;
2006
2007 socket_unwatch_control_pid(s);
2008 s->control_command_id = SOCKET_EXEC_STOP_POST;
2009 s->control_command = s->exec_command[SOCKET_EXEC_STOP_POST];
2010
2011 if (s->control_command) {
2012 r = socket_spawn(s, s->control_command, &s->control_pid);
2013 if (r < 0)
2014 goto fail;
2015
2016 socket_set_state(s, SOCKET_STOP_POST);
2017 } else
2018 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, SOCKET_SUCCESS);
2019
2020 return;
2021
2022 fail:
2023 log_unit_warning_errno(UNIT(s), r, "Failed to run 'stop-post' task: %m");
2024 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, SOCKET_FAILURE_RESOURCES);
2025 }
2026
2027 static void socket_enter_signal(Socket *s, SocketState state, SocketResult f) {
2028 int r;
2029
2030 assert(s);
2031
2032 if (s->result == SOCKET_SUCCESS)
2033 s->result = f;
2034
2035 r = unit_kill_context(
2036 UNIT(s),
2037 &s->kill_context,
2038 !IN_SET(state, SOCKET_STOP_PRE_SIGTERM, SOCKET_FINAL_SIGTERM) ?
2039 KILL_KILL : KILL_TERMINATE,
2040 -1,
2041 s->control_pid,
2042 false);
2043 if (r < 0)
2044 goto fail;
2045
2046 if (r > 0) {
2047 r = socket_arm_timer(s, usec_add(now(CLOCK_MONOTONIC), s->timeout_usec));
2048 if (r < 0)
2049 goto fail;
2050
2051 socket_set_state(s, state);
2052 } else if (state == SOCKET_STOP_PRE_SIGTERM)
2053 socket_enter_signal(s, SOCKET_STOP_PRE_SIGKILL, SOCKET_SUCCESS);
2054 else if (state == SOCKET_STOP_PRE_SIGKILL)
2055 socket_enter_stop_post(s, SOCKET_SUCCESS);
2056 else if (state == SOCKET_FINAL_SIGTERM)
2057 socket_enter_signal(s, SOCKET_FINAL_SIGKILL, SOCKET_SUCCESS);
2058 else
2059 socket_enter_dead(s, SOCKET_SUCCESS);
2060
2061 return;
2062
2063 fail:
2064 log_unit_warning_errno(UNIT(s), r, "Failed to kill processes: %m");
2065
2066 if (IN_SET(state, SOCKET_STOP_PRE_SIGTERM, SOCKET_STOP_PRE_SIGKILL))
2067 socket_enter_stop_post(s, SOCKET_FAILURE_RESOURCES);
2068 else
2069 socket_enter_dead(s, SOCKET_FAILURE_RESOURCES);
2070 }
2071
2072 static void socket_enter_stop_pre(Socket *s, SocketResult f) {
2073 int r;
2074 assert(s);
2075
2076 if (s->result == SOCKET_SUCCESS)
2077 s->result = f;
2078
2079 socket_unwatch_control_pid(s);
2080 s->control_command_id = SOCKET_EXEC_STOP_PRE;
2081 s->control_command = s->exec_command[SOCKET_EXEC_STOP_PRE];
2082
2083 if (s->control_command) {
2084 r = socket_spawn(s, s->control_command, &s->control_pid);
2085 if (r < 0)
2086 goto fail;
2087
2088 socket_set_state(s, SOCKET_STOP_PRE);
2089 } else
2090 socket_enter_stop_post(s, SOCKET_SUCCESS);
2091
2092 return;
2093
2094 fail:
2095 log_unit_warning_errno(UNIT(s), r, "Failed to run 'stop-pre' task: %m");
2096 socket_enter_stop_post(s, SOCKET_FAILURE_RESOURCES);
2097 }
2098
2099 static void socket_enter_listening(Socket *s) {
2100 int r;
2101 assert(s);
2102
2103 r = socket_watch_fds(s);
2104 if (r < 0) {
2105 log_unit_warning_errno(UNIT(s), r, "Failed to watch sockets: %m");
2106 goto fail;
2107 }
2108
2109 socket_set_state(s, SOCKET_LISTENING);
2110 return;
2111
2112 fail:
2113 socket_enter_stop_pre(s, SOCKET_FAILURE_RESOURCES);
2114 }
2115
2116 static void socket_enter_start_post(Socket *s) {
2117 int r;
2118 assert(s);
2119
2120 socket_unwatch_control_pid(s);
2121 s->control_command_id = SOCKET_EXEC_START_POST;
2122 s->control_command = s->exec_command[SOCKET_EXEC_START_POST];
2123
2124 if (s->control_command) {
2125 r = socket_spawn(s, s->control_command, &s->control_pid);
2126 if (r < 0) {
2127 log_unit_warning_errno(UNIT(s), r, "Failed to run 'start-post' task: %m");
2128 goto fail;
2129 }
2130
2131 socket_set_state(s, SOCKET_START_POST);
2132 } else
2133 socket_enter_listening(s);
2134
2135 return;
2136
2137 fail:
2138 socket_enter_stop_pre(s, SOCKET_FAILURE_RESOURCES);
2139 }
2140
2141 static void socket_enter_start_chown(Socket *s) {
2142 int r;
2143
2144 assert(s);
2145
2146 r = socket_open_fds(s);
2147 if (r < 0) {
2148 log_unit_warning_errno(UNIT(s), r, "Failed to listen on sockets: %m");
2149 goto fail;
2150 }
2151
2152 if (!isempty(s->user) || !isempty(s->group)) {
2153
2154 socket_unwatch_control_pid(s);
2155 s->control_command_id = SOCKET_EXEC_START_CHOWN;
2156 s->control_command = NULL;
2157
2158 r = socket_chown(s, &s->control_pid);
2159 if (r < 0) {
2160 log_unit_warning_errno(UNIT(s), r, "Failed to fork 'start-chown' task: %m");
2161 goto fail;
2162 }
2163
2164 socket_set_state(s, SOCKET_START_CHOWN);
2165 } else
2166 socket_enter_start_post(s);
2167
2168 return;
2169
2170 fail:
2171 socket_enter_stop_pre(s, SOCKET_FAILURE_RESOURCES);
2172 }
2173
2174 static void socket_enter_start_pre(Socket *s) {
2175 int r;
2176 assert(s);
2177
2178 socket_unwatch_control_pid(s);
2179
2180 unit_warn_leftover_processes(UNIT(s));
2181
2182 s->control_command_id = SOCKET_EXEC_START_PRE;
2183 s->control_command = s->exec_command[SOCKET_EXEC_START_PRE];
2184
2185 if (s->control_command) {
2186 r = socket_spawn(s, s->control_command, &s->control_pid);
2187 if (r < 0) {
2188 log_unit_warning_errno(UNIT(s), r, "Failed to run 'start-pre' task: %m");
2189 goto fail;
2190 }
2191
2192 socket_set_state(s, SOCKET_START_PRE);
2193 } else
2194 socket_enter_start_chown(s);
2195
2196 return;
2197
2198 fail:
2199 socket_enter_dead(s, SOCKET_FAILURE_RESOURCES);
2200 }
2201
2202 static void flush_ports(Socket *s) {
2203 SocketPort *p;
2204
2205 /* Flush all incoming traffic, regardless if actual bytes or new connections, so that this socket isn't busy
2206 * anymore */
2207
2208 LIST_FOREACH(port, p, s->ports) {
2209 if (p->fd < 0)
2210 continue;
2211
2212 (void) flush_accept(p->fd);
2213 (void) flush_fd(p->fd);
2214 }
2215 }
2216
2217 static void socket_enter_running(Socket *s, int cfd) {
2218 _cleanup_(sd_bus_error_free) sd_bus_error error = SD_BUS_ERROR_NULL;
2219 int r;
2220
2221 /* Note that this call takes possession of the connection fd passed. It either has to assign it somewhere or
2222 * close it. */
2223
2224 assert(s);
2225
2226 /* We don't take connections anymore if we are supposed to shut down anyway */
2227 if (unit_stop_pending(UNIT(s))) {
2228
2229 log_unit_debug(UNIT(s), "Suppressing connection request since unit stop is scheduled.");
2230
2231 if (cfd >= 0)
2232 goto refuse;
2233 else
2234 flush_ports(s);
2235
2236 return;
2237 }
2238
2239 if (!ratelimit_below(&s->trigger_limit)) {
2240 log_unit_warning(UNIT(s), "Trigger limit hit, refusing further activation.");
2241 socket_enter_stop_pre(s, SOCKET_FAILURE_TRIGGER_LIMIT_HIT);
2242 goto refuse;
2243 }
2244
2245 if (cfd < 0) {
2246 bool pending = false;
2247 Unit *other;
2248 Iterator i;
2249 void *v;
2250
2251 /* If there's already a start pending don't bother to
2252 * do anything */
2253 HASHMAP_FOREACH_KEY(v, other, UNIT(s)->dependencies[UNIT_TRIGGERS], i)
2254 if (unit_active_or_pending(other)) {
2255 pending = true;
2256 break;
2257 }
2258
2259 if (!pending) {
2260 if (!UNIT_ISSET(s->service)) {
2261 log_unit_error(UNIT(s), "Service to activate vanished, refusing activation.");
2262 r = -ENOENT;
2263 goto fail;
2264 }
2265
2266 r = manager_add_job(UNIT(s)->manager, JOB_START, UNIT_DEREF(s->service), JOB_REPLACE, &error, NULL);
2267 if (r < 0)
2268 goto fail;
2269 }
2270
2271 socket_set_state(s, SOCKET_RUNNING);
2272 } else {
2273 _cleanup_free_ char *prefix = NULL, *instance = NULL, *name = NULL;
2274 _cleanup_(socket_peer_unrefp) SocketPeer *p = NULL;
2275 Service *service;
2276
2277 if (s->n_connections >= s->max_connections) {
2278 log_unit_warning(UNIT(s), "Too many incoming connections (%u), dropping connection.",
2279 s->n_connections);
2280 goto refuse;
2281 }
2282
2283 if (s->max_connections_per_source > 0) {
2284 r = socket_acquire_peer(s, cfd, &p);
2285 if (r < 0) {
2286 goto refuse;
2287 } else if (r > 0 && p->n_ref > s->max_connections_per_source) {
2288 _cleanup_free_ char *t = NULL;
2289
2290 (void) sockaddr_pretty(&p->peer.sa, p->peer_salen, true, false, &t);
2291
2292 log_unit_warning(UNIT(s),
2293 "Too many incoming connections (%u) from source %s, dropping connection.",
2294 p->n_ref, strnull(t));
2295 goto refuse;
2296 }
2297 }
2298
2299 r = socket_instantiate_service(s);
2300 if (r < 0)
2301 goto fail;
2302
2303 r = instance_from_socket(cfd, s->n_accepted, &instance);
2304 if (r < 0) {
2305 if (r != -ENOTCONN)
2306 goto fail;
2307
2308 /* ENOTCONN is legitimate if TCP RST was received.
2309 * This connection is over, but the socket unit lives on. */
2310 log_unit_debug(UNIT(s), "Got ENOTCONN on incoming socket, assuming aborted connection attempt, ignoring.");
2311 goto refuse;
2312 }
2313
2314 r = unit_name_to_prefix(UNIT(s)->id, &prefix);
2315 if (r < 0)
2316 goto fail;
2317
2318 r = unit_name_build(prefix, instance, ".service", &name);
2319 if (r < 0)
2320 goto fail;
2321
2322 r = unit_add_name(UNIT_DEREF(s->service), name);
2323 if (r < 0)
2324 goto fail;
2325
2326 service = SERVICE(UNIT_DEREF(s->service));
2327 unit_ref_unset(&s->service);
2328
2329 s->n_accepted++;
2330 unit_choose_id(UNIT(service), name);
2331
2332 r = service_set_socket_fd(service, cfd, s, s->selinux_context_from_net);
2333 if (r < 0)
2334 goto fail;
2335
2336 cfd = -1; /* We passed ownership of the fd to the service now. Forget it here. */
2337 s->n_connections++;
2338
2339 service->peer = TAKE_PTR(p); /* Pass ownership of the peer reference */
2340
2341 r = manager_add_job(UNIT(s)->manager, JOB_START, UNIT(service), JOB_REPLACE, &error, NULL);
2342 if (r < 0) {
2343 /* We failed to activate the new service, but it still exists. Let's make sure the service
2344 * closes and forgets the connection fd again, immediately. */
2345 service_close_socket_fd(service);
2346 goto fail;
2347 }
2348
2349 /* Notify clients about changed counters */
2350 unit_add_to_dbus_queue(UNIT(s));
2351 }
2352
2353 return;
2354
2355 refuse:
2356 s->n_refused++;
2357 safe_close(cfd);
2358 return;
2359
2360 fail:
2361 log_unit_warning(UNIT(s), "Failed to queue service startup job (Maybe the service file is missing or not a %s unit?): %s",
2362 cfd >= 0 ? "template" : "non-template",
2363 bus_error_message(&error, r));
2364
2365 socket_enter_stop_pre(s, SOCKET_FAILURE_RESOURCES);
2366 safe_close(cfd);
2367 }
2368
2369 static void socket_run_next(Socket *s) {
2370 int r;
2371
2372 assert(s);
2373 assert(s->control_command);
2374 assert(s->control_command->command_next);
2375
2376 socket_unwatch_control_pid(s);
2377
2378 s->control_command = s->control_command->command_next;
2379
2380 r = socket_spawn(s, s->control_command, &s->control_pid);
2381 if (r < 0)
2382 goto fail;
2383
2384 return;
2385
2386 fail:
2387 log_unit_warning_errno(UNIT(s), r, "Failed to run next task: %m");
2388
2389 if (s->state == SOCKET_START_POST)
2390 socket_enter_stop_pre(s, SOCKET_FAILURE_RESOURCES);
2391 else if (s->state == SOCKET_STOP_POST)
2392 socket_enter_dead(s, SOCKET_FAILURE_RESOURCES);
2393 else
2394 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, SOCKET_FAILURE_RESOURCES);
2395 }
2396
2397 static int socket_start(Unit *u) {
2398 Socket *s = SOCKET(u);
2399 int r;
2400
2401 assert(s);
2402
2403 /* We cannot fulfill this request right now, try again later
2404 * please! */
2405 if (IN_SET(s->state,
2406 SOCKET_STOP_PRE,
2407 SOCKET_STOP_PRE_SIGKILL,
2408 SOCKET_STOP_PRE_SIGTERM,
2409 SOCKET_STOP_POST,
2410 SOCKET_FINAL_SIGTERM,
2411 SOCKET_FINAL_SIGKILL))
2412 return -EAGAIN;
2413
2414 /* Already on it! */
2415 if (IN_SET(s->state,
2416 SOCKET_START_PRE,
2417 SOCKET_START_CHOWN,
2418 SOCKET_START_POST))
2419 return 0;
2420
2421 /* Cannot run this without the service being around */
2422 if (UNIT_ISSET(s->service)) {
2423 Service *service;
2424
2425 service = SERVICE(UNIT_DEREF(s->service));
2426
2427 if (UNIT(service)->load_state != UNIT_LOADED) {
2428 log_unit_error(u, "Socket service %s not loaded, refusing.", UNIT(service)->id);
2429 return -ENOENT;
2430 }
2431
2432 /* If the service is already active we cannot start the
2433 * socket */
2434 if (!IN_SET(service->state, SERVICE_DEAD, SERVICE_FAILED, SERVICE_AUTO_RESTART)) {
2435 log_unit_error(u, "Socket service %s already active, refusing.", UNIT(service)->id);
2436 return -EBUSY;
2437 }
2438 }
2439
2440 assert(IN_SET(s->state, SOCKET_DEAD, SOCKET_FAILED));
2441
2442 r = unit_start_limit_test(u);
2443 if (r < 0) {
2444 socket_enter_dead(s, SOCKET_FAILURE_START_LIMIT_HIT);
2445 return r;
2446 }
2447
2448 r = unit_acquire_invocation_id(u);
2449 if (r < 0)
2450 return r;
2451
2452 s->result = SOCKET_SUCCESS;
2453 exec_command_reset_status_list_array(s->exec_command, _SOCKET_EXEC_COMMAND_MAX);
2454
2455 u->reset_accounting = true;
2456
2457 socket_enter_start_pre(s);
2458 return 1;
2459 }
2460
2461 static int socket_stop(Unit *u) {
2462 Socket *s = SOCKET(u);
2463
2464 assert(s);
2465
2466 /* Already on it */
2467 if (IN_SET(s->state,
2468 SOCKET_STOP_PRE,
2469 SOCKET_STOP_PRE_SIGTERM,
2470 SOCKET_STOP_PRE_SIGKILL,
2471 SOCKET_STOP_POST,
2472 SOCKET_FINAL_SIGTERM,
2473 SOCKET_FINAL_SIGKILL))
2474 return 0;
2475
2476 /* If there's already something running we go directly into
2477 * kill mode. */
2478 if (IN_SET(s->state,
2479 SOCKET_START_PRE,
2480 SOCKET_START_CHOWN,
2481 SOCKET_START_POST)) {
2482 socket_enter_signal(s, SOCKET_STOP_PRE_SIGTERM, SOCKET_SUCCESS);
2483 return -EAGAIN;
2484 }
2485
2486 assert(IN_SET(s->state, SOCKET_LISTENING, SOCKET_RUNNING));
2487
2488 socket_enter_stop_pre(s, SOCKET_SUCCESS);
2489 return 1;
2490 }
2491
2492 static int socket_serialize(Unit *u, FILE *f, FDSet *fds) {
2493 Socket *s = SOCKET(u);
2494 SocketPort *p;
2495 int r;
2496
2497 assert(u);
2498 assert(f);
2499 assert(fds);
2500
2501 unit_serialize_item(u, f, "state", socket_state_to_string(s->state));
2502 unit_serialize_item(u, f, "result", socket_result_to_string(s->result));
2503 unit_serialize_item_format(u, f, "n-accepted", "%u", s->n_accepted);
2504 unit_serialize_item_format(u, f, "n-refused", "%u", s->n_refused);
2505
2506 if (s->control_pid > 0)
2507 unit_serialize_item_format(u, f, "control-pid", PID_FMT, s->control_pid);
2508
2509 if (s->control_command_id >= 0)
2510 unit_serialize_item(u, f, "control-command", socket_exec_command_to_string(s->control_command_id));
2511
2512 LIST_FOREACH(port, p, s->ports) {
2513 int copy;
2514
2515 if (p->fd < 0)
2516 continue;
2517
2518 copy = fdset_put_dup(fds, p->fd);
2519 if (copy < 0)
2520 return copy;
2521
2522 if (p->type == SOCKET_SOCKET) {
2523 _cleanup_free_ char *t = NULL;
2524
2525 r = socket_address_print(&p->address, &t);
2526 if (r < 0)
2527 return r;
2528
2529 if (socket_address_family(&p->address) == AF_NETLINK)
2530 unit_serialize_item_format(u, f, "netlink", "%i %s", copy, t);
2531 else
2532 unit_serialize_item_format(u, f, "socket", "%i %i %s", copy, p->address.type, t);
2533
2534 } else if (p->type == SOCKET_SPECIAL)
2535 unit_serialize_item_format(u, f, "special", "%i %s", copy, p->path);
2536 else if (p->type == SOCKET_MQUEUE)
2537 unit_serialize_item_format(u, f, "mqueue", "%i %s", copy, p->path);
2538 else if (p->type == SOCKET_USB_FUNCTION)
2539 unit_serialize_item_format(u, f, "ffs", "%i %s", copy, p->path);
2540 else {
2541 assert(p->type == SOCKET_FIFO);
2542 unit_serialize_item_format(u, f, "fifo", "%i %s", copy, p->path);
2543 }
2544 }
2545
2546 return 0;
2547 }
2548
2549 static void socket_port_take_fd(SocketPort *p, FDSet *fds, int fd) {
2550 safe_close(p->fd);
2551 p->fd = fdset_remove(fds, fd);
2552 }
2553
2554 static int socket_deserialize_item(Unit *u, const char *key, const char *value, FDSet *fds) {
2555 Socket *s = SOCKET(u);
2556
2557 assert(u);
2558 assert(key);
2559 assert(value);
2560
2561 if (streq(key, "state")) {
2562 SocketState state;
2563
2564 state = socket_state_from_string(value);
2565 if (state < 0)
2566 log_unit_debug(u, "Failed to parse state value: %s", value);
2567 else
2568 s->deserialized_state = state;
2569 } else if (streq(key, "result")) {
2570 SocketResult f;
2571
2572 f = socket_result_from_string(value);
2573 if (f < 0)
2574 log_unit_debug(u, "Failed to parse result value: %s", value);
2575 else if (f != SOCKET_SUCCESS)
2576 s->result = f;
2577
2578 } else if (streq(key, "n-accepted")) {
2579 unsigned k;
2580
2581 if (safe_atou(value, &k) < 0)
2582 log_unit_debug(u, "Failed to parse n-accepted value: %s", value);
2583 else
2584 s->n_accepted += k;
2585 } else if (streq(key, "n-refused")) {
2586 unsigned k;
2587
2588 if (safe_atou(value, &k) < 0)
2589 log_unit_debug(u, "Failed to parse n-refused value: %s", value);
2590 else
2591 s->n_refused += k;
2592 } else if (streq(key, "control-pid")) {
2593 pid_t pid;
2594
2595 if (parse_pid(value, &pid) < 0)
2596 log_unit_debug(u, "Failed to parse control-pid value: %s", value);
2597 else
2598 s->control_pid = pid;
2599 } else if (streq(key, "control-command")) {
2600 SocketExecCommand id;
2601
2602 id = socket_exec_command_from_string(value);
2603 if (id < 0)
2604 log_unit_debug(u, "Failed to parse exec-command value: %s", value);
2605 else {
2606 s->control_command_id = id;
2607 s->control_command = s->exec_command[id];
2608 }
2609 } else if (streq(key, "fifo")) {
2610 int fd, skip = 0;
2611 SocketPort *p;
2612
2613 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
2614 log_unit_debug(u, "Failed to parse fifo value: %s", value);
2615 else
2616 LIST_FOREACH(port, p, s->ports)
2617 if (p->type == SOCKET_FIFO &&
2618 path_equal_or_files_same(p->path, value+skip, 0)) {
2619 socket_port_take_fd(p, fds, fd);
2620 break;
2621 }
2622
2623 } else if (streq(key, "special")) {
2624 int fd, skip = 0;
2625 SocketPort *p;
2626
2627 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
2628 log_unit_debug(u, "Failed to parse special value: %s", value);
2629 else
2630 LIST_FOREACH(port, p, s->ports)
2631 if (p->type == SOCKET_SPECIAL &&
2632 path_equal_or_files_same(p->path, value+skip, 0)) {
2633 socket_port_take_fd(p, fds, fd);
2634 break;
2635 }
2636
2637 } else if (streq(key, "mqueue")) {
2638 int fd, skip = 0;
2639 SocketPort *p;
2640
2641 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
2642 log_unit_debug(u, "Failed to parse mqueue value: %s", value);
2643 else
2644 LIST_FOREACH(port, p, s->ports)
2645 if (p->type == SOCKET_MQUEUE &&
2646 streq(p->path, value+skip)) {
2647 socket_port_take_fd(p, fds, fd);
2648 break;
2649 }
2650
2651 } else if (streq(key, "socket")) {
2652 int fd, type, skip = 0;
2653 SocketPort *p;
2654
2655 if (sscanf(value, "%i %i %n", &fd, &type, &skip) < 2 || fd < 0 || type < 0 || !fdset_contains(fds, fd))
2656 log_unit_debug(u, "Failed to parse socket value: %s", value);
2657 else
2658 LIST_FOREACH(port, p, s->ports)
2659 if (socket_address_is(&p->address, value+skip, type)) {
2660 socket_port_take_fd(p, fds, fd);
2661 break;
2662 }
2663
2664 } else if (streq(key, "netlink")) {
2665 int fd, skip = 0;
2666 SocketPort *p;
2667
2668 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
2669 log_unit_debug(u, "Failed to parse socket value: %s", value);
2670 else
2671 LIST_FOREACH(port, p, s->ports)
2672 if (socket_address_is_netlink(&p->address, value+skip)) {
2673 socket_port_take_fd(p, fds, fd);
2674 break;
2675 }
2676
2677 } else if (streq(key, "ffs")) {
2678 int fd, skip = 0;
2679 SocketPort *p;
2680
2681 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
2682 log_unit_debug(u, "Failed to parse ffs value: %s", value);
2683 else
2684 LIST_FOREACH(port, p, s->ports)
2685 if (p->type == SOCKET_USB_FUNCTION &&
2686 path_equal_or_files_same(p->path, value+skip, 0)) {
2687 socket_port_take_fd(p, fds, fd);
2688 break;
2689 }
2690
2691 } else
2692 log_unit_debug(UNIT(s), "Unknown serialization key: %s", key);
2693
2694 return 0;
2695 }
2696
2697 static void socket_distribute_fds(Unit *u, FDSet *fds) {
2698 Socket *s = SOCKET(u);
2699 SocketPort *p;
2700
2701 assert(u);
2702
2703 LIST_FOREACH(port, p, s->ports) {
2704 Iterator i;
2705 int fd;
2706
2707 if (p->type != SOCKET_SOCKET)
2708 continue;
2709
2710 if (p->fd >= 0)
2711 continue;
2712
2713 FDSET_FOREACH(fd, fds, i) {
2714 if (socket_address_matches_fd(&p->address, fd)) {
2715 p->fd = fdset_remove(fds, fd);
2716 s->deserialized_state = SOCKET_LISTENING;
2717 break;
2718 }
2719 }
2720 }
2721 }
2722
2723 _pure_ static UnitActiveState socket_active_state(Unit *u) {
2724 assert(u);
2725
2726 return state_translation_table[SOCKET(u)->state];
2727 }
2728
2729 _pure_ static const char *socket_sub_state_to_string(Unit *u) {
2730 assert(u);
2731
2732 return socket_state_to_string(SOCKET(u)->state);
2733 }
2734
2735 const char* socket_port_type_to_string(SocketPort *p) {
2736
2737 assert(p);
2738
2739 switch (p->type) {
2740
2741 case SOCKET_SOCKET:
2742
2743 switch (p->address.type) {
2744
2745 case SOCK_STREAM:
2746 return "Stream";
2747
2748 case SOCK_DGRAM:
2749 return "Datagram";
2750
2751 case SOCK_SEQPACKET:
2752 return "SequentialPacket";
2753
2754 case SOCK_RAW:
2755 if (socket_address_family(&p->address) == AF_NETLINK)
2756 return "Netlink";
2757
2758 _fallthrough_;
2759 default:
2760 return NULL;
2761 }
2762
2763 case SOCKET_SPECIAL:
2764 return "Special";
2765
2766 case SOCKET_MQUEUE:
2767 return "MessageQueue";
2768
2769 case SOCKET_FIFO:
2770 return "FIFO";
2771
2772 case SOCKET_USB_FUNCTION:
2773 return "USBFunction";
2774
2775 default:
2776 return NULL;
2777 }
2778 }
2779
2780 SocketType socket_port_type_from_string(const char *s) {
2781 assert(s);
2782
2783 if (STR_IN_SET(s, "Stream", "Datagram", "SequentialPacket", "Netlink"))
2784 return SOCKET_SOCKET;
2785 else if (streq(s, "Special"))
2786 return SOCKET_SPECIAL;
2787 else if (streq(s, "MessageQueue"))
2788 return SOCKET_MQUEUE;
2789 else if (streq(s, "FIFO"))
2790 return SOCKET_FIFO;
2791 else if (streq(s, "USBFunction"))
2792 return SOCKET_USB_FUNCTION;
2793 else
2794 return _SOCKET_TYPE_INVALID;
2795 }
2796
2797 _pure_ static bool socket_may_gc(Unit *u) {
2798 Socket *s = SOCKET(u);
2799
2800 assert(u);
2801
2802 return s->n_connections == 0;
2803 }
2804
2805 static int socket_accept_do(Socket *s, int fd) {
2806 int cfd;
2807
2808 assert(s);
2809 assert(fd >= 0);
2810
2811 for (;;) {
2812 cfd = accept4(fd, NULL, NULL, SOCK_NONBLOCK);
2813 if (cfd < 0) {
2814 if (errno == EINTR)
2815 continue;
2816
2817 return -errno;
2818 }
2819
2820 break;
2821 }
2822
2823 return cfd;
2824 }
2825
2826 static int socket_accept_in_cgroup(Socket *s, SocketPort *p, int fd) {
2827 _cleanup_close_pair_ int pair[2] = { -1, -1 };
2828 int cfd, r;
2829 pid_t pid;
2830
2831 assert(s);
2832 assert(p);
2833 assert(fd >= 0);
2834
2835 /* Similar to socket_address_listen_in_cgroup(), but for accept() rathern than socket(): make sure that any
2836 * connection socket is also properly associated with the cgroup. */
2837
2838 if (!IN_SET(p->address.sockaddr.sa.sa_family, AF_INET, AF_INET6))
2839 goto shortcut;
2840
2841 r = bpf_firewall_supported();
2842 if (r < 0)
2843 return r;
2844 if (r == BPF_FIREWALL_UNSUPPORTED)
2845 goto shortcut;
2846
2847 if (socketpair(AF_UNIX, SOCK_SEQPACKET|SOCK_CLOEXEC, 0, pair) < 0)
2848 return log_unit_error_errno(UNIT(s), errno, "Failed to create communication channel: %m");
2849
2850 r = unit_fork_helper_process(UNIT(s), "(sd-accept)", &pid);
2851 if (r < 0)
2852 return log_unit_error_errno(UNIT(s), r, "Failed to fork off accept stub process: %m");
2853 if (r == 0) {
2854 /* Child */
2855
2856 pair[0] = safe_close(pair[0]);
2857
2858 cfd = socket_accept_do(s, fd);
2859 if (cfd < 0) {
2860 log_unit_error_errno(UNIT(s), cfd, "Failed to accept connection socket: %m");
2861 _exit(EXIT_FAILURE);
2862 }
2863
2864 r = send_one_fd(pair[1], cfd, 0);
2865 if (r < 0) {
2866 log_unit_error_errno(UNIT(s), r, "Failed to send connection socket to parent: %m");
2867 _exit(EXIT_FAILURE);
2868 }
2869
2870 _exit(EXIT_SUCCESS);
2871 }
2872
2873 pair[1] = safe_close(pair[1]);
2874 cfd = receive_one_fd(pair[0], 0);
2875
2876 /* We synchronously wait for the helper, as it shouldn't be slow */
2877 r = wait_for_terminate_and_check("(sd-accept)", pid, WAIT_LOG_ABNORMAL);
2878 if (r < 0) {
2879 safe_close(cfd);
2880 return r;
2881 }
2882
2883 if (cfd < 0)
2884 return log_unit_error_errno(UNIT(s), cfd, "Failed to receive connection socket: %m");
2885
2886 return cfd;
2887
2888 shortcut:
2889 cfd = socket_accept_do(s, fd);
2890 if (cfd < 0)
2891 return log_unit_error_errno(UNIT(s), cfd, "Failed to accept connection socket: %m");
2892
2893 return cfd;
2894 }
2895
2896 static int socket_dispatch_io(sd_event_source *source, int fd, uint32_t revents, void *userdata) {
2897 SocketPort *p = userdata;
2898 int cfd = -1;
2899
2900 assert(p);
2901 assert(fd >= 0);
2902
2903 if (p->socket->state != SOCKET_LISTENING)
2904 return 0;
2905
2906 log_unit_debug(UNIT(p->socket), "Incoming traffic");
2907
2908 if (revents != EPOLLIN) {
2909
2910 if (revents & EPOLLHUP)
2911 log_unit_error(UNIT(p->socket), "Got POLLHUP on a listening socket. The service probably invoked shutdown() on it, and should better not do that.");
2912 else
2913 log_unit_error(UNIT(p->socket), "Got unexpected poll event (0x%x) on socket.", revents);
2914 goto fail;
2915 }
2916
2917 if (p->socket->accept &&
2918 p->type == SOCKET_SOCKET &&
2919 socket_address_can_accept(&p->address)) {
2920
2921 cfd = socket_accept_in_cgroup(p->socket, p, fd);
2922 if (cfd < 0)
2923 goto fail;
2924
2925 socket_apply_socket_options(p->socket, cfd);
2926 }
2927
2928 socket_enter_running(p->socket, cfd);
2929 return 0;
2930
2931 fail:
2932 socket_enter_stop_pre(p->socket, SOCKET_FAILURE_RESOURCES);
2933 return 0;
2934 }
2935
2936 static void socket_sigchld_event(Unit *u, pid_t pid, int code, int status) {
2937 Socket *s = SOCKET(u);
2938 SocketResult f;
2939
2940 assert(s);
2941 assert(pid >= 0);
2942
2943 if (pid != s->control_pid)
2944 return;
2945
2946 s->control_pid = 0;
2947
2948 if (is_clean_exit(code, status, EXIT_CLEAN_COMMAND, NULL))
2949 f = SOCKET_SUCCESS;
2950 else if (code == CLD_EXITED)
2951 f = SOCKET_FAILURE_EXIT_CODE;
2952 else if (code == CLD_KILLED)
2953 f = SOCKET_FAILURE_SIGNAL;
2954 else if (code == CLD_DUMPED)
2955 f = SOCKET_FAILURE_CORE_DUMP;
2956 else
2957 assert_not_reached("Unknown sigchld code");
2958
2959 if (s->control_command) {
2960 exec_status_exit(&s->control_command->exec_status, &s->exec_context, pid, code, status);
2961
2962 if (s->control_command->flags & EXEC_COMMAND_IGNORE_FAILURE)
2963 f = SOCKET_SUCCESS;
2964 }
2965
2966 log_unit_full(u, f == SOCKET_SUCCESS ? LOG_DEBUG : LOG_NOTICE, 0,
2967 "Control process exited, code=%s status=%i",
2968 sigchld_code_to_string(code), status);
2969
2970 if (s->result == SOCKET_SUCCESS)
2971 s->result = f;
2972
2973 if (s->control_command &&
2974 s->control_command->command_next &&
2975 f == SOCKET_SUCCESS) {
2976
2977 log_unit_debug(u, "Running next command for state %s", socket_state_to_string(s->state));
2978 socket_run_next(s);
2979 } else {
2980 s->control_command = NULL;
2981 s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
2982
2983 /* No further commands for this step, so let's figure
2984 * out what to do next */
2985
2986 log_unit_debug(u, "Got final SIGCHLD for state %s", socket_state_to_string(s->state));
2987
2988 switch (s->state) {
2989
2990 case SOCKET_START_PRE:
2991 if (f == SOCKET_SUCCESS)
2992 socket_enter_start_chown(s);
2993 else
2994 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, f);
2995 break;
2996
2997 case SOCKET_START_CHOWN:
2998 if (f == SOCKET_SUCCESS)
2999 socket_enter_start_post(s);
3000 else
3001 socket_enter_stop_pre(s, f);
3002 break;
3003
3004 case SOCKET_START_POST:
3005 if (f == SOCKET_SUCCESS)
3006 socket_enter_listening(s);
3007 else
3008 socket_enter_stop_pre(s, f);
3009 break;
3010
3011 case SOCKET_STOP_PRE:
3012 case SOCKET_STOP_PRE_SIGTERM:
3013 case SOCKET_STOP_PRE_SIGKILL:
3014 socket_enter_stop_post(s, f);
3015 break;
3016
3017 case SOCKET_STOP_POST:
3018 case SOCKET_FINAL_SIGTERM:
3019 case SOCKET_FINAL_SIGKILL:
3020 socket_enter_dead(s, f);
3021 break;
3022
3023 default:
3024 assert_not_reached("Uh, control process died at wrong time.");
3025 }
3026 }
3027
3028 /* Notify clients about changed exit status */
3029 unit_add_to_dbus_queue(u);
3030 }
3031
3032 static int socket_dispatch_timer(sd_event_source *source, usec_t usec, void *userdata) {
3033 Socket *s = SOCKET(userdata);
3034
3035 assert(s);
3036 assert(s->timer_event_source == source);
3037
3038 switch (s->state) {
3039
3040 case SOCKET_START_PRE:
3041 log_unit_warning(UNIT(s), "Starting timed out. Terminating.");
3042 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, SOCKET_FAILURE_TIMEOUT);
3043 break;
3044
3045 case SOCKET_START_CHOWN:
3046 case SOCKET_START_POST:
3047 log_unit_warning(UNIT(s), "Starting timed out. Stopping.");
3048 socket_enter_stop_pre(s, SOCKET_FAILURE_TIMEOUT);
3049 break;
3050
3051 case SOCKET_STOP_PRE:
3052 log_unit_warning(UNIT(s), "Stopping timed out. Terminating.");
3053 socket_enter_signal(s, SOCKET_STOP_PRE_SIGTERM, SOCKET_FAILURE_TIMEOUT);
3054 break;
3055
3056 case SOCKET_STOP_PRE_SIGTERM:
3057 if (s->kill_context.send_sigkill) {
3058 log_unit_warning(UNIT(s), "Stopping timed out. Killing.");
3059 socket_enter_signal(s, SOCKET_STOP_PRE_SIGKILL, SOCKET_FAILURE_TIMEOUT);
3060 } else {
3061 log_unit_warning(UNIT(s), "Stopping timed out. Skipping SIGKILL. Ignoring.");
3062 socket_enter_stop_post(s, SOCKET_FAILURE_TIMEOUT);
3063 }
3064 break;
3065
3066 case SOCKET_STOP_PRE_SIGKILL:
3067 log_unit_warning(UNIT(s), "Processes still around after SIGKILL. Ignoring.");
3068 socket_enter_stop_post(s, SOCKET_FAILURE_TIMEOUT);
3069 break;
3070
3071 case SOCKET_STOP_POST:
3072 log_unit_warning(UNIT(s), "Stopping timed out (2). Terminating.");
3073 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, SOCKET_FAILURE_TIMEOUT);
3074 break;
3075
3076 case SOCKET_FINAL_SIGTERM:
3077 if (s->kill_context.send_sigkill) {
3078 log_unit_warning(UNIT(s), "Stopping timed out (2). Killing.");
3079 socket_enter_signal(s, SOCKET_FINAL_SIGKILL, SOCKET_FAILURE_TIMEOUT);
3080 } else {
3081 log_unit_warning(UNIT(s), "Stopping timed out (2). Skipping SIGKILL. Ignoring.");
3082 socket_enter_dead(s, SOCKET_FAILURE_TIMEOUT);
3083 }
3084 break;
3085
3086 case SOCKET_FINAL_SIGKILL:
3087 log_unit_warning(UNIT(s), "Still around after SIGKILL (2). Entering failed mode.");
3088 socket_enter_dead(s, SOCKET_FAILURE_TIMEOUT);
3089 break;
3090
3091 default:
3092 assert_not_reached("Timeout at wrong time.");
3093 }
3094
3095 return 0;
3096 }
3097
3098 int socket_collect_fds(Socket *s, int **fds) {
3099 size_t k = 0, n = 0;
3100 SocketPort *p;
3101 int *rfds;
3102
3103 assert(s);
3104 assert(fds);
3105
3106 /* Called from the service code for requesting our fds */
3107
3108 LIST_FOREACH(port, p, s->ports) {
3109 if (p->fd >= 0)
3110 n++;
3111 n += p->n_auxiliary_fds;
3112 }
3113
3114 if (n <= 0) {
3115 *fds = NULL;
3116 return 0;
3117 }
3118
3119 rfds = new(int, n);
3120 if (!rfds)
3121 return -ENOMEM;
3122
3123 LIST_FOREACH(port, p, s->ports) {
3124 size_t i;
3125
3126 if (p->fd >= 0)
3127 rfds[k++] = p->fd;
3128 for (i = 0; i < p->n_auxiliary_fds; ++i)
3129 rfds[k++] = p->auxiliary_fds[i];
3130 }
3131
3132 assert(k == n);
3133
3134 *fds = rfds;
3135 return (int) n;
3136 }
3137
3138 static void socket_reset_failed(Unit *u) {
3139 Socket *s = SOCKET(u);
3140
3141 assert(s);
3142
3143 if (s->state == SOCKET_FAILED)
3144 socket_set_state(s, SOCKET_DEAD);
3145
3146 s->result = SOCKET_SUCCESS;
3147 }
3148
3149 void socket_connection_unref(Socket *s) {
3150 assert(s);
3151
3152 /* The service is dead. Yay!
3153 *
3154 * This is strictly for one-instance-per-connection
3155 * services. */
3156
3157 assert(s->n_connections > 0);
3158 s->n_connections--;
3159
3160 log_unit_debug(UNIT(s), "One connection closed, %u left.", s->n_connections);
3161 }
3162
3163 static void socket_trigger_notify(Unit *u, Unit *other) {
3164 Socket *s = SOCKET(u);
3165
3166 assert(u);
3167 assert(other);
3168
3169 /* Filter out invocations with bogus state */
3170 if (other->load_state != UNIT_LOADED || other->type != UNIT_SERVICE)
3171 return;
3172
3173 /* Don't propagate state changes from the service if we are already down */
3174 if (!IN_SET(s->state, SOCKET_RUNNING, SOCKET_LISTENING))
3175 return;
3176
3177 /* We don't care for the service state if we are in Accept=yes mode */
3178 if (s->accept)
3179 return;
3180
3181 /* Propagate start limit hit state */
3182 if (other->start_limit_hit) {
3183 socket_enter_stop_pre(s, SOCKET_FAILURE_SERVICE_START_LIMIT_HIT);
3184 return;
3185 }
3186
3187 /* Don't propagate anything if there's still a job queued */
3188 if (other->job)
3189 return;
3190
3191 if (IN_SET(SERVICE(other)->state,
3192 SERVICE_DEAD, SERVICE_FAILED,
3193 SERVICE_FINAL_SIGTERM, SERVICE_FINAL_SIGKILL,
3194 SERVICE_AUTO_RESTART))
3195 socket_enter_listening(s);
3196
3197 if (SERVICE(other)->state == SERVICE_RUNNING)
3198 socket_set_state(s, SOCKET_RUNNING);
3199 }
3200
3201 static int socket_kill(Unit *u, KillWho who, int signo, sd_bus_error *error) {
3202 return unit_kill_common(u, who, signo, -1, SOCKET(u)->control_pid, error);
3203 }
3204
3205 static int socket_get_timeout(Unit *u, usec_t *timeout) {
3206 Socket *s = SOCKET(u);
3207 usec_t t;
3208 int r;
3209
3210 if (!s->timer_event_source)
3211 return 0;
3212
3213 r = sd_event_source_get_time(s->timer_event_source, &t);
3214 if (r < 0)
3215 return r;
3216 if (t == USEC_INFINITY)
3217 return 0;
3218
3219 *timeout = t;
3220 return 1;
3221 }
3222
3223 char *socket_fdname(Socket *s) {
3224 assert(s);
3225
3226 /* Returns the name to use for $LISTEN_NAMES. If the user
3227 * didn't specify anything specifically, use the socket unit's
3228 * name as fallback. */
3229
3230 return s->fdname ?: UNIT(s)->id;
3231 }
3232
3233 static int socket_control_pid(Unit *u) {
3234 Socket *s = SOCKET(u);
3235
3236 assert(s);
3237
3238 return s->control_pid;
3239 }
3240
3241 static const char* const socket_exec_command_table[_SOCKET_EXEC_COMMAND_MAX] = {
3242 [SOCKET_EXEC_START_PRE] = "ExecStartPre",
3243 [SOCKET_EXEC_START_CHOWN] = "ExecStartChown",
3244 [SOCKET_EXEC_START_POST] = "ExecStartPost",
3245 [SOCKET_EXEC_STOP_PRE] = "ExecStopPre",
3246 [SOCKET_EXEC_STOP_POST] = "ExecStopPost"
3247 };
3248
3249 DEFINE_STRING_TABLE_LOOKUP(socket_exec_command, SocketExecCommand);
3250
3251 static const char* const socket_result_table[_SOCKET_RESULT_MAX] = {
3252 [SOCKET_SUCCESS] = "success",
3253 [SOCKET_FAILURE_RESOURCES] = "resources",
3254 [SOCKET_FAILURE_TIMEOUT] = "timeout",
3255 [SOCKET_FAILURE_EXIT_CODE] = "exit-code",
3256 [SOCKET_FAILURE_SIGNAL] = "signal",
3257 [SOCKET_FAILURE_CORE_DUMP] = "core-dump",
3258 [SOCKET_FAILURE_START_LIMIT_HIT] = "start-limit-hit",
3259 [SOCKET_FAILURE_TRIGGER_LIMIT_HIT] = "trigger-limit-hit",
3260 [SOCKET_FAILURE_SERVICE_START_LIMIT_HIT] = "service-start-limit-hit"
3261 };
3262
3263 DEFINE_STRING_TABLE_LOOKUP(socket_result, SocketResult);
3264
3265 const UnitVTable socket_vtable = {
3266 .object_size = sizeof(Socket),
3267 .exec_context_offset = offsetof(Socket, exec_context),
3268 .cgroup_context_offset = offsetof(Socket, cgroup_context),
3269 .kill_context_offset = offsetof(Socket, kill_context),
3270 .exec_runtime_offset = offsetof(Socket, exec_runtime),
3271 .dynamic_creds_offset = offsetof(Socket, dynamic_creds),
3272
3273 .sections =
3274 "Unit\0"
3275 "Socket\0"
3276 "Install\0",
3277 .private_section = "Socket",
3278
3279 .can_transient = true,
3280
3281 .init = socket_init,
3282 .done = socket_done,
3283 .load = socket_load,
3284
3285 .coldplug = socket_coldplug,
3286
3287 .dump = socket_dump,
3288
3289 .start = socket_start,
3290 .stop = socket_stop,
3291
3292 .kill = socket_kill,
3293
3294 .get_timeout = socket_get_timeout,
3295
3296 .serialize = socket_serialize,
3297 .deserialize_item = socket_deserialize_item,
3298 .distribute_fds = socket_distribute_fds,
3299
3300 .active_state = socket_active_state,
3301 .sub_state_to_string = socket_sub_state_to_string,
3302
3303 .may_gc = socket_may_gc,
3304
3305 .sigchld_event = socket_sigchld_event,
3306
3307 .trigger_notify = socket_trigger_notify,
3308
3309 .reset_failed = socket_reset_failed,
3310
3311 .control_pid = socket_control_pid,
3312
3313 .bus_vtable = bus_socket_vtable,
3314 .bus_set_property = bus_socket_set_property,
3315 .bus_commit_properties = bus_socket_commit_properties,
3316
3317 .status_message_formats = {
3318 /*.starting_stopping = {
3319 [0] = "Starting socket %s...",
3320 [1] = "Stopping socket %s...",
3321 },*/
3322 .finished_start_job = {
3323 [JOB_DONE] = "Listening on %s.",
3324 [JOB_FAILED] = "Failed to listen on %s.",
3325 [JOB_TIMEOUT] = "Timed out starting %s.",
3326 },
3327 .finished_stop_job = {
3328 [JOB_DONE] = "Closed %s.",
3329 [JOB_FAILED] = "Failed stopping %s.",
3330 [JOB_TIMEOUT] = "Timed out stopping %s.",
3331 },
3332 },
3333 };