]> git.ipfire.org Git - thirdparty/systemd.git/blob - src/core/socket.c
Merge pull request #9504 from poettering/nss-deadlock
[thirdparty/systemd.git] / src / core / socket.c
1 /* SPDX-License-Identifier: LGPL-2.1+ */
2
3 #include <arpa/inet.h>
4 #include <errno.h>
5 #include <fcntl.h>
6 #include <mqueue.h>
7 #include <netinet/tcp.h>
8 #include <signal.h>
9 #include <sys/epoll.h>
10 #include <sys/stat.h>
11 #include <unistd.h>
12 #include <linux/sctp.h>
13
14 #include "alloc-util.h"
15 #include "bpf-firewall.h"
16 #include "bus-error.h"
17 #include "bus-util.h"
18 #include "copy.h"
19 #include "dbus-socket.h"
20 #include "def.h"
21 #include "exit-status.h"
22 #include "fd-util.h"
23 #include "format-util.h"
24 #include "fs-util.h"
25 #include "in-addr-util.h"
26 #include "io-util.h"
27 #include "label.h"
28 #include "log.h"
29 #include "missing.h"
30 #include "mkdir.h"
31 #include "parse-util.h"
32 #include "path-util.h"
33 #include "process-util.h"
34 #include "selinux-util.h"
35 #include "signal-util.h"
36 #include "smack-util.h"
37 #include "socket.h"
38 #include "socket-protocol-list.h"
39 #include "special.h"
40 #include "string-table.h"
41 #include "string-util.h"
42 #include "strv.h"
43 #include "unit-name.h"
44 #include "unit.h"
45 #include "user-util.h"
46
47 struct SocketPeer {
48 unsigned n_ref;
49
50 Socket *socket;
51 union sockaddr_union peer;
52 socklen_t peer_salen;
53 };
54
55 static const UnitActiveState state_translation_table[_SOCKET_STATE_MAX] = {
56 [SOCKET_DEAD] = UNIT_INACTIVE,
57 [SOCKET_START_PRE] = UNIT_ACTIVATING,
58 [SOCKET_START_CHOWN] = UNIT_ACTIVATING,
59 [SOCKET_START_POST] = UNIT_ACTIVATING,
60 [SOCKET_LISTENING] = UNIT_ACTIVE,
61 [SOCKET_RUNNING] = UNIT_ACTIVE,
62 [SOCKET_STOP_PRE] = UNIT_DEACTIVATING,
63 [SOCKET_STOP_PRE_SIGTERM] = UNIT_DEACTIVATING,
64 [SOCKET_STOP_PRE_SIGKILL] = UNIT_DEACTIVATING,
65 [SOCKET_STOP_POST] = UNIT_DEACTIVATING,
66 [SOCKET_FINAL_SIGTERM] = UNIT_DEACTIVATING,
67 [SOCKET_FINAL_SIGKILL] = UNIT_DEACTIVATING,
68 [SOCKET_FAILED] = UNIT_FAILED
69 };
70
71 static int socket_dispatch_io(sd_event_source *source, int fd, uint32_t revents, void *userdata);
72 static int socket_dispatch_timer(sd_event_source *source, usec_t usec, void *userdata);
73
74 static void socket_init(Unit *u) {
75 Socket *s = SOCKET(u);
76
77 assert(u);
78 assert(u->load_state == UNIT_STUB);
79
80 s->backlog = SOMAXCONN;
81 s->timeout_usec = u->manager->default_timeout_start_usec;
82 s->directory_mode = 0755;
83 s->socket_mode = 0666;
84
85 s->max_connections = 64;
86
87 s->priority = -1;
88 s->ip_tos = -1;
89 s->ip_ttl = -1;
90 s->mark = -1;
91
92 s->exec_context.std_output = u->manager->default_std_output;
93 s->exec_context.std_error = u->manager->default_std_error;
94
95 s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
96
97 s->trigger_limit.interval = USEC_INFINITY;
98 s->trigger_limit.burst = (unsigned) -1;
99 }
100
101 static void socket_unwatch_control_pid(Socket *s) {
102 assert(s);
103
104 if (s->control_pid <= 0)
105 return;
106
107 unit_unwatch_pid(UNIT(s), s->control_pid);
108 s->control_pid = 0;
109 }
110
111 static void socket_cleanup_fd_list(SocketPort *p) {
112 assert(p);
113
114 close_many(p->auxiliary_fds, p->n_auxiliary_fds);
115 p->auxiliary_fds = mfree(p->auxiliary_fds);
116 p->n_auxiliary_fds = 0;
117 }
118
119 void socket_free_ports(Socket *s) {
120 SocketPort *p;
121
122 assert(s);
123
124 while ((p = s->ports)) {
125 LIST_REMOVE(port, s->ports, p);
126
127 sd_event_source_unref(p->event_source);
128
129 socket_cleanup_fd_list(p);
130 safe_close(p->fd);
131 free(p->path);
132 free(p);
133 }
134 }
135
136 static void socket_done(Unit *u) {
137 Socket *s = SOCKET(u);
138 SocketPeer *p;
139
140 assert(s);
141
142 socket_free_ports(s);
143
144 while ((p = set_steal_first(s->peers_by_address)))
145 p->socket = NULL;
146
147 s->peers_by_address = set_free(s->peers_by_address);
148
149 s->exec_runtime = exec_runtime_unref(s->exec_runtime, false);
150 exec_command_free_array(s->exec_command, _SOCKET_EXEC_COMMAND_MAX);
151 s->control_command = NULL;
152
153 dynamic_creds_unref(&s->dynamic_creds);
154
155 socket_unwatch_control_pid(s);
156
157 unit_ref_unset(&s->service);
158
159 s->tcp_congestion = mfree(s->tcp_congestion);
160 s->bind_to_device = mfree(s->bind_to_device);
161
162 s->smack = mfree(s->smack);
163 s->smack_ip_in = mfree(s->smack_ip_in);
164 s->smack_ip_out = mfree(s->smack_ip_out);
165
166 strv_free(s->symlinks);
167
168 s->user = mfree(s->user);
169 s->group = mfree(s->group);
170
171 s->fdname = mfree(s->fdname);
172
173 s->timer_event_source = sd_event_source_unref(s->timer_event_source);
174 }
175
176 static int socket_arm_timer(Socket *s, usec_t usec) {
177 int r;
178
179 assert(s);
180
181 if (s->timer_event_source) {
182 r = sd_event_source_set_time(s->timer_event_source, usec);
183 if (r < 0)
184 return r;
185
186 return sd_event_source_set_enabled(s->timer_event_source, SD_EVENT_ONESHOT);
187 }
188
189 if (usec == USEC_INFINITY)
190 return 0;
191
192 r = sd_event_add_time(
193 UNIT(s)->manager->event,
194 &s->timer_event_source,
195 CLOCK_MONOTONIC,
196 usec, 0,
197 socket_dispatch_timer, s);
198 if (r < 0)
199 return r;
200
201 (void) sd_event_source_set_description(s->timer_event_source, "socket-timer");
202
203 return 0;
204 }
205
206 int socket_instantiate_service(Socket *s) {
207 _cleanup_free_ char *prefix = NULL, *name = NULL;
208 int r;
209 Unit *u;
210
211 assert(s);
212
213 /* This fills in s->service if it isn't filled in yet. For
214 * Accept=yes sockets we create the next connection service
215 * here. For Accept=no this is mostly a NOP since the service
216 * is figured out at load time anyway. */
217
218 if (UNIT_DEREF(s->service))
219 return 0;
220
221 if (!s->accept)
222 return 0;
223
224 r = unit_name_to_prefix(UNIT(s)->id, &prefix);
225 if (r < 0)
226 return r;
227
228 if (asprintf(&name, "%s@%u.service", prefix, s->n_accepted) < 0)
229 return -ENOMEM;
230
231 r = manager_load_unit(UNIT(s)->manager, name, NULL, NULL, &u);
232 if (r < 0)
233 return r;
234
235 unit_ref_set(&s->service, UNIT(s), u);
236
237 return unit_add_two_dependencies(UNIT(s), UNIT_BEFORE, UNIT_TRIGGERS, u, false, UNIT_DEPENDENCY_IMPLICIT);
238 }
239
240 static bool have_non_accept_socket(Socket *s) {
241 SocketPort *p;
242
243 assert(s);
244
245 if (!s->accept)
246 return true;
247
248 LIST_FOREACH(port, p, s->ports) {
249
250 if (p->type != SOCKET_SOCKET)
251 return true;
252
253 if (!socket_address_can_accept(&p->address))
254 return true;
255 }
256
257 return false;
258 }
259
260 static int socket_add_mount_dependencies(Socket *s) {
261 SocketPort *p;
262 int r;
263
264 assert(s);
265
266 LIST_FOREACH(port, p, s->ports) {
267 const char *path = NULL;
268
269 if (p->type == SOCKET_SOCKET)
270 path = socket_address_get_path(&p->address);
271 else if (IN_SET(p->type, SOCKET_FIFO, SOCKET_SPECIAL, SOCKET_USB_FUNCTION))
272 path = p->path;
273
274 if (!path)
275 continue;
276
277 r = unit_require_mounts_for(UNIT(s), path, UNIT_DEPENDENCY_FILE);
278 if (r < 0)
279 return r;
280 }
281
282 return 0;
283 }
284
285 static int socket_add_device_dependencies(Socket *s) {
286 char *t;
287
288 assert(s);
289
290 if (!s->bind_to_device || streq(s->bind_to_device, "lo"))
291 return 0;
292
293 t = strjoina("/sys/subsystem/net/devices/", s->bind_to_device);
294 return unit_add_node_dependency(UNIT(s), t, false, UNIT_BINDS_TO, UNIT_DEPENDENCY_FILE);
295 }
296
297 static int socket_add_default_dependencies(Socket *s) {
298 int r;
299 assert(s);
300
301 if (!UNIT(s)->default_dependencies)
302 return 0;
303
304 r = unit_add_dependency_by_name(UNIT(s), UNIT_BEFORE, SPECIAL_SOCKETS_TARGET, NULL, true, UNIT_DEPENDENCY_DEFAULT);
305 if (r < 0)
306 return r;
307
308 if (MANAGER_IS_SYSTEM(UNIT(s)->manager)) {
309 r = unit_add_two_dependencies_by_name(UNIT(s), UNIT_AFTER, UNIT_REQUIRES, SPECIAL_SYSINIT_TARGET, NULL, true, UNIT_DEPENDENCY_DEFAULT);
310 if (r < 0)
311 return r;
312 }
313
314 return unit_add_two_dependencies_by_name(UNIT(s), UNIT_BEFORE, UNIT_CONFLICTS, SPECIAL_SHUTDOWN_TARGET, NULL, true, UNIT_DEPENDENCY_DEFAULT);
315 }
316
317 _pure_ static bool socket_has_exec(Socket *s) {
318 unsigned i;
319 assert(s);
320
321 for (i = 0; i < _SOCKET_EXEC_COMMAND_MAX; i++)
322 if (s->exec_command[i])
323 return true;
324
325 return false;
326 }
327
328 static int socket_add_extras(Socket *s) {
329 Unit *u = UNIT(s);
330 int r;
331
332 assert(s);
333
334 /* Pick defaults for the trigger limit, if nothing was explicitly configured. We pick a relatively high limit
335 * in Accept=yes mode, and a lower limit for Accept=no. Reason: in Accept=yes mode we are invoking accept()
336 * ourselves before the trigger limit can hit, thus incoming connections are taken off the socket queue quickly
337 * and reliably. This is different for Accept=no, where the spawned service has to take the incoming traffic
338 * off the queues, which it might not necessarily do. Moreover, while Accept=no services are supposed to
339 * process whatever is queued in one go, and thus should normally never have to be started frequently. This is
340 * different for Accept=yes where each connection is processed by a new service instance, and thus frequent
341 * service starts are typical. */
342
343 if (s->trigger_limit.interval == USEC_INFINITY)
344 s->trigger_limit.interval = 2 * USEC_PER_SEC;
345
346 if (s->trigger_limit.burst == (unsigned) -1) {
347 if (s->accept)
348 s->trigger_limit.burst = 200;
349 else
350 s->trigger_limit.burst = 20;
351 }
352
353 if (have_non_accept_socket(s)) {
354
355 if (!UNIT_DEREF(s->service)) {
356 Unit *x;
357
358 r = unit_load_related_unit(u, ".service", &x);
359 if (r < 0)
360 return r;
361
362 unit_ref_set(&s->service, u, x);
363 }
364
365 r = unit_add_two_dependencies(u, UNIT_BEFORE, UNIT_TRIGGERS, UNIT_DEREF(s->service), true, UNIT_DEPENDENCY_IMPLICIT);
366 if (r < 0)
367 return r;
368 }
369
370 r = socket_add_mount_dependencies(s);
371 if (r < 0)
372 return r;
373
374 r = socket_add_device_dependencies(s);
375 if (r < 0)
376 return r;
377
378 r = unit_patch_contexts(u);
379 if (r < 0)
380 return r;
381
382 if (socket_has_exec(s)) {
383 r = unit_add_exec_dependencies(u, &s->exec_context);
384 if (r < 0)
385 return r;
386 }
387
388 r = unit_set_default_slice(u);
389 if (r < 0)
390 return r;
391
392 r = socket_add_default_dependencies(s);
393 if (r < 0)
394 return r;
395
396 return 0;
397 }
398
399 static const char *socket_find_symlink_target(Socket *s) {
400 const char *found = NULL;
401 SocketPort *p;
402
403 LIST_FOREACH(port, p, s->ports) {
404 const char *f = NULL;
405
406 switch (p->type) {
407
408 case SOCKET_FIFO:
409 f = p->path;
410 break;
411
412 case SOCKET_SOCKET:
413 f = socket_address_get_path(&p->address);
414 break;
415
416 default:
417 break;
418 }
419
420 if (f) {
421 if (found)
422 return NULL;
423
424 found = f;
425 }
426 }
427
428 return found;
429 }
430
431 static int socket_verify(Socket *s) {
432 assert(s);
433
434 if (UNIT(s)->load_state != UNIT_LOADED)
435 return 0;
436
437 if (!s->ports) {
438 log_unit_error(UNIT(s), "Unit has no Listen setting (ListenStream=, ListenDatagram=, ListenFIFO=, ...). Refusing.");
439 return -ENOEXEC;
440 }
441
442 if (s->accept && have_non_accept_socket(s)) {
443 log_unit_error(UNIT(s), "Unit configured for accepting sockets, but sockets are non-accepting. Refusing.");
444 return -ENOEXEC;
445 }
446
447 if (s->accept && s->max_connections <= 0) {
448 log_unit_error(UNIT(s), "MaxConnection= setting too small. Refusing.");
449 return -ENOEXEC;
450 }
451
452 if (s->accept && UNIT_DEREF(s->service)) {
453 log_unit_error(UNIT(s), "Explicit service configuration for accepting socket units not supported. Refusing.");
454 return -ENOEXEC;
455 }
456
457 if (s->exec_context.pam_name && s->kill_context.kill_mode != KILL_CONTROL_GROUP) {
458 log_unit_error(UNIT(s), "Unit has PAM enabled. Kill mode must be set to 'control-group'. Refusing.");
459 return -ENOEXEC;
460 }
461
462 if (!strv_isempty(s->symlinks) && !socket_find_symlink_target(s)) {
463 log_unit_error(UNIT(s), "Unit has symlinks set but none or more than one node in the file system. Refusing.");
464 return -ENOEXEC;
465 }
466
467 return 0;
468 }
469
470 static void peer_address_hash_func(const void *p, struct siphash *state) {
471 const SocketPeer *s = p;
472
473 assert(s);
474
475 if (s->peer.sa.sa_family == AF_INET)
476 siphash24_compress(&s->peer.in.sin_addr, sizeof(s->peer.in.sin_addr), state);
477 else if (s->peer.sa.sa_family == AF_INET6)
478 siphash24_compress(&s->peer.in6.sin6_addr, sizeof(s->peer.in6.sin6_addr), state);
479 else if (s->peer.sa.sa_family == AF_VSOCK)
480 siphash24_compress(&s->peer.vm.svm_cid, sizeof(s->peer.vm.svm_cid), state);
481 else
482 assert_not_reached("Unknown address family.");
483 }
484
485 static int peer_address_compare_func(const void *a, const void *b) {
486 const SocketPeer *x = a, *y = b;
487
488 if (x->peer.sa.sa_family < y->peer.sa.sa_family)
489 return -1;
490 if (x->peer.sa.sa_family > y->peer.sa.sa_family)
491 return 1;
492
493 switch(x->peer.sa.sa_family) {
494 case AF_INET:
495 return memcmp(&x->peer.in.sin_addr, &y->peer.in.sin_addr, sizeof(x->peer.in.sin_addr));
496 case AF_INET6:
497 return memcmp(&x->peer.in6.sin6_addr, &y->peer.in6.sin6_addr, sizeof(x->peer.in6.sin6_addr));
498 case AF_VSOCK:
499 if (x->peer.vm.svm_cid < y->peer.vm.svm_cid)
500 return -1;
501 if (x->peer.vm.svm_cid > y->peer.vm.svm_cid)
502 return 1;
503 return 0;
504 }
505 assert_not_reached("Black sheep in the family!");
506 }
507
508 const struct hash_ops peer_address_hash_ops = {
509 .hash = peer_address_hash_func,
510 .compare = peer_address_compare_func
511 };
512
513 static int socket_load(Unit *u) {
514 Socket *s = SOCKET(u);
515 int r;
516
517 assert(u);
518 assert(u->load_state == UNIT_STUB);
519
520 r = set_ensure_allocated(&s->peers_by_address, &peer_address_hash_ops);
521 if (r < 0)
522 return r;
523
524 r = unit_load_fragment_and_dropin(u);
525 if (r < 0)
526 return r;
527
528 if (u->load_state == UNIT_LOADED) {
529 /* This is a new unit? Then let's add in some extras */
530 r = socket_add_extras(s);
531 if (r < 0)
532 return r;
533 }
534
535 return socket_verify(s);
536 }
537
538 static SocketPeer *socket_peer_new(void) {
539 SocketPeer *p;
540
541 p = new0(SocketPeer, 1);
542 if (!p)
543 return NULL;
544
545 p->n_ref = 1;
546
547 return p;
548 }
549
550 SocketPeer *socket_peer_ref(SocketPeer *p) {
551 if (!p)
552 return NULL;
553
554 assert(p->n_ref > 0);
555 p->n_ref++;
556
557 return p;
558 }
559
560 SocketPeer *socket_peer_unref(SocketPeer *p) {
561 if (!p)
562 return NULL;
563
564 assert(p->n_ref > 0);
565
566 p->n_ref--;
567
568 if (p->n_ref > 0)
569 return NULL;
570
571 if (p->socket)
572 set_remove(p->socket->peers_by_address, p);
573
574 return mfree(p);
575 }
576
577 int socket_acquire_peer(Socket *s, int fd, SocketPeer **p) {
578 _cleanup_(socket_peer_unrefp) SocketPeer *remote = NULL;
579 SocketPeer sa = {}, *i;
580 socklen_t salen = sizeof(sa.peer);
581 int r;
582
583 assert(fd >= 0);
584 assert(s);
585
586 r = getpeername(fd, &sa.peer.sa, &salen);
587 if (r < 0)
588 return log_error_errno(errno, "getpeername failed: %m");
589
590 if (!IN_SET(sa.peer.sa.sa_family, AF_INET, AF_INET6, AF_VSOCK)) {
591 *p = NULL;
592 return 0;
593 }
594
595 i = set_get(s->peers_by_address, &sa);
596 if (i) {
597 *p = socket_peer_ref(i);
598 return 1;
599 }
600
601 remote = socket_peer_new();
602 if (!remote)
603 return log_oom();
604
605 remote->peer = sa.peer;
606 remote->peer_salen = salen;
607
608 r = set_put(s->peers_by_address, remote);
609 if (r < 0)
610 return r;
611
612 remote->socket = s;
613
614 *p = TAKE_PTR(remote);
615
616 return 1;
617 }
618
619 _const_ static const char* listen_lookup(int family, int type) {
620
621 if (family == AF_NETLINK)
622 return "ListenNetlink";
623
624 if (type == SOCK_STREAM)
625 return "ListenStream";
626 else if (type == SOCK_DGRAM)
627 return "ListenDatagram";
628 else if (type == SOCK_SEQPACKET)
629 return "ListenSequentialPacket";
630
631 assert_not_reached("Unknown socket type");
632 return NULL;
633 }
634
635 static void socket_dump(Unit *u, FILE *f, const char *prefix) {
636 char time_string[FORMAT_TIMESPAN_MAX];
637 SocketExecCommand c;
638 Socket *s = SOCKET(u);
639 SocketPort *p;
640 const char *prefix2, *str;
641
642 assert(s);
643 assert(f);
644
645 prefix = strempty(prefix);
646 prefix2 = strjoina(prefix, "\t");
647
648 fprintf(f,
649 "%sSocket State: %s\n"
650 "%sResult: %s\n"
651 "%sBindIPv6Only: %s\n"
652 "%sBacklog: %u\n"
653 "%sSocketMode: %04o\n"
654 "%sDirectoryMode: %04o\n"
655 "%sKeepAlive: %s\n"
656 "%sNoDelay: %s\n"
657 "%sFreeBind: %s\n"
658 "%sTransparent: %s\n"
659 "%sBroadcast: %s\n"
660 "%sPassCredentials: %s\n"
661 "%sPassSecurity: %s\n"
662 "%sTCPCongestion: %s\n"
663 "%sRemoveOnStop: %s\n"
664 "%sWritable: %s\n"
665 "%sFileDescriptorName: %s\n"
666 "%sSELinuxContextFromNet: %s\n",
667 prefix, socket_state_to_string(s->state),
668 prefix, socket_result_to_string(s->result),
669 prefix, socket_address_bind_ipv6_only_to_string(s->bind_ipv6_only),
670 prefix, s->backlog,
671 prefix, s->socket_mode,
672 prefix, s->directory_mode,
673 prefix, yes_no(s->keep_alive),
674 prefix, yes_no(s->no_delay),
675 prefix, yes_no(s->free_bind),
676 prefix, yes_no(s->transparent),
677 prefix, yes_no(s->broadcast),
678 prefix, yes_no(s->pass_cred),
679 prefix, yes_no(s->pass_sec),
680 prefix, strna(s->tcp_congestion),
681 prefix, yes_no(s->remove_on_stop),
682 prefix, yes_no(s->writable),
683 prefix, socket_fdname(s),
684 prefix, yes_no(s->selinux_context_from_net));
685
686 if (s->control_pid > 0)
687 fprintf(f,
688 "%sControl PID: "PID_FMT"\n",
689 prefix, s->control_pid);
690
691 if (s->bind_to_device)
692 fprintf(f,
693 "%sBindToDevice: %s\n",
694 prefix, s->bind_to_device);
695
696 if (s->accept)
697 fprintf(f,
698 "%sAccepted: %u\n"
699 "%sNConnections: %u\n"
700 "%sMaxConnections: %u\n"
701 "%sMaxConnectionsPerSource: %u\n",
702 prefix, s->n_accepted,
703 prefix, s->n_connections,
704 prefix, s->max_connections,
705 prefix, s->max_connections_per_source);
706
707 if (s->priority >= 0)
708 fprintf(f,
709 "%sPriority: %i\n",
710 prefix, s->priority);
711
712 if (s->receive_buffer > 0)
713 fprintf(f,
714 "%sReceiveBuffer: %zu\n",
715 prefix, s->receive_buffer);
716
717 if (s->send_buffer > 0)
718 fprintf(f,
719 "%sSendBuffer: %zu\n",
720 prefix, s->send_buffer);
721
722 if (s->ip_tos >= 0)
723 fprintf(f,
724 "%sIPTOS: %i\n",
725 prefix, s->ip_tos);
726
727 if (s->ip_ttl >= 0)
728 fprintf(f,
729 "%sIPTTL: %i\n",
730 prefix, s->ip_ttl);
731
732 if (s->pipe_size > 0)
733 fprintf(f,
734 "%sPipeSize: %zu\n",
735 prefix, s->pipe_size);
736
737 if (s->mark >= 0)
738 fprintf(f,
739 "%sMark: %i\n",
740 prefix, s->mark);
741
742 if (s->mq_maxmsg > 0)
743 fprintf(f,
744 "%sMessageQueueMaxMessages: %li\n",
745 prefix, s->mq_maxmsg);
746
747 if (s->mq_msgsize > 0)
748 fprintf(f,
749 "%sMessageQueueMessageSize: %li\n",
750 prefix, s->mq_msgsize);
751
752 if (s->reuse_port)
753 fprintf(f,
754 "%sReusePort: %s\n",
755 prefix, yes_no(s->reuse_port));
756
757 if (s->smack)
758 fprintf(f,
759 "%sSmackLabel: %s\n",
760 prefix, s->smack);
761
762 if (s->smack_ip_in)
763 fprintf(f,
764 "%sSmackLabelIPIn: %s\n",
765 prefix, s->smack_ip_in);
766
767 if (s->smack_ip_out)
768 fprintf(f,
769 "%sSmackLabelIPOut: %s\n",
770 prefix, s->smack_ip_out);
771
772 if (!isempty(s->user) || !isempty(s->group))
773 fprintf(f,
774 "%sSocketUser: %s\n"
775 "%sSocketGroup: %s\n",
776 prefix, strna(s->user),
777 prefix, strna(s->group));
778
779 if (s->keep_alive_time > 0)
780 fprintf(f,
781 "%sKeepAliveTimeSec: %s\n",
782 prefix, format_timespan(time_string, FORMAT_TIMESPAN_MAX, s->keep_alive_time, USEC_PER_SEC));
783
784 if (s->keep_alive_interval > 0)
785 fprintf(f,
786 "%sKeepAliveIntervalSec: %s\n",
787 prefix, format_timespan(time_string, FORMAT_TIMESPAN_MAX, s->keep_alive_interval, USEC_PER_SEC));
788
789 if (s->keep_alive_cnt > 0)
790 fprintf(f,
791 "%sKeepAliveProbes: %u\n",
792 prefix, s->keep_alive_cnt);
793
794 if (s->defer_accept > 0)
795 fprintf(f,
796 "%sDeferAcceptSec: %s\n",
797 prefix, format_timespan(time_string, FORMAT_TIMESPAN_MAX, s->defer_accept, USEC_PER_SEC));
798
799 LIST_FOREACH(port, p, s->ports) {
800
801 switch (p->type) {
802 case SOCKET_SOCKET: {
803 _cleanup_free_ char *k = NULL;
804 const char *t;
805 int r;
806
807 r = socket_address_print(&p->address, &k);
808 if (r < 0)
809 t = strerror(-r);
810 else
811 t = k;
812
813 fprintf(f, "%s%s: %s\n", prefix, listen_lookup(socket_address_family(&p->address), p->address.type), t);
814 break;
815 }
816 case SOCKET_SPECIAL:
817 fprintf(f, "%sListenSpecial: %s\n", prefix, p->path);
818 break;
819 case SOCKET_USB_FUNCTION:
820 fprintf(f, "%sListenUSBFunction: %s\n", prefix, p->path);
821 break;
822 case SOCKET_MQUEUE:
823 fprintf(f, "%sListenMessageQueue: %s\n", prefix, p->path);
824 break;
825 default:
826 fprintf(f, "%sListenFIFO: %s\n", prefix, p->path);
827 }
828 }
829
830 fprintf(f,
831 "%sTriggerLimitIntervalSec: %s\n"
832 "%sTriggerLimitBurst: %u\n",
833 prefix, format_timespan(time_string, FORMAT_TIMESPAN_MAX, s->trigger_limit.interval, USEC_PER_SEC),
834 prefix, s->trigger_limit.burst);
835
836 str = socket_protocol_to_name(s->socket_protocol);
837 if (str)
838 fprintf(f, "%sSocketProtocol: %s\n", prefix, str);
839
840 if (!strv_isempty(s->symlinks)) {
841 char **q;
842
843 fprintf(f, "%sSymlinks:", prefix);
844 STRV_FOREACH(q, s->symlinks)
845 fprintf(f, " %s", *q);
846
847 fprintf(f, "\n");
848 }
849
850 fprintf(f,
851 "%sTimeoutSec: %s\n",
852 prefix, format_timespan(time_string, FORMAT_TIMESPAN_MAX, s->timeout_usec, USEC_PER_SEC));
853
854 exec_context_dump(&s->exec_context, f, prefix);
855 kill_context_dump(&s->kill_context, f, prefix);
856
857 for (c = 0; c < _SOCKET_EXEC_COMMAND_MAX; c++) {
858 if (!s->exec_command[c])
859 continue;
860
861 fprintf(f, "%s-> %s:\n",
862 prefix, socket_exec_command_to_string(c));
863
864 exec_command_dump_list(s->exec_command[c], f, prefix2);
865 }
866
867 cgroup_context_dump(&s->cgroup_context, f, prefix);
868 }
869
870 static int instance_from_socket(int fd, unsigned nr, char **instance) {
871 socklen_t l;
872 char *r;
873 union sockaddr_union local, remote;
874
875 assert(fd >= 0);
876 assert(instance);
877
878 l = sizeof(local);
879 if (getsockname(fd, &local.sa, &l) < 0)
880 return -errno;
881
882 l = sizeof(remote);
883 if (getpeername(fd, &remote.sa, &l) < 0)
884 return -errno;
885
886 switch (local.sa.sa_family) {
887
888 case AF_INET: {
889 uint32_t
890 a = be32toh(local.in.sin_addr.s_addr),
891 b = be32toh(remote.in.sin_addr.s_addr);
892
893 if (asprintf(&r,
894 "%u-%u.%u.%u.%u:%u-%u.%u.%u.%u:%u",
895 nr,
896 a >> 24, (a >> 16) & 0xFF, (a >> 8) & 0xFF, a & 0xFF,
897 be16toh(local.in.sin_port),
898 b >> 24, (b >> 16) & 0xFF, (b >> 8) & 0xFF, b & 0xFF,
899 be16toh(remote.in.sin_port)) < 0)
900 return -ENOMEM;
901
902 break;
903 }
904
905 case AF_INET6: {
906 static const unsigned char ipv4_prefix[] = {
907 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0xFF, 0xFF
908 };
909
910 if (memcmp(&local.in6.sin6_addr, ipv4_prefix, sizeof(ipv4_prefix)) == 0 &&
911 memcmp(&remote.in6.sin6_addr, ipv4_prefix, sizeof(ipv4_prefix)) == 0) {
912 const uint8_t
913 *a = local.in6.sin6_addr.s6_addr+12,
914 *b = remote.in6.sin6_addr.s6_addr+12;
915
916 if (asprintf(&r,
917 "%u-%u.%u.%u.%u:%u-%u.%u.%u.%u:%u",
918 nr,
919 a[0], a[1], a[2], a[3],
920 be16toh(local.in6.sin6_port),
921 b[0], b[1], b[2], b[3],
922 be16toh(remote.in6.sin6_port)) < 0)
923 return -ENOMEM;
924 } else {
925 char a[INET6_ADDRSTRLEN], b[INET6_ADDRSTRLEN];
926
927 if (asprintf(&r,
928 "%u-%s:%u-%s:%u",
929 nr,
930 inet_ntop(AF_INET6, &local.in6.sin6_addr, a, sizeof(a)),
931 be16toh(local.in6.sin6_port),
932 inet_ntop(AF_INET6, &remote.in6.sin6_addr, b, sizeof(b)),
933 be16toh(remote.in6.sin6_port)) < 0)
934 return -ENOMEM;
935 }
936
937 break;
938 }
939
940 case AF_UNIX: {
941 struct ucred ucred;
942 int k;
943
944 k = getpeercred(fd, &ucred);
945 if (k >= 0) {
946 if (asprintf(&r,
947 "%u-"PID_FMT"-"UID_FMT,
948 nr, ucred.pid, ucred.uid) < 0)
949 return -ENOMEM;
950 } else if (k == -ENODATA) {
951 /* This handles the case where somebody is
952 * connecting from another pid/uid namespace
953 * (e.g. from outside of our container). */
954 if (asprintf(&r,
955 "%u-unknown",
956 nr) < 0)
957 return -ENOMEM;
958 } else
959 return k;
960
961 break;
962 }
963
964 case AF_VSOCK:
965 if (asprintf(&r,
966 "%u-%u:%u-%u:%u",
967 nr,
968 local.vm.svm_cid, local.vm.svm_port,
969 remote.vm.svm_cid, remote.vm.svm_port) < 0)
970 return -ENOMEM;
971
972 break;
973
974 default:
975 assert_not_reached("Unhandled socket type.");
976 }
977
978 *instance = r;
979 return 0;
980 }
981
982 static void socket_close_fds(Socket *s) {
983 SocketPort *p;
984 char **i;
985
986 assert(s);
987
988 LIST_FOREACH(port, p, s->ports) {
989 bool was_open;
990
991 was_open = p->fd >= 0;
992
993 p->event_source = sd_event_source_unref(p->event_source);
994 p->fd = safe_close(p->fd);
995 socket_cleanup_fd_list(p);
996
997 /* One little note: we should normally not delete any sockets in the file system here! After all some
998 * other process we spawned might still have a reference of this fd and wants to continue to use
999 * it. Therefore we normally delete sockets in the file system before we create a new one, not after we
1000 * stopped using one! That all said, if the user explicitly requested this, we'll delete them here
1001 * anyway, but only then. */
1002
1003 if (!was_open || !s->remove_on_stop)
1004 continue;
1005
1006 switch (p->type) {
1007
1008 case SOCKET_FIFO:
1009 (void) unlink(p->path);
1010 break;
1011
1012 case SOCKET_MQUEUE:
1013 (void) mq_unlink(p->path);
1014 break;
1015
1016 case SOCKET_SOCKET:
1017 (void) socket_address_unlink(&p->address);
1018 break;
1019
1020 default:
1021 break;
1022 }
1023 }
1024
1025 if (s->remove_on_stop)
1026 STRV_FOREACH(i, s->symlinks)
1027 (void) unlink(*i);
1028 }
1029
1030 static void socket_apply_socket_options(Socket *s, int fd) {
1031 int r;
1032
1033 assert(s);
1034 assert(fd >= 0);
1035
1036 if (s->keep_alive) {
1037 int one = 1;
1038 if (setsockopt(fd, SOL_SOCKET, SO_KEEPALIVE, &one, sizeof(one)) < 0)
1039 log_unit_warning_errno(UNIT(s), errno, "SO_KEEPALIVE failed: %m");
1040 }
1041
1042 if (s->keep_alive_time > 0) {
1043 int value = s->keep_alive_time / USEC_PER_SEC;
1044 if (setsockopt(fd, SOL_TCP, TCP_KEEPIDLE, &value, sizeof(value)) < 0)
1045 log_unit_warning_errno(UNIT(s), errno, "TCP_KEEPIDLE failed: %m");
1046 }
1047
1048 if (s->keep_alive_interval > 0) {
1049 int value = s->keep_alive_interval / USEC_PER_SEC;
1050 if (setsockopt(fd, SOL_TCP, TCP_KEEPINTVL, &value, sizeof(value)) < 0)
1051 log_unit_warning_errno(UNIT(s), errno, "TCP_KEEPINTVL failed: %m");
1052 }
1053
1054 if (s->keep_alive_cnt > 0) {
1055 int value = s->keep_alive_cnt;
1056 if (setsockopt(fd, SOL_TCP, TCP_KEEPCNT, &value, sizeof(value)) < 0)
1057 log_unit_warning_errno(UNIT(s), errno, "TCP_KEEPCNT failed: %m");
1058 }
1059
1060 if (s->defer_accept > 0) {
1061 int value = s->defer_accept / USEC_PER_SEC;
1062 if (setsockopt(fd, SOL_TCP, TCP_DEFER_ACCEPT, &value, sizeof(value)) < 0)
1063 log_unit_warning_errno(UNIT(s), errno, "TCP_DEFER_ACCEPT failed: %m");
1064 }
1065
1066 if (s->no_delay) {
1067 int one = 1;
1068
1069 if (s->socket_protocol == IPPROTO_SCTP) {
1070 if (setsockopt(fd, SOL_SCTP, SCTP_NODELAY, &one, sizeof(one)) < 0)
1071 log_unit_warning_errno(UNIT(s), errno, "SCTP_NODELAY failed: %m");
1072 } else {
1073 if (setsockopt(fd, SOL_TCP, TCP_NODELAY, &one, sizeof(one)) < 0)
1074 log_unit_warning_errno(UNIT(s), errno, "TCP_NODELAY failed: %m");
1075 }
1076 }
1077
1078 if (s->broadcast) {
1079 int one = 1;
1080 if (setsockopt(fd, SOL_SOCKET, SO_BROADCAST, &one, sizeof(one)) < 0)
1081 log_unit_warning_errno(UNIT(s), errno, "SO_BROADCAST failed: %m");
1082 }
1083
1084 if (s->pass_cred) {
1085 int one = 1;
1086 if (setsockopt(fd, SOL_SOCKET, SO_PASSCRED, &one, sizeof(one)) < 0)
1087 log_unit_warning_errno(UNIT(s), errno, "SO_PASSCRED failed: %m");
1088 }
1089
1090 if (s->pass_sec) {
1091 int one = 1;
1092 if (setsockopt(fd, SOL_SOCKET, SO_PASSSEC, &one, sizeof(one)) < 0)
1093 log_unit_warning_errno(UNIT(s), errno, "SO_PASSSEC failed: %m");
1094 }
1095
1096 if (s->priority >= 0)
1097 if (setsockopt(fd, SOL_SOCKET, SO_PRIORITY, &s->priority, sizeof(s->priority)) < 0)
1098 log_unit_warning_errno(UNIT(s), errno, "SO_PRIORITY failed: %m");
1099
1100 if (s->receive_buffer > 0) {
1101 int value = (int) s->receive_buffer;
1102
1103 /* We first try with SO_RCVBUFFORCE, in case we have the perms for that */
1104 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUFFORCE, &value, sizeof(value)) < 0)
1105 if (setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &value, sizeof(value)) < 0)
1106 log_unit_warning_errno(UNIT(s), errno, "SO_RCVBUF failed: %m");
1107 }
1108
1109 if (s->send_buffer > 0) {
1110 int value = (int) s->send_buffer;
1111 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUFFORCE, &value, sizeof(value)) < 0)
1112 if (setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &value, sizeof(value)) < 0)
1113 log_unit_warning_errno(UNIT(s), errno, "SO_SNDBUF failed: %m");
1114 }
1115
1116 if (s->mark >= 0)
1117 if (setsockopt(fd, SOL_SOCKET, SO_MARK, &s->mark, sizeof(s->mark)) < 0)
1118 log_unit_warning_errno(UNIT(s), errno, "SO_MARK failed: %m");
1119
1120 if (s->ip_tos >= 0)
1121 if (setsockopt(fd, IPPROTO_IP, IP_TOS, &s->ip_tos, sizeof(s->ip_tos)) < 0)
1122 log_unit_warning_errno(UNIT(s), errno, "IP_TOS failed: %m");
1123
1124 if (s->ip_ttl >= 0) {
1125 int x;
1126
1127 r = setsockopt(fd, IPPROTO_IP, IP_TTL, &s->ip_ttl, sizeof(s->ip_ttl));
1128
1129 if (socket_ipv6_is_supported())
1130 x = setsockopt(fd, IPPROTO_IPV6, IPV6_UNICAST_HOPS, &s->ip_ttl, sizeof(s->ip_ttl));
1131 else {
1132 x = -1;
1133 errno = EAFNOSUPPORT;
1134 }
1135
1136 if (r < 0 && x < 0)
1137 log_unit_warning_errno(UNIT(s), errno, "IP_TTL/IPV6_UNICAST_HOPS failed: %m");
1138 }
1139
1140 if (s->tcp_congestion)
1141 if (setsockopt(fd, SOL_TCP, TCP_CONGESTION, s->tcp_congestion, strlen(s->tcp_congestion)+1) < 0)
1142 log_unit_warning_errno(UNIT(s), errno, "TCP_CONGESTION failed: %m");
1143
1144 if (s->smack_ip_in) {
1145 r = mac_smack_apply_fd(fd, SMACK_ATTR_IPIN, s->smack_ip_in);
1146 if (r < 0)
1147 log_unit_error_errno(UNIT(s), r, "mac_smack_apply_ip_in_fd: %m");
1148 }
1149
1150 if (s->smack_ip_out) {
1151 r = mac_smack_apply_fd(fd, SMACK_ATTR_IPOUT, s->smack_ip_out);
1152 if (r < 0)
1153 log_unit_error_errno(UNIT(s), r, "mac_smack_apply_ip_out_fd: %m");
1154 }
1155 }
1156
1157 static void socket_apply_fifo_options(Socket *s, int fd) {
1158 int r;
1159
1160 assert(s);
1161 assert(fd >= 0);
1162
1163 if (s->pipe_size > 0)
1164 if (fcntl(fd, F_SETPIPE_SZ, s->pipe_size) < 0)
1165 log_unit_warning_errno(UNIT(s), errno, "Setting pipe size failed, ignoring: %m");
1166
1167 if (s->smack) {
1168 r = mac_smack_apply_fd(fd, SMACK_ATTR_ACCESS, s->smack);
1169 if (r < 0)
1170 log_unit_error_errno(UNIT(s), r, "SMACK relabelling failed, ignoring: %m");
1171 }
1172 }
1173
1174 static int fifo_address_create(
1175 const char *path,
1176 mode_t directory_mode,
1177 mode_t socket_mode) {
1178
1179 _cleanup_close_ int fd = -1;
1180 mode_t old_mask;
1181 struct stat st;
1182 int r;
1183
1184 assert(path);
1185
1186 (void) mkdir_parents_label(path, directory_mode);
1187
1188 r = mac_selinux_create_file_prepare(path, S_IFIFO);
1189 if (r < 0)
1190 return r;
1191
1192 /* Enforce the right access mode for the fifo */
1193 old_mask = umask(~socket_mode);
1194
1195 /* Include the original umask in our mask */
1196 (void) umask(~socket_mode | old_mask);
1197
1198 r = mkfifo(path, socket_mode);
1199 (void) umask(old_mask);
1200
1201 if (r < 0 && errno != EEXIST) {
1202 r = -errno;
1203 goto fail;
1204 }
1205
1206 fd = open(path, O_RDWR | O_CLOEXEC | O_NOCTTY | O_NONBLOCK | O_NOFOLLOW);
1207 if (fd < 0) {
1208 r = -errno;
1209 goto fail;
1210 }
1211
1212 mac_selinux_create_file_clear();
1213
1214 if (fstat(fd, &st) < 0) {
1215 r = -errno;
1216 goto fail;
1217 }
1218
1219 if (!S_ISFIFO(st.st_mode) ||
1220 (st.st_mode & 0777) != (socket_mode & ~old_mask) ||
1221 st.st_uid != getuid() ||
1222 st.st_gid != getgid()) {
1223 r = -EEXIST;
1224 goto fail;
1225 }
1226
1227 return TAKE_FD(fd);
1228
1229 fail:
1230 mac_selinux_create_file_clear();
1231 return r;
1232 }
1233
1234 static int special_address_create(const char *path, bool writable) {
1235 _cleanup_close_ int fd = -1;
1236 struct stat st;
1237
1238 assert(path);
1239
1240 fd = open(path, (writable ? O_RDWR : O_RDONLY)|O_CLOEXEC|O_NOCTTY|O_NONBLOCK|O_NOFOLLOW);
1241 if (fd < 0)
1242 return -errno;
1243
1244 if (fstat(fd, &st) < 0)
1245 return -errno;
1246
1247 /* Check whether this is a /proc, /sys or /dev file or char device */
1248 if (!S_ISREG(st.st_mode) && !S_ISCHR(st.st_mode))
1249 return -EEXIST;
1250
1251 return TAKE_FD(fd);
1252 }
1253
1254 static int usbffs_address_create(const char *path) {
1255 _cleanup_close_ int fd = -1;
1256 struct stat st;
1257
1258 assert(path);
1259
1260 fd = open(path, O_RDWR|O_CLOEXEC|O_NOCTTY|O_NONBLOCK|O_NOFOLLOW);
1261 if (fd < 0)
1262 return -errno;
1263
1264 if (fstat(fd, &st) < 0)
1265 return -errno;
1266
1267 /* Check whether this is a regular file (ffs endpoint) */
1268 if (!S_ISREG(st.st_mode))
1269 return -EEXIST;
1270
1271 return TAKE_FD(fd);
1272 }
1273
1274 static int mq_address_create(
1275 const char *path,
1276 mode_t mq_mode,
1277 long maxmsg,
1278 long msgsize) {
1279
1280 _cleanup_close_ int fd = -1;
1281 struct stat st;
1282 mode_t old_mask;
1283 struct mq_attr _attr, *attr = NULL;
1284
1285 assert(path);
1286
1287 if (maxmsg > 0 && msgsize > 0) {
1288 _attr = (struct mq_attr) {
1289 .mq_flags = O_NONBLOCK,
1290 .mq_maxmsg = maxmsg,
1291 .mq_msgsize = msgsize,
1292 };
1293 attr = &_attr;
1294 }
1295
1296 /* Enforce the right access mode for the mq */
1297 old_mask = umask(~mq_mode);
1298
1299 /* Include the original umask in our mask */
1300 (void) umask(~mq_mode | old_mask);
1301 fd = mq_open(path, O_RDONLY|O_CLOEXEC|O_NONBLOCK|O_CREAT, mq_mode, attr);
1302 (void) umask(old_mask);
1303
1304 if (fd < 0)
1305 return -errno;
1306
1307 if (fstat(fd, &st) < 0)
1308 return -errno;
1309
1310 if ((st.st_mode & 0777) != (mq_mode & ~old_mask) ||
1311 st.st_uid != getuid() ||
1312 st.st_gid != getgid())
1313 return -EEXIST;
1314
1315 return TAKE_FD(fd);
1316 }
1317
1318 static int socket_symlink(Socket *s) {
1319 const char *p;
1320 char **i;
1321 int r;
1322
1323 assert(s);
1324
1325 p = socket_find_symlink_target(s);
1326 if (!p)
1327 return 0;
1328
1329 STRV_FOREACH(i, s->symlinks) {
1330 (void) mkdir_parents_label(*i, s->directory_mode);
1331
1332 r = symlink_idempotent(p, *i);
1333
1334 if (r == -EEXIST && s->remove_on_stop) {
1335 /* If there's already something where we want to create the symlink, and the destructive
1336 * RemoveOnStop= mode is set, then we might as well try to remove what already exists and try
1337 * again. */
1338
1339 if (unlink(*i) >= 0)
1340 r = symlink_idempotent(p, *i);
1341 }
1342
1343 if (r < 0)
1344 log_unit_warning_errno(UNIT(s), r, "Failed to create symlink %s → %s, ignoring: %m", p, *i);
1345 }
1346
1347 return 0;
1348 }
1349
1350 static int usbffs_write_descs(int fd, Service *s) {
1351 int r;
1352
1353 if (!s->usb_function_descriptors || !s->usb_function_strings)
1354 return -EINVAL;
1355
1356 r = copy_file_fd(s->usb_function_descriptors, fd, 0);
1357 if (r < 0)
1358 return r;
1359
1360 return copy_file_fd(s->usb_function_strings, fd, 0);
1361 }
1362
/* scandir() filter: accepts (returns 1) every entry whose name neither starts with a dot nor equals "ep0". */
static int usbffs_select_ep(const struct dirent *d) {
        if (d->d_name[0] == '.')
                return 0;

        if (streq(d->d_name, "ep0"))
                return 0;

        return 1;
}
1366
1367 static int usbffs_dispatch_eps(SocketPort *p) {
1368 _cleanup_free_ struct dirent **ent = NULL;
1369 size_t n, k, i;
1370 int r;
1371
1372 r = scandir(p->path, &ent, usbffs_select_ep, alphasort);
1373 if (r < 0)
1374 return -errno;
1375
1376 n = (size_t) r;
1377 p->auxiliary_fds = new(int, n);
1378 if (!p->auxiliary_fds)
1379 return -ENOMEM;
1380
1381 p->n_auxiliary_fds = n;
1382
1383 k = 0;
1384 for (i = 0; i < n; ++i) {
1385 _cleanup_free_ char *ep = NULL;
1386
1387 ep = path_make_absolute(ent[i]->d_name, p->path);
1388 if (!ep)
1389 return -ENOMEM;
1390
1391 path_simplify(ep, false);
1392
1393 r = usbffs_address_create(ep);
1394 if (r < 0)
1395 goto fail;
1396
1397 p->auxiliary_fds[k++] = r;
1398 free(ent[i]);
1399 }
1400
1401 return r;
1402
1403 fail:
1404 close_many(p->auxiliary_fds, k);
1405 p->auxiliary_fds = mfree(p->auxiliary_fds);
1406 p->n_auxiliary_fds = 0;
1407
1408 return r;
1409 }
1410
1411 static int socket_determine_selinux_label(Socket *s, char **ret) {
1412 Service *service;
1413 ExecCommand *c;
1414 _cleanup_free_ char *path = NULL;
1415 int r;
1416
1417 assert(s);
1418 assert(ret);
1419
1420 if (s->selinux_context_from_net) {
1421 /* If this is requested, get label from the network label */
1422
1423 r = mac_selinux_get_our_label(ret);
1424 if (r == -EOPNOTSUPP)
1425 goto no_label;
1426
1427 } else {
1428 /* Otherwise, get it from the executable we are about to start */
1429 r = socket_instantiate_service(s);
1430 if (r < 0)
1431 return r;
1432
1433 if (!UNIT_ISSET(s->service))
1434 goto no_label;
1435
1436 service = SERVICE(UNIT_DEREF(s->service));
1437 c = service->exec_command[SERVICE_EXEC_START];
1438 if (!c)
1439 goto no_label;
1440
1441 r = chase_symlinks(c->path, service->exec_context.root_directory, CHASE_PREFIX_ROOT, &path);
1442 if (r < 0)
1443 goto no_label;
1444
1445 r = mac_selinux_get_create_label_from_exe(path, ret);
1446 if (IN_SET(r, -EPERM, -EOPNOTSUPP))
1447 goto no_label;
1448 }
1449
1450 return r;
1451
1452 no_label:
1453 *ret = NULL;
1454 return 0;
1455 }
1456
1457 static int socket_address_listen_do(
1458 Socket *s,
1459 const SocketAddress *address,
1460 const char *label) {
1461
1462 assert(s);
1463 assert(address);
1464
1465 return socket_address_listen(
1466 address,
1467 SOCK_CLOEXEC|SOCK_NONBLOCK,
1468 s->backlog,
1469 s->bind_ipv6_only,
1470 s->bind_to_device,
1471 s->reuse_port,
1472 s->free_bind,
1473 s->transparent,
1474 s->directory_mode,
1475 s->socket_mode,
1476 label);
1477 }
1478
1479 static int socket_address_listen_in_cgroup(
1480 Socket *s,
1481 const SocketAddress *address,
1482 const char *label) {
1483
1484 _cleanup_close_pair_ int pair[2] = { -1, -1 };
1485 int fd, r;
1486 pid_t pid;
1487
1488 assert(s);
1489 assert(address);
1490
1491 /* This is a wrapper around socket_address_listen(), that forks off a helper process inside the socket's cgroup
1492 * in which the socket is actually created. This way we ensure the socket is actually properly attached to the
1493 * unit's cgroup for the purpose of BPF filtering and such. */
1494
1495 if (!IN_SET(address->sockaddr.sa.sa_family, AF_INET, AF_INET6))
1496 goto shortcut; /* BPF filtering only applies to IPv4 + IPv6, shortcut things for other protocols */
1497
1498 r = bpf_firewall_supported();
1499 if (r < 0)
1500 return r;
1501 if (r == BPF_FIREWALL_UNSUPPORTED) /* If BPF firewalling isn't supported anyway — there's no point in this forking complexity */
1502 goto shortcut;
1503
1504 if (socketpair(AF_UNIX, SOCK_SEQPACKET|SOCK_CLOEXEC, 0, pair) < 0)
1505 return log_unit_error_errno(UNIT(s), errno, "Failed to create communication channel: %m");
1506
1507 r = unit_fork_helper_process(UNIT(s), "(sd-listen)", &pid);
1508 if (r < 0)
1509 return log_unit_error_errno(UNIT(s), r, "Failed to fork off listener stub process: %m");
1510 if (r == 0) {
1511 /* Child */
1512
1513 pair[0] = safe_close(pair[0]);
1514
1515 fd = socket_address_listen_do(s, address, label);
1516 if (fd < 0) {
1517 log_unit_error_errno(UNIT(s), fd, "Failed to create listening socket: %m");
1518 _exit(EXIT_FAILURE);
1519 }
1520
1521 r = send_one_fd(pair[1], fd, 0);
1522 if (r < 0) {
1523 log_unit_error_errno(UNIT(s), r, "Failed to send listening socket to parent: %m");
1524 _exit(EXIT_FAILURE);
1525 }
1526
1527 _exit(EXIT_SUCCESS);
1528 }
1529
1530 pair[1] = safe_close(pair[1]);
1531 fd = receive_one_fd(pair[0], 0);
1532
1533 /* We synchronously wait for the helper, as it shouldn't be slow */
1534 r = wait_for_terminate_and_check("(sd-listen)", pid, WAIT_LOG_ABNORMAL);
1535 if (r < 0) {
1536 safe_close(fd);
1537 return r;
1538 }
1539
1540 if (fd < 0)
1541 return log_unit_error_errno(UNIT(s), fd, "Failed to receive listening socket: %m");
1542
1543 return fd;
1544
1545 shortcut:
1546 fd = socket_address_listen_do(s, address, label);
1547 if (fd < 0)
1548 return log_error_errno(fd, "Failed to create listening socket: %m");
1549
1550 return fd;
1551 }
1552
1553 static int socket_open_fds(Socket *s) {
1554 _cleanup_(mac_selinux_freep) char *label = NULL;
1555 bool know_label = false;
1556 SocketPort *p;
1557 int r;
1558
1559 assert(s);
1560
1561 LIST_FOREACH(port, p, s->ports) {
1562
1563 if (p->fd >= 0)
1564 continue;
1565
1566 switch (p->type) {
1567
1568 case SOCKET_SOCKET:
1569
1570 if (!know_label) {
1571 /* Figure out label, if we don't it know yet. We do it once, for the first socket where
1572 * we need this and remember it for the rest. */
1573
1574 r = socket_determine_selinux_label(s, &label);
1575 if (r < 0)
1576 goto rollback;
1577
1578 know_label = true;
1579 }
1580
1581 /* Apply the socket protocol */
1582 switch (p->address.type) {
1583
1584 case SOCK_STREAM:
1585 case SOCK_SEQPACKET:
1586 if (s->socket_protocol == IPPROTO_SCTP)
1587 p->address.protocol = s->socket_protocol;
1588 break;
1589
1590 case SOCK_DGRAM:
1591 if (s->socket_protocol == IPPROTO_UDPLITE)
1592 p->address.protocol = s->socket_protocol;
1593 break;
1594 }
1595
1596 r = socket_address_listen_in_cgroup(s, &p->address, label);
1597 if (r < 0)
1598 goto rollback;
1599
1600 p->fd = r;
1601 socket_apply_socket_options(s, p->fd);
1602 socket_symlink(s);
1603 break;
1604
1605 case SOCKET_SPECIAL:
1606
1607 p->fd = special_address_create(p->path, s->writable);
1608 if (p->fd < 0) {
1609 r = p->fd;
1610 goto rollback;
1611 }
1612 break;
1613
1614 case SOCKET_FIFO:
1615
1616 p->fd = fifo_address_create(
1617 p->path,
1618 s->directory_mode,
1619 s->socket_mode);
1620 if (p->fd < 0) {
1621 r = p->fd;
1622 goto rollback;
1623 }
1624
1625 socket_apply_fifo_options(s, p->fd);
1626 socket_symlink(s);
1627 break;
1628
1629 case SOCKET_MQUEUE:
1630
1631 p->fd = mq_address_create(
1632 p->path,
1633 s->socket_mode,
1634 s->mq_maxmsg,
1635 s->mq_msgsize);
1636 if (p->fd < 0) {
1637 r = p->fd;
1638 goto rollback;
1639 }
1640 break;
1641
1642 case SOCKET_USB_FUNCTION: {
1643 _cleanup_free_ char *ep = NULL;
1644
1645 ep = path_make_absolute("ep0", p->path);
1646
1647 p->fd = usbffs_address_create(ep);
1648 if (p->fd < 0) {
1649 r = p->fd;
1650 goto rollback;
1651 }
1652
1653 r = usbffs_write_descs(p->fd, SERVICE(UNIT_DEREF(s->service)));
1654 if (r < 0)
1655 goto rollback;
1656
1657 r = usbffs_dispatch_eps(p);
1658 if (r < 0)
1659 goto rollback;
1660
1661 break;
1662 }
1663 default:
1664 assert_not_reached("Unknown port type");
1665 }
1666 }
1667
1668 return 0;
1669
1670 rollback:
1671 socket_close_fds(s);
1672 return r;
1673 }
1674
1675 static void socket_unwatch_fds(Socket *s) {
1676 SocketPort *p;
1677 int r;
1678
1679 assert(s);
1680
1681 LIST_FOREACH(port, p, s->ports) {
1682 if (p->fd < 0)
1683 continue;
1684
1685 if (!p->event_source)
1686 continue;
1687
1688 r = sd_event_source_set_enabled(p->event_source, SD_EVENT_OFF);
1689 if (r < 0)
1690 log_unit_debug_errno(UNIT(s), r, "Failed to disable event source: %m");
1691 }
1692 }
1693
1694 static int socket_watch_fds(Socket *s) {
1695 SocketPort *p;
1696 int r;
1697
1698 assert(s);
1699
1700 LIST_FOREACH(port, p, s->ports) {
1701 if (p->fd < 0)
1702 continue;
1703
1704 if (p->event_source) {
1705 r = sd_event_source_set_enabled(p->event_source, SD_EVENT_ON);
1706 if (r < 0)
1707 goto fail;
1708 } else {
1709 r = sd_event_add_io(UNIT(s)->manager->event, &p->event_source, p->fd, EPOLLIN, socket_dispatch_io, p);
1710 if (r < 0)
1711 goto fail;
1712
1713 (void) sd_event_source_set_description(p->event_source, "socket-port-io");
1714 }
1715 }
1716
1717 return 0;
1718
1719 fail:
1720 log_unit_warning_errno(UNIT(s), r, "Failed to watch listening fds: %m");
1721 socket_unwatch_fds(s);
1722 return r;
1723 }
1724
1725 enum {
1726 SOCKET_OPEN_NONE,
1727 SOCKET_OPEN_SOME,
1728 SOCKET_OPEN_ALL,
1729 };
1730
1731 static int socket_check_open(Socket *s) {
1732 bool have_open = false, have_closed = false;
1733 SocketPort *p;
1734
1735 assert(s);
1736
1737 LIST_FOREACH(port, p, s->ports) {
1738 if (p->fd < 0)
1739 have_closed = true;
1740 else
1741 have_open = true;
1742
1743 if (have_open && have_closed)
1744 return SOCKET_OPEN_SOME;
1745 }
1746
1747 if (have_open)
1748 return SOCKET_OPEN_ALL;
1749
1750 return SOCKET_OPEN_NONE;
1751 }
1752
1753 static void socket_set_state(Socket *s, SocketState state) {
1754 SocketState old_state;
1755 assert(s);
1756
1757 old_state = s->state;
1758 s->state = state;
1759
1760 if (!IN_SET(state,
1761 SOCKET_START_PRE,
1762 SOCKET_START_CHOWN,
1763 SOCKET_START_POST,
1764 SOCKET_STOP_PRE,
1765 SOCKET_STOP_PRE_SIGTERM,
1766 SOCKET_STOP_PRE_SIGKILL,
1767 SOCKET_STOP_POST,
1768 SOCKET_FINAL_SIGTERM,
1769 SOCKET_FINAL_SIGKILL)) {
1770
1771 s->timer_event_source = sd_event_source_unref(s->timer_event_source);
1772 socket_unwatch_control_pid(s);
1773 s->control_command = NULL;
1774 s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;
1775 }
1776
1777 if (state != SOCKET_LISTENING)
1778 socket_unwatch_fds(s);
1779
1780 if (!IN_SET(state,
1781 SOCKET_START_CHOWN,
1782 SOCKET_START_POST,
1783 SOCKET_LISTENING,
1784 SOCKET_RUNNING,
1785 SOCKET_STOP_PRE,
1786 SOCKET_STOP_PRE_SIGTERM,
1787 SOCKET_STOP_PRE_SIGKILL))
1788 socket_close_fds(s);
1789
1790 if (state != old_state)
1791 log_unit_debug(UNIT(s), "Changed %s -> %s", socket_state_to_string(old_state), socket_state_to_string(state));
1792
1793 unit_notify(UNIT(s), state_translation_table[old_state], state_translation_table[state], 0);
1794 }
1795
1796 static int socket_coldplug(Unit *u) {
1797 Socket *s = SOCKET(u);
1798 int r;
1799
1800 assert(s);
1801 assert(s->state == SOCKET_DEAD);
1802
1803 if (s->deserialized_state == s->state)
1804 return 0;
1805
1806 if (s->control_pid > 0 &&
1807 pid_is_unwaited(s->control_pid) &&
1808 IN_SET(s->deserialized_state,
1809 SOCKET_START_PRE,
1810 SOCKET_START_CHOWN,
1811 SOCKET_START_POST,
1812 SOCKET_STOP_PRE,
1813 SOCKET_STOP_PRE_SIGTERM,
1814 SOCKET_STOP_PRE_SIGKILL,
1815 SOCKET_STOP_POST,
1816 SOCKET_FINAL_SIGTERM,
1817 SOCKET_FINAL_SIGKILL)) {
1818
1819 r = unit_watch_pid(UNIT(s), s->control_pid);
1820 if (r < 0)
1821 return r;
1822
1823 r = socket_arm_timer(s, usec_add(u->state_change_timestamp.monotonic, s->timeout_usec));
1824 if (r < 0)
1825 return r;
1826 }
1827
1828 if (IN_SET(s->deserialized_state,
1829 SOCKET_START_CHOWN,
1830 SOCKET_START_POST,
1831 SOCKET_LISTENING,
1832 SOCKET_RUNNING)) {
1833
1834 /* Originally, we used to simply reopen all sockets here that we didn't have file descriptors
1835 * for. However, this is problematic, as we won't traverse throught the SOCKET_START_CHOWN state for
1836 * them, and thus the UID/GID wouldn't be right. Hence, instead simply check if we have all fds open,
1837 * and if there's a mismatch, warn loudly. */
1838
1839 r = socket_check_open(s);
1840 if (r == SOCKET_OPEN_NONE)
1841 log_unit_warning(UNIT(s),
1842 "Socket unit configuration has changed while unit has been running, "
1843 "no open socket file descriptor left. "
1844 "The socket unit is not functional until restarted.");
1845 else if (r == SOCKET_OPEN_SOME)
1846 log_unit_warning(UNIT(s),
1847 "Socket unit configuration has changed while unit has been running, "
1848 "and some socket file descriptors have not been opened yet. "
1849 "The socket unit is not fully functional until restarted.");
1850 }
1851
1852 if (s->deserialized_state == SOCKET_LISTENING) {
1853 r = socket_watch_fds(s);
1854 if (r < 0)
1855 return r;
1856 }
1857
1858 if (!IN_SET(s->deserialized_state, SOCKET_DEAD, SOCKET_FAILED)) {
1859 (void) unit_setup_dynamic_creds(u);
1860 (void) unit_setup_exec_runtime(u);
1861 }
1862
1863 socket_set_state(s, s->deserialized_state);
1864 return 0;
1865 }
1866
1867 static int socket_spawn(Socket *s, ExecCommand *c, pid_t *_pid) {
1868
1869 ExecParameters exec_params = {
1870 .flags = EXEC_APPLY_SANDBOXING|EXEC_APPLY_CHROOT|EXEC_APPLY_TTY_STDIN,
1871 .stdin_fd = -1,
1872 .stdout_fd = -1,
1873 .stderr_fd = -1,
1874 .exec_fd = -1,
1875 };
1876 pid_t pid;
1877 int r;
1878
1879 assert(s);
1880 assert(c);
1881 assert(_pid);
1882
1883 r = unit_prepare_exec(UNIT(s));
1884 if (r < 0)
1885 return r;
1886
1887 r = socket_arm_timer(s, usec_add(now(CLOCK_MONOTONIC), s->timeout_usec));
1888 if (r < 0)
1889 return r;
1890
1891 unit_set_exec_params(UNIT(s), &exec_params);
1892
1893 exec_params.argv = c->argv;
1894
1895 r = exec_spawn(UNIT(s),
1896 c,
1897 &s->exec_context,
1898 &exec_params,
1899 s->exec_runtime,
1900 &s->dynamic_creds,
1901 &pid);
1902 if (r < 0)
1903 return r;
1904
1905 r = unit_watch_pid(UNIT(s), pid);
1906 if (r < 0)
1907 /* FIXME: we need to do something here */
1908 return r;
1909
1910 *_pid = pid;
1911
1912 return 0;
1913 }
1914
1915 static int socket_chown(Socket *s, pid_t *_pid) {
1916 pid_t pid;
1917 int r;
1918
1919 r = socket_arm_timer(s, usec_add(now(CLOCK_MONOTONIC), s->timeout_usec));
1920 if (r < 0)
1921 goto fail;
1922
1923 /* We have to resolve the user names out-of-process, hence
1924 * let's fork here. It's messy, but well, what can we do? */
1925
1926 r = unit_fork_helper_process(UNIT(s), "(sd-chown)", &pid);
1927 if (r < 0)
1928 return r;
1929 if (r == 0) {
1930 uid_t uid = UID_INVALID;
1931 gid_t gid = GID_INVALID;
1932 SocketPort *p;
1933
1934 /* Child */
1935
1936 if (!isempty(s->user)) {
1937 const char *user = s->user;
1938
1939 r = get_user_creds(&user, &uid, &gid, NULL, NULL);
1940 if (r < 0) {
1941 log_unit_error_errno(UNIT(s), r, "Failed to resolve user %s: %m", user);
1942 _exit(EXIT_USER);
1943 }
1944 }
1945
1946 if (!isempty(s->group)) {
1947 const char *group = s->group;
1948
1949 r = get_group_creds(&group, &gid);
1950 if (r < 0) {
1951 log_unit_error_errno(UNIT(s), r, "Failed to resolve group %s: %m", group);
1952 _exit(EXIT_GROUP);
1953 }
1954 }
1955
1956 LIST_FOREACH(port, p, s->ports) {
1957 const char *path = NULL;
1958
1959 if (p->type == SOCKET_SOCKET)
1960 path = socket_address_get_path(&p->address);
1961 else if (p->type == SOCKET_FIFO)
1962 path = p->path;
1963
1964 if (!path)
1965 continue;
1966
1967 if (chown(path, uid, gid) < 0) {
1968 log_unit_error_errno(UNIT(s), errno, "Failed to chown(): %m");
1969 _exit(EXIT_CHOWN);
1970 }
1971 }
1972
1973 _exit(EXIT_SUCCESS);
1974 }
1975
1976 r = unit_watch_pid(UNIT(s), pid);
1977 if (r < 0)
1978 goto fail;
1979
1980 *_pid = pid;
1981 return 0;
1982
1983 fail:
1984 s->timer_event_source = sd_event_source_unref(s->timer_event_source);
1985 return r;
1986 }
1987
1988 static void socket_enter_dead(Socket *s, SocketResult f) {
1989 assert(s);
1990
1991 if (s->result == SOCKET_SUCCESS)
1992 s->result = f;
1993
1994 if (s->result != SOCKET_SUCCESS)
1995 log_unit_warning(UNIT(s), "Failed with result '%s'.", socket_result_to_string(s->result));
1996
1997 socket_set_state(s, s->result != SOCKET_SUCCESS ? SOCKET_FAILED : SOCKET_DEAD);
1998
1999 s->exec_runtime = exec_runtime_unref(s->exec_runtime, true);
2000
2001 exec_context_destroy_runtime_directory(&s->exec_context, UNIT(s)->manager->prefix[EXEC_DIRECTORY_RUNTIME]);
2002
2003 unit_unref_uid_gid(UNIT(s), true);
2004
2005 dynamic_creds_destroy(&s->dynamic_creds);
2006 }
2007
2008 static void socket_enter_signal(Socket *s, SocketState state, SocketResult f);
2009
2010 static void socket_enter_stop_post(Socket *s, SocketResult f) {
2011 int r;
2012 assert(s);
2013
2014 if (s->result == SOCKET_SUCCESS)
2015 s->result = f;
2016
2017 socket_unwatch_control_pid(s);
2018 s->control_command_id = SOCKET_EXEC_STOP_POST;
2019 s->control_command = s->exec_command[SOCKET_EXEC_STOP_POST];
2020
2021 if (s->control_command) {
2022 r = socket_spawn(s, s->control_command, &s->control_pid);
2023 if (r < 0)
2024 goto fail;
2025
2026 socket_set_state(s, SOCKET_STOP_POST);
2027 } else
2028 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, SOCKET_SUCCESS);
2029
2030 return;
2031
2032 fail:
2033 log_unit_warning_errno(UNIT(s), r, "Failed to run 'stop-post' task: %m");
2034 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, SOCKET_FAILURE_RESOURCES);
2035 }
2036
2037 static void socket_enter_signal(Socket *s, SocketState state, SocketResult f) {
2038 int r;
2039
2040 assert(s);
2041
2042 if (s->result == SOCKET_SUCCESS)
2043 s->result = f;
2044
2045 r = unit_kill_context(
2046 UNIT(s),
2047 &s->kill_context,
2048 !IN_SET(state, SOCKET_STOP_PRE_SIGTERM, SOCKET_FINAL_SIGTERM) ?
2049 KILL_KILL : KILL_TERMINATE,
2050 -1,
2051 s->control_pid,
2052 false);
2053 if (r < 0)
2054 goto fail;
2055
2056 if (r > 0) {
2057 r = socket_arm_timer(s, usec_add(now(CLOCK_MONOTONIC), s->timeout_usec));
2058 if (r < 0)
2059 goto fail;
2060
2061 socket_set_state(s, state);
2062 } else if (state == SOCKET_STOP_PRE_SIGTERM)
2063 socket_enter_signal(s, SOCKET_STOP_PRE_SIGKILL, SOCKET_SUCCESS);
2064 else if (state == SOCKET_STOP_PRE_SIGKILL)
2065 socket_enter_stop_post(s, SOCKET_SUCCESS);
2066 else if (state == SOCKET_FINAL_SIGTERM)
2067 socket_enter_signal(s, SOCKET_FINAL_SIGKILL, SOCKET_SUCCESS);
2068 else
2069 socket_enter_dead(s, SOCKET_SUCCESS);
2070
2071 return;
2072
2073 fail:
2074 log_unit_warning_errno(UNIT(s), r, "Failed to kill processes: %m");
2075
2076 if (IN_SET(state, SOCKET_STOP_PRE_SIGTERM, SOCKET_STOP_PRE_SIGKILL))
2077 socket_enter_stop_post(s, SOCKET_FAILURE_RESOURCES);
2078 else
2079 socket_enter_dead(s, SOCKET_FAILURE_RESOURCES);
2080 }
2081
2082 static void socket_enter_stop_pre(Socket *s, SocketResult f) {
2083 int r;
2084 assert(s);
2085
2086 if (s->result == SOCKET_SUCCESS)
2087 s->result = f;
2088
2089 socket_unwatch_control_pid(s);
2090 s->control_command_id = SOCKET_EXEC_STOP_PRE;
2091 s->control_command = s->exec_command[SOCKET_EXEC_STOP_PRE];
2092
2093 if (s->control_command) {
2094 r = socket_spawn(s, s->control_command, &s->control_pid);
2095 if (r < 0)
2096 goto fail;
2097
2098 socket_set_state(s, SOCKET_STOP_PRE);
2099 } else
2100 socket_enter_stop_post(s, SOCKET_SUCCESS);
2101
2102 return;
2103
2104 fail:
2105 log_unit_warning_errno(UNIT(s), r, "Failed to run 'stop-pre' task: %m");
2106 socket_enter_stop_post(s, SOCKET_FAILURE_RESOURCES);
2107 }
2108
2109 static void socket_enter_listening(Socket *s) {
2110 int r;
2111 assert(s);
2112
2113 r = socket_watch_fds(s);
2114 if (r < 0) {
2115 log_unit_warning_errno(UNIT(s), r, "Failed to watch sockets: %m");
2116 goto fail;
2117 }
2118
2119 socket_set_state(s, SOCKET_LISTENING);
2120 return;
2121
2122 fail:
2123 socket_enter_stop_pre(s, SOCKET_FAILURE_RESOURCES);
2124 }
2125
2126 static void socket_enter_start_post(Socket *s) {
2127 int r;
2128 assert(s);
2129
2130 socket_unwatch_control_pid(s);
2131 s->control_command_id = SOCKET_EXEC_START_POST;
2132 s->control_command = s->exec_command[SOCKET_EXEC_START_POST];
2133
2134 if (s->control_command) {
2135 r = socket_spawn(s, s->control_command, &s->control_pid);
2136 if (r < 0) {
2137 log_unit_warning_errno(UNIT(s), r, "Failed to run 'start-post' task: %m");
2138 goto fail;
2139 }
2140
2141 socket_set_state(s, SOCKET_START_POST);
2142 } else
2143 socket_enter_listening(s);
2144
2145 return;
2146
2147 fail:
2148 socket_enter_stop_pre(s, SOCKET_FAILURE_RESOURCES);
2149 }
2150
2151 static void socket_enter_start_chown(Socket *s) {
2152 int r;
2153
2154 assert(s);
2155
2156 r = socket_open_fds(s);
2157 if (r < 0) {
2158 log_unit_warning_errno(UNIT(s), r, "Failed to listen on sockets: %m");
2159 goto fail;
2160 }
2161
2162 if (!isempty(s->user) || !isempty(s->group)) {
2163
2164 socket_unwatch_control_pid(s);
2165 s->control_command_id = SOCKET_EXEC_START_CHOWN;
2166 s->control_command = NULL;
2167
2168 r = socket_chown(s, &s->control_pid);
2169 if (r < 0) {
2170 log_unit_warning_errno(UNIT(s), r, "Failed to fork 'start-chown' task: %m");
2171 goto fail;
2172 }
2173
2174 socket_set_state(s, SOCKET_START_CHOWN);
2175 } else
2176 socket_enter_start_post(s);
2177
2178 return;
2179
2180 fail:
2181 socket_enter_stop_pre(s, SOCKET_FAILURE_RESOURCES);
2182 }
2183
2184 static void socket_enter_start_pre(Socket *s) {
2185 int r;
2186 assert(s);
2187
2188 socket_unwatch_control_pid(s);
2189
2190 unit_warn_leftover_processes(UNIT(s));
2191
2192 s->control_command_id = SOCKET_EXEC_START_PRE;
2193 s->control_command = s->exec_command[SOCKET_EXEC_START_PRE];
2194
2195 if (s->control_command) {
2196 r = socket_spawn(s, s->control_command, &s->control_pid);
2197 if (r < 0) {
2198 log_unit_warning_errno(UNIT(s), r, "Failed to run 'start-pre' task: %m");
2199 goto fail;
2200 }
2201
2202 socket_set_state(s, SOCKET_START_PRE);
2203 } else
2204 socket_enter_start_chown(s);
2205
2206 return;
2207
2208 fail:
2209 socket_enter_dead(s, SOCKET_FAILURE_RESOURCES);
2210 }
2211
2212 static void flush_ports(Socket *s) {
2213 SocketPort *p;
2214
2215 /* Flush all incoming traffic, regardless if actual bytes or new connections, so that this socket isn't busy
2216 * anymore */
2217
2218 LIST_FOREACH(port, p, s->ports) {
2219 if (p->fd < 0)
2220 continue;
2221
2222 (void) flush_accept(p->fd);
2223 (void) flush_fd(p->fd);
2224 }
2225 }
2226
2227 static void socket_enter_running(Socket *s, int cfd) {
2228 _cleanup_(sd_bus_error_free) sd_bus_error error = SD_BUS_ERROR_NULL;
2229 int r;
2230
2231 /* Note that this call takes possession of the connection fd passed. It either has to assign it somewhere or
2232 * close it. */
2233
2234 assert(s);
2235
2236 /* We don't take connections anymore if we are supposed to shut down anyway */
2237 if (unit_stop_pending(UNIT(s))) {
2238
2239 log_unit_debug(UNIT(s), "Suppressing connection request since unit stop is scheduled.");
2240
2241 if (cfd >= 0)
2242 goto refuse;
2243 else
2244 flush_ports(s);
2245
2246 return;
2247 }
2248
2249 if (!ratelimit_below(&s->trigger_limit)) {
2250 log_unit_warning(UNIT(s), "Trigger limit hit, refusing further activation.");
2251 socket_enter_stop_pre(s, SOCKET_FAILURE_TRIGGER_LIMIT_HIT);
2252 goto refuse;
2253 }
2254
2255 if (cfd < 0) {
2256 bool pending = false;
2257 Unit *other;
2258 Iterator i;
2259 void *v;
2260
2261 /* If there's already a start pending don't bother to
2262 * do anything */
2263 HASHMAP_FOREACH_KEY(v, other, UNIT(s)->dependencies[UNIT_TRIGGERS], i)
2264 if (unit_active_or_pending(other)) {
2265 pending = true;
2266 break;
2267 }
2268
2269 if (!pending) {
2270 if (!UNIT_ISSET(s->service)) {
2271 log_unit_error(UNIT(s), "Service to activate vanished, refusing activation.");
2272 r = -ENOENT;
2273 goto fail;
2274 }
2275
2276 r = manager_add_job(UNIT(s)->manager, JOB_START, UNIT_DEREF(s->service), JOB_REPLACE, &error, NULL);
2277 if (r < 0)
2278 goto fail;
2279 }
2280
2281 socket_set_state(s, SOCKET_RUNNING);
2282 } else {
2283 _cleanup_free_ char *prefix = NULL, *instance = NULL, *name = NULL;
2284 _cleanup_(socket_peer_unrefp) SocketPeer *p = NULL;
2285 Service *service;
2286
2287 if (s->n_connections >= s->max_connections) {
2288 log_unit_warning(UNIT(s), "Too many incoming connections (%u), dropping connection.",
2289 s->n_connections);
2290 goto refuse;
2291 }
2292
2293 if (s->max_connections_per_source > 0) {
2294 r = socket_acquire_peer(s, cfd, &p);
2295 if (r < 0) {
2296 goto refuse;
2297 } else if (r > 0 && p->n_ref > s->max_connections_per_source) {
2298 _cleanup_free_ char *t = NULL;
2299
2300 (void) sockaddr_pretty(&p->peer.sa, p->peer_salen, true, false, &t);
2301
2302 log_unit_warning(UNIT(s),
2303 "Too many incoming connections (%u) from source %s, dropping connection.",
2304 p->n_ref, strnull(t));
2305 goto refuse;
2306 }
2307 }
2308
2309 r = socket_instantiate_service(s);
2310 if (r < 0)
2311 goto fail;
2312
2313 r = instance_from_socket(cfd, s->n_accepted, &instance);
2314 if (r < 0) {
2315 if (r != -ENOTCONN)
2316 goto fail;
2317
2318 /* ENOTCONN is legitimate if TCP RST was received.
2319 * This connection is over, but the socket unit lives on. */
2320 log_unit_debug(UNIT(s), "Got ENOTCONN on incoming socket, assuming aborted connection attempt, ignoring.");
2321 goto refuse;
2322 }
2323
2324 r = unit_name_to_prefix(UNIT(s)->id, &prefix);
2325 if (r < 0)
2326 goto fail;
2327
2328 r = unit_name_build(prefix, instance, ".service", &name);
2329 if (r < 0)
2330 goto fail;
2331
2332 r = unit_add_name(UNIT_DEREF(s->service), name);
2333 if (r < 0)
2334 goto fail;
2335
2336 service = SERVICE(UNIT_DEREF(s->service));
2337 unit_ref_unset(&s->service);
2338
2339 s->n_accepted++;
2340 unit_choose_id(UNIT(service), name);
2341
2342 r = service_set_socket_fd(service, cfd, s, s->selinux_context_from_net);
2343 if (r < 0)
2344 goto fail;
2345
2346 cfd = -1; /* We passed ownership of the fd to the service now. Forget it here. */
2347 s->n_connections++;
2348
2349 service->peer = TAKE_PTR(p); /* Pass ownership of the peer reference */
2350
2351 r = manager_add_job(UNIT(s)->manager, JOB_START, UNIT(service), JOB_REPLACE, &error, NULL);
2352 if (r < 0) {
2353 /* We failed to activate the new service, but it still exists. Let's make sure the service
2354 * closes and forgets the connection fd again, immediately. */
2355 service_close_socket_fd(service);
2356 goto fail;
2357 }
2358
2359 /* Notify clients about changed counters */
2360 unit_add_to_dbus_queue(UNIT(s));
2361 }
2362
2363 return;
2364
2365 refuse:
2366 s->n_refused++;
2367 safe_close(cfd);
2368 return;
2369
2370 fail:
2371 log_unit_warning(UNIT(s), "Failed to queue service startup job (Maybe the service file is missing or not a %s unit?): %s",
2372 cfd >= 0 ? "template" : "non-template",
2373 bus_error_message(&error, r));
2374
2375 socket_enter_stop_pre(s, SOCKET_FAILURE_RESOURCES);
2376 safe_close(cfd);
2377 }
2378
2379 static void socket_run_next(Socket *s) {
2380 int r;
2381
2382 assert(s);
2383 assert(s->control_command);
2384 assert(s->control_command->command_next);
2385
2386 socket_unwatch_control_pid(s);
2387
2388 s->control_command = s->control_command->command_next;
2389
2390 r = socket_spawn(s, s->control_command, &s->control_pid);
2391 if (r < 0)
2392 goto fail;
2393
2394 return;
2395
2396 fail:
2397 log_unit_warning_errno(UNIT(s), r, "Failed to run next task: %m");
2398
2399 if (s->state == SOCKET_START_POST)
2400 socket_enter_stop_pre(s, SOCKET_FAILURE_RESOURCES);
2401 else if (s->state == SOCKET_STOP_POST)
2402 socket_enter_dead(s, SOCKET_FAILURE_RESOURCES);
2403 else
2404 socket_enter_signal(s, SOCKET_FINAL_SIGTERM, SOCKET_FAILURE_RESOURCES);
2405 }
2406
2407 static int socket_start(Unit *u) {
2408 Socket *s = SOCKET(u);
2409 int r;
2410
2411 assert(s);
2412
2413 /* We cannot fulfill this request right now, try again later
2414 * please! */
2415 if (IN_SET(s->state,
2416 SOCKET_STOP_PRE,
2417 SOCKET_STOP_PRE_SIGKILL,
2418 SOCKET_STOP_PRE_SIGTERM,
2419 SOCKET_STOP_POST,
2420 SOCKET_FINAL_SIGTERM,
2421 SOCKET_FINAL_SIGKILL))
2422 return -EAGAIN;
2423
2424 /* Already on it! */
2425 if (IN_SET(s->state,
2426 SOCKET_START_PRE,
2427 SOCKET_START_CHOWN,
2428 SOCKET_START_POST))
2429 return 0;
2430
2431 /* Cannot run this without the service being around */
2432 if (UNIT_ISSET(s->service)) {
2433 Service *service;
2434
2435 service = SERVICE(UNIT_DEREF(s->service));
2436
2437 if (UNIT(service)->load_state != UNIT_LOADED) {
2438 log_unit_error(u, "Socket service %s not loaded, refusing.", UNIT(service)->id);
2439 return -ENOENT;
2440 }
2441
2442 /* If the service is already active we cannot start the
2443 * socket */
2444 if (!IN_SET(service->state, SERVICE_DEAD, SERVICE_FAILED, SERVICE_AUTO_RESTART)) {
2445 log_unit_error(u, "Socket service %s already active, refusing.", UNIT(service)->id);
2446 return -EBUSY;
2447 }
2448 }
2449
2450 assert(IN_SET(s->state, SOCKET_DEAD, SOCKET_FAILED));
2451
2452 r = unit_start_limit_test(u);
2453 if (r < 0) {
2454 socket_enter_dead(s, SOCKET_FAILURE_START_LIMIT_HIT);
2455 return r;
2456 }
2457
2458 r = unit_acquire_invocation_id(u);
2459 if (r < 0)
2460 return r;
2461
2462 s->result = SOCKET_SUCCESS;
2463
2464 u->reset_accounting = true;
2465
2466 socket_enter_start_pre(s);
2467 return 1;
2468 }
2469
2470 static int socket_stop(Unit *u) {
2471 Socket *s = SOCKET(u);
2472
2473 assert(s);
2474
2475 /* Already on it */
2476 if (IN_SET(s->state,
2477 SOCKET_STOP_PRE,
2478 SOCKET_STOP_PRE_SIGTERM,
2479 SOCKET_STOP_PRE_SIGKILL,
2480 SOCKET_STOP_POST,
2481 SOCKET_FINAL_SIGTERM,
2482 SOCKET_FINAL_SIGKILL))
2483 return 0;
2484
2485 /* If there's already something running we go directly into
2486 * kill mode. */
2487 if (IN_SET(s->state,
2488 SOCKET_START_PRE,
2489 SOCKET_START_CHOWN,
2490 SOCKET_START_POST)) {
2491 socket_enter_signal(s, SOCKET_STOP_PRE_SIGTERM, SOCKET_SUCCESS);
2492 return -EAGAIN;
2493 }
2494
2495 assert(IN_SET(s->state, SOCKET_LISTENING, SOCKET_RUNNING));
2496
2497 socket_enter_stop_pre(s, SOCKET_SUCCESS);
2498 return 1;
2499 }
2500
2501 static int socket_serialize(Unit *u, FILE *f, FDSet *fds) {
2502 Socket *s = SOCKET(u);
2503 SocketPort *p;
2504 int r;
2505
2506 assert(u);
2507 assert(f);
2508 assert(fds);
2509
2510 unit_serialize_item(u, f, "state", socket_state_to_string(s->state));
2511 unit_serialize_item(u, f, "result", socket_result_to_string(s->result));
2512 unit_serialize_item_format(u, f, "n-accepted", "%u", s->n_accepted);
2513 unit_serialize_item_format(u, f, "n-refused", "%u", s->n_refused);
2514
2515 if (s->control_pid > 0)
2516 unit_serialize_item_format(u, f, "control-pid", PID_FMT, s->control_pid);
2517
2518 if (s->control_command_id >= 0)
2519 unit_serialize_item(u, f, "control-command", socket_exec_command_to_string(s->control_command_id));
2520
2521 LIST_FOREACH(port, p, s->ports) {
2522 int copy;
2523
2524 if (p->fd < 0)
2525 continue;
2526
2527 copy = fdset_put_dup(fds, p->fd);
2528 if (copy < 0)
2529 return copy;
2530
2531 if (p->type == SOCKET_SOCKET) {
2532 _cleanup_free_ char *t = NULL;
2533
2534 r = socket_address_print(&p->address, &t);
2535 if (r < 0)
2536 return r;
2537
2538 if (socket_address_family(&p->address) == AF_NETLINK)
2539 unit_serialize_item_format(u, f, "netlink", "%i %s", copy, t);
2540 else
2541 unit_serialize_item_format(u, f, "socket", "%i %i %s", copy, p->address.type, t);
2542
2543 } else if (p->type == SOCKET_SPECIAL)
2544 unit_serialize_item_format(u, f, "special", "%i %s", copy, p->path);
2545 else if (p->type == SOCKET_MQUEUE)
2546 unit_serialize_item_format(u, f, "mqueue", "%i %s", copy, p->path);
2547 else if (p->type == SOCKET_USB_FUNCTION)
2548 unit_serialize_item_format(u, f, "ffs", "%i %s", copy, p->path);
2549 else {
2550 assert(p->type == SOCKET_FIFO);
2551 unit_serialize_item_format(u, f, "fifo", "%i %s", copy, p->path);
2552 }
2553 }
2554
2555 return 0;
2556 }
2557
2558 static void socket_port_take_fd(SocketPort *p, FDSet *fds, int fd) {
2559 safe_close(p->fd);
2560 p->fd = fdset_remove(fds, fd);
2561 }
2562
2563 static int socket_deserialize_item(Unit *u, const char *key, const char *value, FDSet *fds) {
2564 Socket *s = SOCKET(u);
2565
2566 assert(u);
2567 assert(key);
2568 assert(value);
2569
2570 if (streq(key, "state")) {
2571 SocketState state;
2572
2573 state = socket_state_from_string(value);
2574 if (state < 0)
2575 log_unit_debug(u, "Failed to parse state value: %s", value);
2576 else
2577 s->deserialized_state = state;
2578 } else if (streq(key, "result")) {
2579 SocketResult f;
2580
2581 f = socket_result_from_string(value);
2582 if (f < 0)
2583 log_unit_debug(u, "Failed to parse result value: %s", value);
2584 else if (f != SOCKET_SUCCESS)
2585 s->result = f;
2586
2587 } else if (streq(key, "n-accepted")) {
2588 unsigned k;
2589
2590 if (safe_atou(value, &k) < 0)
2591 log_unit_debug(u, "Failed to parse n-accepted value: %s", value);
2592 else
2593 s->n_accepted += k;
2594 } else if (streq(key, "n-refused")) {
2595 unsigned k;
2596
2597 if (safe_atou(value, &k) < 0)
2598 log_unit_debug(u, "Failed to parse n-refused value: %s", value);
2599 else
2600 s->n_refused += k;
2601 } else if (streq(key, "control-pid")) {
2602 pid_t pid;
2603
2604 if (parse_pid(value, &pid) < 0)
2605 log_unit_debug(u, "Failed to parse control-pid value: %s", value);
2606 else
2607 s->control_pid = pid;
2608 } else if (streq(key, "control-command")) {
2609 SocketExecCommand id;
2610
2611 id = socket_exec_command_from_string(value);
2612 if (id < 0)
2613 log_unit_debug(u, "Failed to parse exec-command value: %s", value);
2614 else {
2615 s->control_command_id = id;
2616 s->control_command = s->exec_command[id];
2617 }
2618 } else if (streq(key, "fifo")) {
2619 int fd, skip = 0;
2620 SocketPort *p;
2621
2622 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
2623 log_unit_debug(u, "Failed to parse fifo value: %s", value);
2624 else
2625 LIST_FOREACH(port, p, s->ports)
2626 if (p->type == SOCKET_FIFO &&
2627 path_equal_or_files_same(p->path, value+skip, 0)) {
2628 socket_port_take_fd(p, fds, fd);
2629 break;
2630 }
2631
2632 } else if (streq(key, "special")) {
2633 int fd, skip = 0;
2634 SocketPort *p;
2635
2636 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
2637 log_unit_debug(u, "Failed to parse special value: %s", value);
2638 else
2639 LIST_FOREACH(port, p, s->ports)
2640 if (p->type == SOCKET_SPECIAL &&
2641 path_equal_or_files_same(p->path, value+skip, 0)) {
2642 socket_port_take_fd(p, fds, fd);
2643 break;
2644 }
2645
2646 } else if (streq(key, "mqueue")) {
2647 int fd, skip = 0;
2648 SocketPort *p;
2649
2650 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
2651 log_unit_debug(u, "Failed to parse mqueue value: %s", value);
2652 else
2653 LIST_FOREACH(port, p, s->ports)
2654 if (p->type == SOCKET_MQUEUE &&
2655 streq(p->path, value+skip)) {
2656 socket_port_take_fd(p, fds, fd);
2657 break;
2658 }
2659
2660 } else if (streq(key, "socket")) {
2661 int fd, type, skip = 0;
2662 SocketPort *p;
2663
2664 if (sscanf(value, "%i %i %n", &fd, &type, &skip) < 2 || fd < 0 || type < 0 || !fdset_contains(fds, fd))
2665 log_unit_debug(u, "Failed to parse socket value: %s", value);
2666 else
2667 LIST_FOREACH(port, p, s->ports)
2668 if (socket_address_is(&p->address, value+skip, type)) {
2669 socket_port_take_fd(p, fds, fd);
2670 break;
2671 }
2672
2673 } else if (streq(key, "netlink")) {
2674 int fd, skip = 0;
2675 SocketPort *p;
2676
2677 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
2678 log_unit_debug(u, "Failed to parse socket value: %s", value);
2679 else
2680 LIST_FOREACH(port, p, s->ports)
2681 if (socket_address_is_netlink(&p->address, value+skip)) {
2682 socket_port_take_fd(p, fds, fd);
2683 break;
2684 }
2685
2686 } else if (streq(key, "ffs")) {
2687 int fd, skip = 0;
2688 SocketPort *p;
2689
2690 if (sscanf(value, "%i %n", &fd, &skip) < 1 || fd < 0 || !fdset_contains(fds, fd))
2691 log_unit_debug(u, "Failed to parse ffs value: %s", value);
2692 else
2693 LIST_FOREACH(port, p, s->ports)
2694 if (p->type == SOCKET_USB_FUNCTION &&
2695 path_equal_or_files_same(p->path, value+skip, 0)) {
2696 socket_port_take_fd(p, fds, fd);
2697 break;
2698 }
2699
2700 } else
2701 log_unit_debug(UNIT(s), "Unknown serialization key: %s", key);
2702
2703 return 0;
2704 }
2705
2706 static void socket_distribute_fds(Unit *u, FDSet *fds) {
2707 Socket *s = SOCKET(u);
2708 SocketPort *p;
2709
2710 assert(u);
2711
2712 LIST_FOREACH(port, p, s->ports) {
2713 Iterator i;
2714 int fd;
2715
2716 if (p->type != SOCKET_SOCKET)
2717 continue;
2718
2719 if (p->fd >= 0)
2720 continue;
2721
2722 FDSET_FOREACH(fd, fds, i) {
2723 if (socket_address_matches_fd(&p->address, fd)) {
2724 p->fd = fdset_remove(fds, fd);
2725 s->deserialized_state = SOCKET_LISTENING;
2726 break;
2727 }
2728 }
2729 }
2730 }
2731
2732 _pure_ static UnitActiveState socket_active_state(Unit *u) {
2733 assert(u);
2734
2735 return state_translation_table[SOCKET(u)->state];
2736 }
2737
2738 _pure_ static const char *socket_sub_state_to_string(Unit *u) {
2739 assert(u);
2740
2741 return socket_state_to_string(SOCKET(u)->state);
2742 }
2743
2744 const char* socket_port_type_to_string(SocketPort *p) {
2745
2746 assert(p);
2747
2748 switch (p->type) {
2749
2750 case SOCKET_SOCKET:
2751
2752 switch (p->address.type) {
2753
2754 case SOCK_STREAM:
2755 return "Stream";
2756
2757 case SOCK_DGRAM:
2758 return "Datagram";
2759
2760 case SOCK_SEQPACKET:
2761 return "SequentialPacket";
2762
2763 case SOCK_RAW:
2764 if (socket_address_family(&p->address) == AF_NETLINK)
2765 return "Netlink";
2766
2767 _fallthrough_;
2768 default:
2769 return NULL;
2770 }
2771
2772 case SOCKET_SPECIAL:
2773 return "Special";
2774
2775 case SOCKET_MQUEUE:
2776 return "MessageQueue";
2777
2778 case SOCKET_FIFO:
2779 return "FIFO";
2780
2781 case SOCKET_USB_FUNCTION:
2782 return "USBFunction";
2783
2784 default:
2785 return NULL;
2786 }
2787 }
2788
2789 SocketType socket_port_type_from_string(const char *s) {
2790 assert(s);
2791
2792 if (STR_IN_SET(s, "Stream", "Datagram", "SequentialPacket", "Netlink"))
2793 return SOCKET_SOCKET;
2794 else if (streq(s, "Special"))
2795 return SOCKET_SPECIAL;
2796 else if (streq(s, "MessageQueue"))
2797 return SOCKET_MQUEUE;
2798 else if (streq(s, "FIFO"))
2799 return SOCKET_FIFO;
2800 else if (streq(s, "USBFunction"))
2801 return SOCKET_USB_FUNCTION;
2802 else
2803 return _SOCKET_TYPE_INVALID;
2804 }
2805
2806 _pure_ static bool socket_may_gc(Unit *u) {
2807 Socket *s = SOCKET(u);
2808
2809 assert(u);
2810
2811 return s->n_connections == 0;
2812 }
2813
2814 static int socket_accept_do(Socket *s, int fd) {
2815 int cfd;
2816
2817 assert(s);
2818 assert(fd >= 0);
2819
2820 for (;;) {
2821 cfd = accept4(fd, NULL, NULL, SOCK_NONBLOCK);
2822 if (cfd < 0) {
2823 if (errno == EINTR)
2824 continue;
2825
2826 return -errno;
2827 }
2828
2829 break;
2830 }
2831
2832 return cfd;
2833 }
2834
2835 static int socket_accept_in_cgroup(Socket *s, SocketPort *p, int fd) {
2836 _cleanup_close_pair_ int pair[2] = { -1, -1 };
2837 int cfd, r;
2838 pid_t pid;
2839
2840 assert(s);
2841 assert(p);
2842 assert(fd >= 0);
2843
2844 /* Similar to socket_address_listen_in_cgroup(), but for accept() rathern than socket(): make sure that any
2845 * connection socket is also properly associated with the cgroup. */
2846
2847 if (!IN_SET(p->address.sockaddr.sa.sa_family, AF_INET, AF_INET6))
2848 goto shortcut;
2849
2850 r = bpf_firewall_supported();
2851 if (r < 0)
2852 return r;
2853 if (r == BPF_FIREWALL_UNSUPPORTED)
2854 goto shortcut;
2855
2856 if (socketpair(AF_UNIX, SOCK_SEQPACKET|SOCK_CLOEXEC, 0, pair) < 0)
2857 return log_unit_error_errno(UNIT(s), errno, "Failed to create communication channel: %m");
2858
2859 r = unit_fork_helper_process(UNIT(s), "(sd-accept)", &pid);
2860 if (r < 0)
2861 return log_unit_error_errno(UNIT(s), r, "Failed to fork off accept stub process: %m");
2862 if (r == 0) {
2863 /* Child */
2864
2865 pair[0] = safe_close(pair[0]);
2866
2867 cfd = socket_accept_do(s, fd);
2868 if (cfd < 0) {
2869 log_unit_error_errno(UNIT(s), cfd, "Failed to accept connection socket: %m");
2870 _exit(EXIT_FAILURE);
2871 }
2872
2873 r = send_one_fd(pair[1], cfd, 0);
2874 if (r < 0) {
2875 log_unit_error_errno(UNIT(s), r, "Failed to send connection socket to parent: %m");
2876 _exit(EXIT_FAILURE);
2877 }
2878
2879 _exit(EXIT_SUCCESS);
2880 }
2881
2882 pair[1] = safe_close(pair[1]);
2883 cfd = receive_one_fd(pair[0], 0);
2884
2885 /* We synchronously wait for the helper, as it shouldn't be slow */
2886 r = wait_for_terminate_and_check("(sd-accept)", pid, WAIT_LOG_ABNORMAL);
2887 if (r < 0) {
2888 safe_close(cfd);
2889 return r;
2890 }
2891
2892 if (cfd < 0)
2893 return log_unit_error_errno(UNIT(s), cfd, "Failed to receive connection socket: %m");
2894
2895 return cfd;
2896
2897 shortcut:
2898 cfd = socket_accept_do(s, fd);
2899 if (cfd < 0)
2900 return log_unit_error_errno(UNIT(s), cfd, "Failed to accept connection socket: %m");
2901
2902 return cfd;
2903 }
2904
2905 static int socket_dispatch_io(sd_event_source *source, int fd, uint32_t revents, void *userdata) {
2906 SocketPort *p = userdata;
2907 int cfd = -1;
2908
2909 assert(p);
2910 assert(fd >= 0);
2911
2912 if (p->socket->state != SOCKET_LISTENING)
2913 return 0;
2914
2915 log_unit_debug(UNIT(p->socket), "Incoming traffic");
2916
2917 if (revents != EPOLLIN) {
2918
2919 if (revents & EPOLLHUP)
2920 log_unit_error(UNIT(p->socket), "Got POLLHUP on a listening socket. The service probably invoked shutdown() on it, and should better not do that.");
2921 else
2922 log_unit_error(UNIT(p->socket), "Got unexpected poll event (0x%x) on socket.", revents);
2923 goto fail;
2924 }
2925
2926 if (p->socket->accept &&
2927 p->type == SOCKET_SOCKET &&
2928 socket_address_can_accept(&p->address)) {
2929
2930 cfd = socket_accept_in_cgroup(p->socket, p, fd);
2931 if (cfd < 0)
2932 goto fail;
2933
2934 socket_apply_socket_options(p->socket, cfd);
2935 }
2936
2937 socket_enter_running(p->socket, cfd);
2938 return 0;
2939
2940 fail:
2941 socket_enter_stop_pre(p->socket, SOCKET_FAILURE_RESOURCES);
2942 return 0;
2943 }
2944
/* SIGCHLD hook: reacts to the exit of the socket's control process.
 *
 * Exits of any PID other than s->control_pid are ignored. The exit is
 * translated into a SocketResult, recorded on the current control command (if
 * any), and then either the next command of the current step is run or the
 * state machine advances according to the current state. */
static void socket_sigchld_event(Unit *u, pid_t pid, int code, int status) {
        Socket *s = SOCKET(u);
        SocketResult f;

        assert(s);
        assert(pid >= 0);

        if (pid != s->control_pid)
                return;

        s->control_pid = 0;

        /* Classify the exit. */
        if (is_clean_exit(code, status, EXIT_CLEAN_COMMAND, NULL))
                f = SOCKET_SUCCESS;
        else if (code == CLD_EXITED)
                f = SOCKET_FAILURE_EXIT_CODE;
        else if (code == CLD_KILLED)
                f = SOCKET_FAILURE_SIGNAL;
        else if (code == CLD_DUMPED)
                f = SOCKET_FAILURE_CORE_DUMP;
        else
                assert_not_reached("Unknown sigchld code");

        if (s->control_command) {
                exec_status_exit(&s->control_command->exec_status, &s->exec_context, pid, code, status);

                /* Commands flagged to ignore failure always count as successful. */
                if (s->control_command->flags & EXEC_COMMAND_IGNORE_FAILURE)
                        f = SOCKET_SUCCESS;
        }

        log_unit_full(u, f == SOCKET_SUCCESS ? LOG_DEBUG : LOG_NOTICE, 0,
                      "Control process exited, code=%s status=%i",
                      sigchld_code_to_string(code), status);

        /* Only the first failure is kept: an already recorded failure result is not overwritten. */
        if (s->result == SOCKET_SUCCESS)
                s->result = f;

        if (s->control_command &&
            s->control_command->command_next &&
            f == SOCKET_SUCCESS) {

                log_unit_debug(u, "Running next command for state %s", socket_state_to_string(s->state));
                socket_run_next(s);
        } else {
                s->control_command = NULL;
                s->control_command_id = _SOCKET_EXEC_COMMAND_INVALID;

                /* No further commands for this step, so let's figure
                 * out what to do next */

                log_unit_debug(u, "Got final SIGCHLD for state %s", socket_state_to_string(s->state));

                switch (s->state) {

                case SOCKET_START_PRE:
                        if (f == SOCKET_SUCCESS)
                                socket_enter_start_chown(s);
                        else
                                socket_enter_signal(s, SOCKET_FINAL_SIGTERM, f);
                        break;

                case SOCKET_START_CHOWN:
                        if (f == SOCKET_SUCCESS)
                                socket_enter_start_post(s);
                        else
                                socket_enter_stop_pre(s, f);
                        break;

                case SOCKET_START_POST:
                        if (f == SOCKET_SUCCESS)
                                socket_enter_listening(s);
                        else
                                socket_enter_stop_pre(s, f);
                        break;

                case SOCKET_STOP_PRE:
                case SOCKET_STOP_PRE_SIGTERM:
                case SOCKET_STOP_PRE_SIGKILL:
                        socket_enter_stop_post(s, f);
                        break;

                case SOCKET_STOP_POST:
                case SOCKET_FINAL_SIGTERM:
                case SOCKET_FINAL_SIGKILL:
                        socket_enter_dead(s, f);
                        break;

                default:
                        assert_not_reached("Uh, control process died at wrong time.");
                }
        }

        /* Notify clients about changed exit status */
        unit_add_to_dbus_queue(u);
}
3040
/* Timer event callback (userdata is the socket unit): called when the timeout
 * of the current state expires. Logs a warning and escalates to the next stage
 * depending on the state the socket is in; a timeout in any state not listed
 * here is a programming error. Always returns 0. */
static int socket_dispatch_timer(sd_event_source *source, usec_t usec, void *userdata) {
        Socket *s = SOCKET(userdata);

        assert(s);
        assert(s->timer_event_source == source);

        switch (s->state) {

        case SOCKET_START_PRE:
                log_unit_warning(UNIT(s), "Starting timed out. Terminating.");
                socket_enter_signal(s, SOCKET_FINAL_SIGTERM, SOCKET_FAILURE_TIMEOUT);
                break;

        case SOCKET_START_CHOWN:
        case SOCKET_START_POST:
                log_unit_warning(UNIT(s), "Starting timed out. Stopping.");
                socket_enter_stop_pre(s, SOCKET_FAILURE_TIMEOUT);
                break;

        case SOCKET_STOP_PRE:
                log_unit_warning(UNIT(s), "Stopping timed out. Terminating.");
                socket_enter_signal(s, SOCKET_STOP_PRE_SIGTERM, SOCKET_FAILURE_TIMEOUT);
                break;

        case SOCKET_STOP_PRE_SIGTERM:
                /* Escalate to SIGKILL only if the kill context allows it. */
                if (s->kill_context.send_sigkill) {
                        log_unit_warning(UNIT(s), "Stopping timed out. Killing.");
                        socket_enter_signal(s, SOCKET_STOP_PRE_SIGKILL, SOCKET_FAILURE_TIMEOUT);
                } else {
                        log_unit_warning(UNIT(s), "Stopping timed out. Skipping SIGKILL. Ignoring.");
                        socket_enter_stop_post(s, SOCKET_FAILURE_TIMEOUT);
                }
                break;

        case SOCKET_STOP_PRE_SIGKILL:
                log_unit_warning(UNIT(s), "Processes still around after SIGKILL. Ignoring.");
                socket_enter_stop_post(s, SOCKET_FAILURE_TIMEOUT);
                break;

        case SOCKET_STOP_POST:
                log_unit_warning(UNIT(s), "Stopping timed out (2). Terminating.");
                socket_enter_signal(s, SOCKET_FINAL_SIGTERM, SOCKET_FAILURE_TIMEOUT);
                break;

        case SOCKET_FINAL_SIGTERM:
                /* Escalate to SIGKILL only if the kill context allows it. */
                if (s->kill_context.send_sigkill) {
                        log_unit_warning(UNIT(s), "Stopping timed out (2). Killing.");
                        socket_enter_signal(s, SOCKET_FINAL_SIGKILL, SOCKET_FAILURE_TIMEOUT);
                } else {
                        log_unit_warning(UNIT(s), "Stopping timed out (2). Skipping SIGKILL. Ignoring.");
                        socket_enter_dead(s, SOCKET_FAILURE_TIMEOUT);
                }
                break;

        case SOCKET_FINAL_SIGKILL:
                log_unit_warning(UNIT(s), "Still around after SIGKILL (2). Entering failed mode.");
                socket_enter_dead(s, SOCKET_FAILURE_TIMEOUT);
                break;

        default:
                assert_not_reached("Timeout at wrong time.");
        }

        return 0;
}
3106
3107 int socket_collect_fds(Socket *s, int **fds) {
3108 size_t k = 0, n = 0;
3109 SocketPort *p;
3110 int *rfds;
3111
3112 assert(s);
3113 assert(fds);
3114
3115 /* Called from the service code for requesting our fds */
3116
3117 LIST_FOREACH(port, p, s->ports) {
3118 if (p->fd >= 0)
3119 n++;
3120 n += p->n_auxiliary_fds;
3121 }
3122
3123 if (n <= 0) {
3124 *fds = NULL;
3125 return 0;
3126 }
3127
3128 rfds = new(int, n);
3129 if (!rfds)
3130 return -ENOMEM;
3131
3132 LIST_FOREACH(port, p, s->ports) {
3133 size_t i;
3134
3135 if (p->fd >= 0)
3136 rfds[k++] = p->fd;
3137 for (i = 0; i < p->n_auxiliary_fds; ++i)
3138 rfds[k++] = p->auxiliary_fds[i];
3139 }
3140
3141 assert(k == n);
3142
3143 *fds = rfds;
3144 return (int) n;
3145 }
3146
3147 static void socket_reset_failed(Unit *u) {
3148 Socket *s = SOCKET(u);
3149
3150 assert(s);
3151
3152 if (s->state == SOCKET_FAILED)
3153 socket_set_state(s, SOCKET_DEAD);
3154
3155 s->result = SOCKET_SUCCESS;
3156 }
3157
3158 void socket_connection_unref(Socket *s) {
3159 assert(s);
3160
3161 /* The service is dead. Yay!
3162 *
3163 * This is strictly for one-instance-per-connection
3164 * services. */
3165
3166 assert(s->n_connections > 0);
3167 s->n_connections--;
3168
3169 log_unit_debug(UNIT(s), "One connection closed, %u left.", s->n_connections);
3170 }
3171
3172 static void socket_trigger_notify(Unit *u, Unit *other) {
3173 Socket *s = SOCKET(u);
3174
3175 assert(u);
3176 assert(other);
3177
3178 /* Filter out invocations with bogus state */
3179 if (other->load_state != UNIT_LOADED || other->type != UNIT_SERVICE)
3180 return;
3181
3182 /* Don't propagate state changes from the service if we are already down */
3183 if (!IN_SET(s->state, SOCKET_RUNNING, SOCKET_LISTENING))
3184 return;
3185
3186 /* We don't care for the service state if we are in Accept=yes mode */
3187 if (s->accept)
3188 return;
3189
3190 /* Propagate start limit hit state */
3191 if (other->start_limit_hit) {
3192 socket_enter_stop_pre(s, SOCKET_FAILURE_SERVICE_START_LIMIT_HIT);
3193 return;
3194 }
3195
3196 /* Don't propagate anything if there's still a job queued */
3197 if (other->job)
3198 return;
3199
3200 if (IN_SET(SERVICE(other)->state,
3201 SERVICE_DEAD, SERVICE_FAILED,
3202 SERVICE_FINAL_SIGTERM, SERVICE_FINAL_SIGKILL,
3203 SERVICE_AUTO_RESTART))
3204 socket_enter_listening(s);
3205
3206 if (SERVICE(other)->state == SERVICE_RUNNING)
3207 socket_set_state(s, SOCKET_RUNNING);
3208 }
3209
3210 static int socket_kill(Unit *u, KillWho who, int signo, sd_bus_error *error) {
3211 return unit_kill_common(u, who, signo, -1, SOCKET(u)->control_pid, error);
3212 }
3213
3214 static int socket_get_timeout(Unit *u, usec_t *timeout) {
3215 Socket *s = SOCKET(u);
3216 usec_t t;
3217 int r;
3218
3219 if (!s->timer_event_source)
3220 return 0;
3221
3222 r = sd_event_source_get_time(s->timer_event_source, &t);
3223 if (r < 0)
3224 return r;
3225 if (t == USEC_INFINITY)
3226 return 0;
3227
3228 *timeout = t;
3229 return 1;
3230 }
3231
3232 char *socket_fdname(Socket *s) {
3233 assert(s);
3234
3235 /* Returns the name to use for $LISTEN_NAMES. If the user
3236 * didn't specify anything specifically, use the socket unit's
3237 * name as fallback. */
3238
3239 return s->fdname ?: UNIT(s)->id;
3240 }
3241
3242 static int socket_control_pid(Unit *u) {
3243 Socket *s = SOCKET(u);
3244
3245 assert(s);
3246
3247 return s->control_pid;
3248 }
3249
/* String names of the SocketExecCommand values. These strings are what
 * socket_serialize() writes under the "control-command" key and what
 * socket_deserialize_item() parses back. */
static const char* const socket_exec_command_table[_SOCKET_EXEC_COMMAND_MAX] = {
        [SOCKET_EXEC_START_PRE] = "ExecStartPre",
        [SOCKET_EXEC_START_CHOWN] = "ExecStartChown",
        [SOCKET_EXEC_START_POST] = "ExecStartPost",
        [SOCKET_EXEC_STOP_PRE] = "ExecStopPre",
        [SOCKET_EXEC_STOP_POST] = "ExecStopPost"
};

/* Provides the socket_exec_command_to_string()/_from_string() helpers used in this file. */
DEFINE_STRING_TABLE_LOOKUP(socket_exec_command, SocketExecCommand);
3259
/* String names of the SocketResult values. These strings are what
 * socket_serialize() writes under the "result" key and what
 * socket_deserialize_item() parses back. */
static const char* const socket_result_table[_SOCKET_RESULT_MAX] = {
        [SOCKET_SUCCESS] = "success",
        [SOCKET_FAILURE_RESOURCES] = "resources",
        [SOCKET_FAILURE_TIMEOUT] = "timeout",
        [SOCKET_FAILURE_EXIT_CODE] = "exit-code",
        [SOCKET_FAILURE_SIGNAL] = "signal",
        [SOCKET_FAILURE_CORE_DUMP] = "core-dump",
        [SOCKET_FAILURE_START_LIMIT_HIT] = "start-limit-hit",
        [SOCKET_FAILURE_TRIGGER_LIMIT_HIT] = "trigger-limit-hit",
        [SOCKET_FAILURE_SERVICE_START_LIMIT_HIT] = "service-start-limit-hit"
};

/* Provides the socket_result_to_string()/_from_string() helpers used in this file. */
DEFINE_STRING_TABLE_LOOKUP(socket_result, SocketResult);
3273
/* Unit vtable for socket units: records the size of Socket and the offsets of
 * its embedded contexts, names the configuration sections, and wires up the
 * hook functions implemented in this file together with the D-Bus property
 * handlers and the status messages for finished start/stop jobs. */
const UnitVTable socket_vtable = {
        .object_size = sizeof(Socket),
        .exec_context_offset = offsetof(Socket, exec_context),
        .cgroup_context_offset = offsetof(Socket, cgroup_context),
        .kill_context_offset = offsetof(Socket, kill_context),
        .exec_runtime_offset = offsetof(Socket, exec_runtime),
        .dynamic_creds_offset = offsetof(Socket, dynamic_creds),

        /* NUL-separated list of section names. */
        .sections =
                "Unit\0"
                "Socket\0"
                "Install\0",
        .private_section = "Socket",

        .can_transient = true,

        .init = socket_init,
        .done = socket_done,
        .load = socket_load,

        .coldplug = socket_coldplug,

        .dump = socket_dump,

        .start = socket_start,
        .stop = socket_stop,

        .kill = socket_kill,

        .get_timeout = socket_get_timeout,

        .serialize = socket_serialize,
        .deserialize_item = socket_deserialize_item,
        .distribute_fds = socket_distribute_fds,

        .active_state = socket_active_state,
        .sub_state_to_string = socket_sub_state_to_string,

        .may_gc = socket_may_gc,

        .sigchld_event = socket_sigchld_event,

        .trigger_notify = socket_trigger_notify,

        .reset_failed = socket_reset_failed,

        .control_pid = socket_control_pid,

        .bus_vtable = bus_socket_vtable,
        .bus_set_property = bus_socket_set_property,
        .bus_commit_properties = bus_socket_commit_properties,

        .status_message_formats = {
                /*.starting_stopping = {
                        [0] = "Starting socket %s...",
                        [1] = "Stopping socket %s...",
                },*/
                .finished_start_job = {
                        [JOB_DONE] = "Listening on %s.",
                        [JOB_FAILED] = "Failed to listen on %s.",
                        [JOB_TIMEOUT] = "Timed out starting %s.",
                },
                .finished_stop_job = {
                        [JOB_DONE] = "Closed %s.",
                        [JOB_FAILED] = "Failed stopping %s.",
                        [JOB_TIMEOUT] = "Timed out stopping %s.",
                },
        },
};