1 /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/
4 This file is part of systemd.
6 Copyright 2011 Lennart Poettering
8 systemd is free software; you can redistribute it and/or modify it
9 under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 2 of the License, or
11 (at your option) any later version.
13 systemd is distributed in the hope that it will be useful, but
14 WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with systemd; If not, see <http://www.gnu.org/licenses/>.
22 #include <sys/epoll.h>
23 #include <sys/socket.h>
25 #include <sys/signalfd.h>
29 #include <acl/libacl.h>
31 #include <sys/ioctl.h>
32 #include <linux/sockios.h>
33 #include <sys/statvfs.h>
35 #include <systemd/sd-journal.h>
36 #include <systemd/sd-login.h>
37 #include <systemd/sd-messages.h>
38 #include <systemd/sd-daemon.h>
41 #include "journal-file.h"
42 #include "socket-util.h"
44 #include "cgroup-util.h"
46 #include "journal-rate-limit.h"
47 #include "journal-internal.h"
48 #include "conf-parser.h"
51 #define USER_JOURNALS_MAX 1024
52 #define STDOUT_STREAMS_MAX 4096
54 #define DEFAULT_RATE_LIMIT_INTERVAL (10*USEC_PER_SEC)
55 #define DEFAULT_RATE_LIMIT_BURST 200
57 #define RECHECK_AVAILABLE_SPACE_USEC (30*USEC_PER_SEC)
59 #define RECHECK_VAR_AVAILABLE_USEC (30*USEC_PER_SEC)
61 #define SYSLOG_TIMEOUT_USEC (5*USEC_PER_SEC)
63 #define N_IOVEC_META_FIELDS 16
65 typedef enum StdoutStreamState
{
67 STDOUT_STREAM_PRIORITY
,
68 STDOUT_STREAM_PRIORITY_PREFIX
,
69 STDOUT_STREAM_FORWARD_TO_SYSLOG
,
70 STDOUT_STREAM_FORWARD_TO_KMSG
,
71 STDOUT_STREAM_FORWARD_TO_CONSOLE
,
77 StdoutStreamState state
;
85 bool priority_prefix
:1;
86 bool forward_to_syslog
:1;
87 bool forward_to_kmsg
:1;
88 bool forward_to_console
:1;
90 char buffer
[LINE_MAX
+1];
93 LIST_FIELDS(StdoutStream
, stdout_stream
);
96 static int server_flush_to_var(Server
*s
);
98 static uint64_t available_space(Server
*s
) {
103 uint64_t sum
= 0, avail
= 0, ss_avail
= 0;
109 ts
= now(CLOCK_MONOTONIC
);
111 if (s
->cached_available_space_timestamp
+ RECHECK_AVAILABLE_SPACE_USEC
> ts
)
112 return s
->cached_available_space
;
114 r
= sd_id128_get_machine(&machine
);
118 if (s
->system_journal
) {
119 f
= "/var/log/journal/";
120 m
= &s
->system_metrics
;
122 f
= "/run/log/journal/";
123 m
= &s
->runtime_metrics
;
128 p
= strappend(f
, sd_id128_to_string(machine
, ids
));
138 if (fstatvfs(dirfd(d
), &ss
) < 0)
143 struct dirent buf
, *de
;
146 k
= readdir_r(d
, &buf
, &de
);
155 if (!dirent_is_file_with_suffix(de
, ".journal"))
158 if (fstatat(dirfd(d
), de
->d_name
, &st
, AT_SYMLINK_NOFOLLOW
) < 0)
161 sum
+= (uint64_t) st
.st_blocks
* (uint64_t) st
.st_blksize
;
164 avail
= sum
>= m
->max_use
? 0 : m
->max_use
- sum
;
166 ss_avail
= ss
.f_bsize
* ss
.f_bavail
;
168 ss_avail
= ss_avail
< m
->keep_free
? 0 : ss_avail
- m
->keep_free
;
170 if (ss_avail
< avail
)
173 s
->cached_available_space
= avail
;
174 s
->cached_available_space_timestamp
= ts
;
182 static void fix_perms(JournalFile
*f
, uid_t uid
) {
185 acl_permset_t permset
;
190 r
= fchmod_and_fchown(f
->fd
, 0640, 0, 0);
192 log_warning("Failed to fix access mode/rights on %s, ignoring: %s", f
->path
, strerror(-r
));
197 acl
= acl_get_fd(f
->fd
);
199 log_warning("Failed to read ACL on %s, ignoring: %m", f
->path
);
203 r
= acl_find_uid(acl
, uid
, &entry
);
206 if (acl_create_entry(&acl
, &entry
) < 0 ||
207 acl_set_tag_type(entry
, ACL_USER
) < 0 ||
208 acl_set_qualifier(entry
, &uid
) < 0) {
209 log_warning("Failed to patch ACL on %s, ignoring: %m", f
->path
);
214 if (acl_get_permset(entry
, &permset
) < 0 ||
215 acl_add_perm(permset
, ACL_READ
) < 0 ||
216 acl_calc_mask(&acl
) < 0) {
217 log_warning("Failed to patch ACL on %s, ignoring: %m", f
->path
);
221 if (acl_set_fd(f
->fd
, acl
) < 0)
222 log_warning("Failed to set ACL on %s, ignoring: %m", f
->path
);
228 static JournalFile
* find_journal(Server
*s
, uid_t uid
) {
237 /* We split up user logs only on /var, not on /run. If the
238 * runtime file is open, we write to it exclusively, in order
239 * to guarantee proper order as soon as we flush /run to
240 * /var and close the runtime file. */
242 if (s
->runtime_journal
)
243 return s
->runtime_journal
;
246 return s
->system_journal
;
248 r
= sd_id128_get_machine(&machine
);
250 return s
->system_journal
;
252 f
= hashmap_get(s
->user_journals
, UINT32_TO_PTR(uid
));
256 if (asprintf(&p
, "/var/log/journal/%s/user-%lu.journal", sd_id128_to_string(machine
, ids
), (unsigned long) uid
) < 0)
257 return s
->system_journal
;
259 while (hashmap_size(s
->user_journals
) >= USER_JOURNALS_MAX
) {
260 /* Too many open? Then let's close one */
261 f
= hashmap_steal_first(s
->user_journals
);
263 journal_file_close(f
);
266 r
= journal_file_open(p
, O_RDWR
|O_CREAT
, 0640, s
->system_journal
, &f
);
270 return s
->system_journal
;
273 f
->metrics
= s
->system_metrics
;
274 f
->compress
= s
->compress
;
276 r
= hashmap_put(s
->user_journals
, UINT32_TO_PTR(uid
), f
);
278 journal_file_close(f
);
279 return s
->system_journal
;
285 static void server_rotate(Server
*s
) {
291 log_info("Rotating...");
293 if (s
->runtime_journal
) {
294 r
= journal_file_rotate(&s
->runtime_journal
);
296 log_error("Failed to rotate %s: %s", s
->runtime_journal
->path
, strerror(-r
));
299 if (s
->system_journal
) {
300 r
= journal_file_rotate(&s
->system_journal
);
302 log_error("Failed to rotate %s: %s", s
->system_journal
->path
, strerror(-r
));
305 HASHMAP_FOREACH_KEY(f
, k
, s
->user_journals
, i
) {
306 r
= journal_file_rotate(&f
);
308 log_error("Failed to rotate %s: %s", f
->path
, strerror(-r
));
310 hashmap_replace(s
->user_journals
, k
, f
);
314 static void server_vacuum(Server
*s
) {
320 log_info("Vacuuming...");
322 r
= sd_id128_get_machine(&machine
);
324 log_error("Failed to get machine ID: %s", strerror(-r
));
328 sd_id128_to_string(machine
, ids
);
330 if (s
->system_journal
) {
331 if (asprintf(&p
, "/var/log/journal/%s", ids
) < 0) {
332 log_error("Out of memory.");
336 r
= journal_directory_vacuum(p
, s
->system_metrics
.max_use
, s
->system_metrics
.keep_free
);
337 if (r
< 0 && r
!= -ENOENT
)
338 log_error("Failed to vacuum %s: %s", p
, strerror(-r
));
343 if (s
->runtime_journal
) {
344 if (asprintf(&p
, "/run/log/journal/%s", ids
) < 0) {
345 log_error("Out of memory.");
349 r
= journal_directory_vacuum(p
, s
->runtime_metrics
.max_use
, s
->runtime_metrics
.keep_free
);
350 if (r
< 0 && r
!= -ENOENT
)
351 log_error("Failed to vacuum %s: %s", p
, strerror(-r
));
355 s
->cached_available_space_timestamp
= 0;
358 static char *shortened_cgroup_path(pid_t pid
) {
360 char *process_path
, *init_path
, *path
;
364 r
= cg_get_by_pid(SYSTEMD_CGROUP_CONTROLLER
, pid
, &process_path
);
368 r
= cg_get_by_pid(SYSTEMD_CGROUP_CONTROLLER
, 1, &init_path
);
374 if (endswith(init_path
, "/system"))
375 init_path
[strlen(init_path
) - 7] = 0;
376 else if (streq(init_path
, "/"))
379 if (startswith(process_path
, init_path
)) {
382 p
= strdup(process_path
+ strlen(init_path
));
400 static void dispatch_message_real(Server
*s
,
401 struct iovec
*iovec
, unsigned n
, unsigned m
,
403 struct timeval
*tv
) {
405 char *pid
= NULL
, *uid
= NULL
, *gid
= NULL
,
406 *source_time
= NULL
, *boot_id
= NULL
, *machine_id
= NULL
,
407 *comm
= NULL
, *cmdline
= NULL
, *hostname
= NULL
,
408 *audit_session
= NULL
, *audit_loginuid
= NULL
,
409 *exe
= NULL
, *cgroup
= NULL
, *session
= NULL
,
410 *owner_uid
= NULL
, *unit
= NULL
;
416 uid_t loginuid
= 0, realuid
= 0;
418 bool vacuumed
= false;
423 assert(n
+ N_IOVEC_META_FIELDS
<= m
);
429 realuid
= ucred
->uid
;
431 if (asprintf(&pid
, "_PID=%lu", (unsigned long) ucred
->pid
) >= 0)
432 IOVEC_SET_STRING(iovec
[n
++], pid
);
434 if (asprintf(&uid
, "_UID=%lu", (unsigned long) ucred
->uid
) >= 0)
435 IOVEC_SET_STRING(iovec
[n
++], uid
);
437 if (asprintf(&gid
, "_GID=%lu", (unsigned long) ucred
->gid
) >= 0)
438 IOVEC_SET_STRING(iovec
[n
++], gid
);
440 r
= get_process_comm(ucred
->pid
, &t
);
442 comm
= strappend("_COMM=", t
);
446 IOVEC_SET_STRING(iovec
[n
++], comm
);
449 r
= get_process_exe(ucred
->pid
, &t
);
451 exe
= strappend("_EXE=", t
);
455 IOVEC_SET_STRING(iovec
[n
++], exe
);
458 r
= get_process_cmdline(ucred
->pid
, LINE_MAX
, false, &t
);
460 cmdline
= strappend("_CMDLINE=", t
);
464 IOVEC_SET_STRING(iovec
[n
++], cmdline
);
467 r
= audit_session_from_pid(ucred
->pid
, &audit
);
469 if (asprintf(&audit_session
, "_AUDIT_SESSION=%lu", (unsigned long) audit
) >= 0)
470 IOVEC_SET_STRING(iovec
[n
++], audit_session
);
472 r
= audit_loginuid_from_pid(ucred
->pid
, &loginuid
);
474 if (asprintf(&audit_loginuid
, "_AUDIT_LOGINUID=%lu", (unsigned long) loginuid
) >= 0)
475 IOVEC_SET_STRING(iovec
[n
++], audit_loginuid
);
477 t
= shortened_cgroup_path(ucred
->pid
);
479 cgroup
= strappend("_SYSTEMD_CGROUP=", t
);
483 IOVEC_SET_STRING(iovec
[n
++], cgroup
);
486 if (sd_pid_get_session(ucred
->pid
, &t
) >= 0) {
487 session
= strappend("_SYSTEMD_SESSION=", t
);
491 IOVEC_SET_STRING(iovec
[n
++], session
);
494 if (sd_pid_get_unit(ucred
->pid
, &t
) >= 0) {
495 unit
= strappend("_SYSTEMD_UNIT=", t
);
499 IOVEC_SET_STRING(iovec
[n
++], unit
);
502 if (sd_pid_get_owner_uid(ucred
->uid
, &owner
) >= 0)
503 if (asprintf(&owner_uid
, "_SYSTEMD_OWNER_UID=%lu", (unsigned long) owner
) >= 0)
504 IOVEC_SET_STRING(iovec
[n
++], owner_uid
);
508 if (asprintf(&source_time
, "_SOURCE_REALTIME_TIMESTAMP=%llu",
509 (unsigned long long) timeval_load(tv
)) >= 0)
510 IOVEC_SET_STRING(iovec
[n
++], source_time
);
513 /* Note that strictly speaking storing the boot id here is
514 * redundant since the entry includes this in-line
515 * anyway. However, we need this indexed, too. */
516 r
= sd_id128_get_boot(&id
);
518 if (asprintf(&boot_id
, "_BOOT_ID=%s", sd_id128_to_string(id
, idbuf
)) >= 0)
519 IOVEC_SET_STRING(iovec
[n
++], boot_id
);
521 r
= sd_id128_get_machine(&id
);
523 if (asprintf(&machine_id
, "_MACHINE_ID=%s", sd_id128_to_string(id
, idbuf
)) >= 0)
524 IOVEC_SET_STRING(iovec
[n
++], machine_id
);
526 t
= gethostname_malloc();
528 hostname
= strappend("_HOSTNAME=", t
);
531 IOVEC_SET_STRING(iovec
[n
++], hostname
);
536 server_flush_to_var(s
);
539 f
= find_journal(s
, realuid
== 0 ? 0 : loginuid
);
541 log_warning("Dropping message, as we can't find a place to store the data.");
543 r
= journal_file_append_entry(f
, NULL
, iovec
, n
, &s
->seqnum
, NULL
, NULL
);
545 if (r
== -E2BIG
&& !vacuumed
) {
546 log_info("Allocation limit reached.");
552 log_info("Retrying write.");
557 log_error("Failed to write entry, ignoring: %s", strerror(-r
));
571 free(audit_loginuid
);
578 static void driver_message(Server
*s
, sd_id128_t message_id
, const char *format
, ...) {
579 char mid
[11 + 32 + 1];
580 char buffer
[16 + LINE_MAX
+ 1];
581 struct iovec iovec
[N_IOVEC_META_FIELDS
+ 3];
589 IOVEC_SET_STRING(iovec
[n
++], "PRIORITY=5");
591 memcpy(buffer
, "MESSAGE=", 8);
592 va_start(ap
, format
);
593 vsnprintf(buffer
+ 8, sizeof(buffer
) - 8, format
, ap
);
595 char_array_0(buffer
);
596 IOVEC_SET_STRING(iovec
[n
++], buffer
);
598 snprintf(mid
, sizeof(mid
), "MESSAGE_ID=" SD_ID128_FORMAT_STR
, SD_ID128_FORMAT_VAL(message_id
));
600 IOVEC_SET_STRING(iovec
[n
++], mid
);
603 ucred
.pid
= getpid();
604 ucred
.uid
= getuid();
605 ucred
.gid
= getgid();
607 dispatch_message_real(s
, iovec
, n
, ELEMENTSOF(iovec
), &ucred
, NULL
);
610 static void dispatch_message(Server
*s
,
611 struct iovec
*iovec
, unsigned n
, unsigned m
,
616 char *path
= NULL
, *c
;
619 assert(iovec
|| n
== 0);
627 path
= shortened_cgroup_path(ucred
->pid
);
631 /* example: /user/lennart/3/foobar
632 * /system/dbus.service/foobar
634 * So let's cut off everything past the third /, since that is
635 * where user directories start */
637 c
= strchr(path
, '/');
639 c
= strchr(c
+1, '/');
641 c
= strchr(c
+1, '/');
647 rl
= journal_rate_limit_test(s
->rate_limit
, path
, priority
& LOG_PRIMASK
, available_space(s
));
654 /* Write a suppression message if we suppressed something */
656 driver_message(s
, SD_MESSAGE_JOURNAL_DROPPED
, "Suppressed %u messages from %s", rl
- 1, path
);
661 dispatch_message_real(s
, iovec
, n
, m
, ucred
, tv
);
664 static void forward_syslog_iovec(Server
*s
, const struct iovec
*iovec
, unsigned n_iovec
, struct ucred
*ucred
, struct timeval
*tv
) {
665 struct msghdr msghdr
;
666 struct cmsghdr
*cmsg
;
668 struct cmsghdr cmsghdr
;
669 uint8_t buf
[CMSG_SPACE(sizeof(struct ucred
))];
671 union sockaddr_union sa
;
678 msghdr
.msg_iov
= (struct iovec
*) iovec
;
679 msghdr
.msg_iovlen
= n_iovec
;
682 sa
.un
.sun_family
= AF_UNIX
;
683 strncpy(sa
.un
.sun_path
, "/run/systemd/syslog", sizeof(sa
.un
.sun_path
));
684 msghdr
.msg_name
= &sa
;
685 msghdr
.msg_namelen
= offsetof(union sockaddr_union
, un
.sun_path
) + strlen(sa
.un
.sun_path
);
689 msghdr
.msg_control
= &control
;
690 msghdr
.msg_controllen
= sizeof(control
);
692 cmsg
= CMSG_FIRSTHDR(&msghdr
);
693 cmsg
->cmsg_level
= SOL_SOCKET
;
694 cmsg
->cmsg_type
= SCM_CREDENTIALS
;
695 cmsg
->cmsg_len
= CMSG_LEN(sizeof(struct ucred
));
696 memcpy(CMSG_DATA(cmsg
), ucred
, sizeof(struct ucred
));
697 msghdr
.msg_controllen
= cmsg
->cmsg_len
;
700 /* Forward the syslog message we received via /dev/log to
701 * /run/systemd/syslog. Unfortunately we currently can't set
702 * the SO_TIMESTAMP auxiliary data, and hence we don't. */
704 if (sendmsg(s
->syslog_fd
, &msghdr
, MSG_NOSIGNAL
) >= 0)
707 if (ucred
&& errno
== ESRCH
) {
710 /* Hmm, presumably the sender process vanished
711 * by now, so let's fix it as good as we
716 memcpy(CMSG_DATA(cmsg
), &u
, sizeof(struct ucred
));
718 if (sendmsg(s
->syslog_fd
, &msghdr
, MSG_NOSIGNAL
) >= 0)
722 log_debug("Failed to forward syslog message: %m");
725 static void forward_syslog_raw(Server
*s
, const char *buffer
, struct ucred
*ucred
, struct timeval
*tv
) {
731 IOVEC_SET_STRING(iovec
, buffer
);
732 forward_syslog_iovec(s
, &iovec
, 1, ucred
, tv
);
735 static void forward_syslog(Server
*s
, int priority
, const char *tag
, const char *message
, struct ucred
*ucred
, struct timeval
*tv
) {
736 struct iovec iovec
[5];
737 char header_priority
[6], header_time
[64], header_pid
[16];
741 char *tag_buf
= NULL
;
744 assert(priority
>= 0);
745 assert(priority
<= 999);
748 /* First: priority field */
749 snprintf(header_priority
, sizeof(header_priority
), "<%i>", priority
);
750 char_array_0(header_priority
);
751 IOVEC_SET_STRING(iovec
[n
++], header_priority
);
753 /* Second: timestamp */
754 t
= tv
? tv
->tv_sec
: ((time_t) (now(CLOCK_REALTIME
) / USEC_PER_SEC
));
758 if (strftime(header_time
, sizeof(header_time
), "%h %e %T ", tm
) <= 0)
760 IOVEC_SET_STRING(iovec
[n
++], header_time
);
762 /* Third: tag and PID */
765 get_process_comm(ucred
->pid
, &tag_buf
);
769 snprintf(header_pid
, sizeof(header_pid
), "[%lu]: ", (unsigned long) ucred
->pid
);
770 char_array_0(header_pid
);
773 IOVEC_SET_STRING(iovec
[n
++], tag
);
775 IOVEC_SET_STRING(iovec
[n
++], header_pid
);
777 IOVEC_SET_STRING(iovec
[n
++], tag
);
778 IOVEC_SET_STRING(iovec
[n
++], ": ");
781 /* Fourth: message */
782 IOVEC_SET_STRING(iovec
[n
++], message
);
784 forward_syslog_iovec(s
, iovec
, n
, ucred
, tv
);
789 static int fixup_priority(int priority
) {
791 if ((priority
& LOG_FACMASK
) == 0)
792 return (priority
& LOG_PRIMASK
) | LOG_USER
;
797 static void forward_kmsg(Server
*s
, int priority
, const char *tag
, const char *message
, struct ucred
*ucred
) {
798 struct iovec iovec
[5];
799 char header_priority
[6], header_pid
[16];
801 char *tag_buf
= NULL
;
805 assert(priority
>= 0);
806 assert(priority
<= 999);
809 /* Never allow messages with kernel facility to be written to
810 * kmsg, regardless where the data comes from. */
811 priority
= fixup_priority(priority
);
813 /* First: priority field */
814 snprintf(header_priority
, sizeof(header_priority
), "<%i>", priority
);
815 char_array_0(header_priority
);
816 IOVEC_SET_STRING(iovec
[n
++], header_priority
);
818 /* Second: tag and PID */
821 get_process_comm(ucred
->pid
, &tag_buf
);
825 snprintf(header_pid
, sizeof(header_pid
), "[%lu]: ", (unsigned long) ucred
->pid
);
826 char_array_0(header_pid
);
829 IOVEC_SET_STRING(iovec
[n
++], tag
);
831 IOVEC_SET_STRING(iovec
[n
++], header_pid
);
833 IOVEC_SET_STRING(iovec
[n
++], tag
);
834 IOVEC_SET_STRING(iovec
[n
++], ": ");
837 /* Fourth: message */
838 IOVEC_SET_STRING(iovec
[n
++], message
);
839 IOVEC_SET_STRING(iovec
[n
++], "\n");
841 fd
= open("/dev/kmsg", O_WRONLY
|O_NOCTTY
|O_CLOEXEC
);
843 log_debug("Failed to open /dev/kmsg for logging: %s", strerror(errno
));
847 if (writev(fd
, iovec
, n
) < 0)
848 log_debug("Failed to write to /dev/kmsg for logging: %s", strerror(errno
));
850 close_nointr_nofail(fd
);
856 static void forward_console(Server
*s
, const char *tag
, const char *message
, struct ucred
*ucred
) {
857 struct iovec iovec
[4];
860 char *tag_buf
= NULL
;
865 /* First: tag and PID */
868 get_process_comm(ucred
->pid
, &tag_buf
);
872 snprintf(header_pid
, sizeof(header_pid
), "[%lu]: ", (unsigned long) ucred
->pid
);
873 char_array_0(header_pid
);
876 IOVEC_SET_STRING(iovec
[n
++], tag
);
878 IOVEC_SET_STRING(iovec
[n
++], header_pid
);
880 IOVEC_SET_STRING(iovec
[n
++], tag
);
881 IOVEC_SET_STRING(iovec
[n
++], ": ");
885 IOVEC_SET_STRING(iovec
[n
++], message
);
886 IOVEC_SET_STRING(iovec
[n
++], "\n");
888 fd
= open_terminal("/dev/console", O_WRONLY
|O_NOCTTY
|O_CLOEXEC
);
890 log_debug("Failed to open /dev/console for logging: %s", strerror(errno
));
894 if (writev(fd
, iovec
, n
) < 0)
895 log_debug("Failed to write to /dev/console for logging: %s", strerror(errno
));
897 close_nointr_nofail(fd
);
903 static void read_tag(const char **buf
, char **tag
) {
913 p
+= strspn(p
, WHITESPACE
);
914 l
= strcspn(p
, WHITESPACE
);
945 *buf
+= strspn(*buf
, WHITESPACE
);
948 static void process_syslog_message(Server
*s
, const char *buf
, struct ucred
*ucred
, struct timeval
*tv
) {
949 char *message
= NULL
, *syslog_priority
= NULL
, *syslog_facility
= NULL
, *syslog_tag
= NULL
;
950 struct iovec iovec
[N_IOVEC_META_FIELDS
+ 4];
952 int priority
= LOG_USER
| LOG_INFO
;
958 if (s
->forward_to_syslog
)
959 forward_syslog_raw(s
, buf
, ucred
, tv
);
961 parse_syslog_priority((char**) &buf
, &priority
);
962 skip_syslog_date((char**) &buf
);
963 read_tag(&buf
, &tag
);
965 if (s
->forward_to_kmsg
)
966 forward_kmsg(s
, priority
, tag
, buf
, ucred
);
968 if (s
->forward_to_console
)
969 forward_console(s
, tag
, buf
, ucred
);
971 if (asprintf(&syslog_priority
, "PRIORITY=%i", priority
& LOG_PRIMASK
) >= 0)
972 IOVEC_SET_STRING(iovec
[n
++], syslog_priority
);
974 if (priority
& LOG_FACMASK
)
975 if (asprintf(&syslog_facility
, "SYSLOG_FACILITY=%i", LOG_FAC(priority
)) >= 0)
976 IOVEC_SET_STRING(iovec
[n
++], syslog_facility
);
979 syslog_tag
= strappend("SYSLOG_TAG=", tag
);
981 IOVEC_SET_STRING(iovec
[n
++], syslog_tag
);
984 message
= strappend("MESSAGE=", buf
);
986 IOVEC_SET_STRING(iovec
[n
++], message
);
988 dispatch_message(s
, iovec
, n
, ELEMENTSOF(iovec
), ucred
, tv
, priority
);
992 free(syslog_priority
);
993 free(syslog_facility
);
997 static bool valid_user_field(const char *p
, size_t l
) {
1000 /* We kinda enforce POSIX syntax recommendations for
1001 environment variables here, but make a couple of additional
1004 http://pubs.opengroup.org/onlinepubs/000095399/basedefs/xbd_chap08.html */
1006 /* No empty field names */
1010 /* Don't allow names longer than 64 chars */
1014 /* Variables starting with an underscore are protected */
1018 /* Don't allow digits as first character */
1019 if (p
[0] >= '0' && p
[0] <= '9')
1022 /* Only allow A-Z0-9 and '_' */
1023 for (a
= p
; a
< p
+ l
; a
++)
1024 if (!((*a
>= 'A' && *a
<= 'Z') ||
1025 (*a
>= '0' && *a
<= '9') ||
1032 static void process_native_message(Server
*s
, const void *buffer
, size_t buffer_size
, struct ucred
*ucred
, struct timeval
*tv
) {
1033 struct iovec
*iovec
= NULL
;
1034 unsigned n
= 0, m
= 0, j
;
1037 int priority
= LOG_INFO
;
1038 char *tag
= NULL
, *message
= NULL
;
1041 assert(buffer
|| n
== 0);
1044 remaining
= buffer_size
;
1046 while (remaining
> 0) {
1049 e
= memchr(p
, '\n', remaining
);
1052 /* Trailing noise, let's ignore it, and flush what we collected */
1053 log_debug("Received message with trailing noise, ignoring.");
1058 /* Entry separator */
1059 dispatch_message(s
, iovec
, n
, m
, ucred
, tv
, priority
);
1061 priority
= LOG_INFO
;
1068 if (*p
== '.' || *p
== '#') {
1069 /* Ignore control commands for now, and
1071 remaining
-= (e
- p
) + 1;
1076 /* A property follows */
1078 if (n
+N_IOVEC_META_FIELDS
>= m
) {
1082 u
= MAX((n
+N_IOVEC_META_FIELDS
) * 2U, 4U);
1083 c
= realloc(iovec
, u
* sizeof(struct iovec
));
1085 log_error("Out of memory");
1093 q
= memchr(p
, '=', e
- p
);
1095 if (valid_user_field(p
, q
- p
)) {
1100 /* If the field name starts with an
1101 * underscore, skip the variable,
1102 * since that indicates a trusted
1104 iovec
[n
].iov_base
= (char*) p
;
1105 iovec
[n
].iov_len
= l
;
1108 /* We need to determine the priority
1109 * of this entry for the rate limiting
1112 memcmp(p
, "PRIORITY=", 9) == 0 &&
1113 p
[9] >= '0' && p
[9] <= '9')
1114 priority
= (priority
& LOG_FACMASK
) | (p
[9] - '0');
1117 memcmp(p
, "SYSLOG_FACILITY=", 16) == 0 &&
1118 p
[16] >= '0' && p
[16] <= '9')
1119 priority
= (priority
& LOG_PRIMASK
) | ((p
[16] - '0') << 3);
1122 memcmp(p
, "SYSLOG_FACILITY=", 16) == 0 &&
1123 p
[16] >= '0' && p
[16] <= '9' &&
1124 p
[17] >= '0' && p
[17] <= '9')
1125 priority
= (priority
& LOG_PRIMASK
) | (((p
[16] - '0')*10 + (p
[17] - '0')) << 3);
1128 memcmp(p
, "SYSLOG_TAG=", 11) == 0) {
1131 t
= strndup(p
+ 11, l
- 11);
1136 } else if (l
>= 8 &&
1137 memcmp(p
, "MESSAGE=", 8) == 0) {
1140 t
= strndup(p
+ 8, l
- 8);
1148 remaining
-= (e
- p
) + 1;
1155 if (remaining
< e
- p
+ 1 + sizeof(uint64_t) + 1) {
1156 log_debug("Failed to parse message, ignoring.");
1160 memcpy(&l
, e
+ 1, sizeof(uint64_t));
1163 if (remaining
< e
- p
+ 1 + sizeof(uint64_t) + l
+ 1 ||
1164 e
[1+sizeof(uint64_t)+l
] != '\n') {
1165 log_debug("Failed to parse message, ignoring.");
1169 k
= malloc((e
- p
) + 1 + l
);
1171 log_error("Out of memory");
1175 memcpy(k
, p
, e
- p
);
1177 memcpy(k
+ (e
- p
) + 1, e
+ 1 + sizeof(uint64_t), l
);
1179 if (valid_user_field(p
, e
- p
)) {
1180 iovec
[n
].iov_base
= k
;
1181 iovec
[n
].iov_len
= (e
- p
) + 1 + l
;
1186 remaining
-= (e
- p
) + 1 + sizeof(uint64_t) + l
+ 1;
1187 p
= e
+ 1 + sizeof(uint64_t) + l
+ 1;
1192 if (s
->forward_to_syslog
)
1193 forward_syslog(s
, priority
, tag
, message
, ucred
, tv
);
1195 if (s
->forward_to_kmsg
)
1196 forward_kmsg(s
, priority
, tag
, message
, ucred
);
1198 if (s
->forward_to_console
)
1199 forward_console(s
, tag
, message
, ucred
);
1202 dispatch_message(s
, iovec
, n
, m
, ucred
, tv
, priority
);
1204 for (j
= 0; j
< n
; j
++)
1205 if (iovec
[j
].iov_base
< buffer
||
1206 (const uint8_t*) iovec
[j
].iov_base
>= (const uint8_t*) buffer
+ buffer_size
)
1207 free(iovec
[j
].iov_base
);
1213 static int stdout_stream_log(StdoutStream
*s
, const char *p
) {
1214 struct iovec iovec
[N_IOVEC_META_FIELDS
+ 4];
1215 char *message
= NULL
, *syslog_priority
= NULL
, *syslog_facility
= NULL
, *syslog_tag
= NULL
;
1222 priority
= s
->priority
;
1224 if (s
->priority_prefix
)
1225 parse_syslog_priority((char**) &p
, &priority
);
1227 if (s
->forward_to_syslog
|| s
->server
->forward_to_syslog
)
1228 forward_syslog(s
->server
, fixup_priority(priority
), s
->tag
, p
, &s
->ucred
, NULL
);
1230 if (s
->forward_to_kmsg
|| s
->server
->forward_to_kmsg
)
1231 forward_kmsg(s
->server
, priority
, s
->tag
, p
, &s
->ucred
);
1233 if (s
->forward_to_console
|| s
->server
->forward_to_console
)
1234 forward_console(s
->server
, s
->tag
, p
, &s
->ucred
);
1236 if (asprintf(&syslog_priority
, "PRIORITY=%i", priority
& LOG_PRIMASK
) >= 0)
1237 IOVEC_SET_STRING(iovec
[n
++], syslog_priority
);
1239 if (priority
& LOG_FACMASK
)
1240 if (asprintf(&syslog_facility
, "SYSLOG_FACILITY=%i", LOG_FAC(priority
)) >= 0)
1241 IOVEC_SET_STRING(iovec
[n
++], syslog_facility
);
1244 syslog_tag
= strappend("SYSLOG_TAG=", s
->tag
);
1246 IOVEC_SET_STRING(iovec
[n
++], syslog_tag
);
1249 message
= strappend("MESSAGE=", p
);
1251 IOVEC_SET_STRING(iovec
[n
++], message
);
1253 dispatch_message(s
->server
, iovec
, n
, ELEMENTSOF(iovec
), &s
->ucred
, NULL
, priority
);
1256 free(syslog_priority
);
1257 free(syslog_facility
);
1263 static int stdout_stream_line(StdoutStream
*s
, char *p
) {
1273 case STDOUT_STREAM_TAG
:
1276 log_error("Out of memory");
1280 s
->state
= STDOUT_STREAM_PRIORITY
;
1283 case STDOUT_STREAM_PRIORITY
:
1284 r
= safe_atoi(p
, &s
->priority
);
1285 if (r
< 0 || s
->priority
<= 0 || s
->priority
>= 999) {
1286 log_warning("Failed to parse log priority line.");
1290 s
->state
= STDOUT_STREAM_PRIORITY_PREFIX
;
1293 case STDOUT_STREAM_PRIORITY_PREFIX
:
1294 r
= parse_boolean(p
);
1296 log_warning("Failed to parse priority prefix line.");
1300 s
->priority_prefix
= !!r
;
1301 s
->state
= STDOUT_STREAM_FORWARD_TO_SYSLOG
;
1304 case STDOUT_STREAM_FORWARD_TO_SYSLOG
:
1305 r
= parse_boolean(p
);
1307 log_warning("Failed to parse forward to syslog line.");
1311 s
->forward_to_syslog
= !!r
;
1312 s
->state
= STDOUT_STREAM_FORWARD_TO_KMSG
;
1315 case STDOUT_STREAM_FORWARD_TO_KMSG
:
1316 r
= parse_boolean(p
);
1318 log_warning("Failed to parse copy to kmsg line.");
1322 s
->forward_to_kmsg
= !!r
;
1323 s
->state
= STDOUT_STREAM_FORWARD_TO_CONSOLE
;
1326 case STDOUT_STREAM_FORWARD_TO_CONSOLE
:
1327 r
= parse_boolean(p
);
1329 log_warning("Failed to parse copy to console line.");
1333 s
->forward_to_console
= !!r
;
1334 s
->state
= STDOUT_STREAM_RUNNING
;
1337 case STDOUT_STREAM_RUNNING
:
1338 return stdout_stream_log(s
, p
);
1341 assert_not_reached("Unknown stream state");
1344 static int stdout_stream_scan(StdoutStream
*s
, bool force_flush
) {
1352 remaining
= s
->length
;
1357 end
= memchr(p
, '\n', remaining
);
1360 else if (remaining
>= sizeof(s
->buffer
) - 1) {
1361 end
= p
+ sizeof(s
->buffer
) - 1;
1362 skip
= sizeof(s
->buffer
) - 1;
1368 r
= stdout_stream_line(s
, p
);
1376 if (force_flush
&& remaining
> 0) {
1378 r
= stdout_stream_line(s
, p
);
1386 if (p
> s
->buffer
) {
1387 memmove(s
->buffer
, p
, remaining
);
1388 s
->length
= remaining
;
1394 static int stdout_stream_process(StdoutStream
*s
) {
1400 l
= read(s
->fd
, s
->buffer
+s
->length
, sizeof(s
->buffer
)-1-s
->length
);
1403 if (errno
== EAGAIN
)
1406 log_warning("Failed to read from stream: %m");
1411 r
= stdout_stream_scan(s
, true);
1419 r
= stdout_stream_scan(s
, false);
1427 static void stdout_stream_free(StdoutStream
*s
) {
1431 assert(s
->server
->n_stdout_streams
> 0);
1432 s
->server
->n_stdout_streams
--;
1433 LIST_REMOVE(StdoutStream
, stdout_stream
, s
->server
->stdout_streams
, s
);
1438 epoll_ctl(s
->server
->epoll_fd
, EPOLL_CTL_DEL
, s
->fd
, NULL
);
1440 close_nointr_nofail(s
->fd
);
1447 static int stdout_stream_new(Server
*s
) {
1448 StdoutStream
*stream
;
1451 struct epoll_event ev
;
1455 fd
= accept4(s
->stdout_fd
, NULL
, NULL
, SOCK_NONBLOCK
|SOCK_CLOEXEC
);
1457 if (errno
== EAGAIN
)
1460 log_error("Failed to accept stdout connection: %m");
1464 if (s
->n_stdout_streams
>= STDOUT_STREAMS_MAX
) {
1465 log_warning("Too many stdout streams, refusing connection.");
1466 close_nointr_nofail(fd
);
1470 stream
= new0(StdoutStream
, 1);
1472 log_error("Out of memory.");
1473 close_nointr_nofail(fd
);
1479 len
= sizeof(stream
->ucred
);
1480 if (getsockopt(fd
, SOL_SOCKET
, SO_PEERCRED
, &stream
->ucred
, &len
) < 0) {
1481 log_error("Failed to determine peer credentials: %m");
1486 if (shutdown(fd
, SHUT_WR
) < 0) {
1487 log_error("Failed to shutdown writing side of socket: %m");
1493 ev
.data
.ptr
= stream
;
1494 ev
.events
= EPOLLIN
;
1495 if (epoll_ctl(s
->epoll_fd
, EPOLL_CTL_ADD
, fd
, &ev
) < 0) {
1496 log_error("Failed to add stream to event loop: %m");
1502 LIST_PREPEND(StdoutStream
, stdout_stream
, s
->stdout_streams
, stream
);
1503 s
->n_stdout_streams
++;
1508 stdout_stream_free(stream
);
1512 static int system_journal_open(Server
*s
) {
1518 r
= sd_id128_get_machine(&machine
);
1522 sd_id128_to_string(machine
, ids
);
1524 if (!s
->system_journal
) {
1526 /* First try to create the machine path, but not the prefix */
1527 fn
= strappend("/var/log/journal/", ids
);
1530 (void) mkdir(fn
, 0755);
1533 /* Then create the system journal file */
1534 fn
= join("/var/log/journal/", ids
, "/system.journal", NULL
);
1538 r
= journal_file_open(fn
, O_RDWR
|O_CREAT
, 0640, NULL
, &s
->system_journal
);
1542 journal_default_metrics(&s
->system_metrics
, s
->system_journal
->fd
);
1544 s
->system_journal
->metrics
= s
->system_metrics
;
1545 s
->system_journal
->compress
= s
->compress
;
1547 fix_perms(s
->system_journal
, 0);
1550 if (r
!= -ENOENT
&& r
!= -EROFS
)
1551 log_warning("Failed to open system journal: %s", strerror(-r
));
1557 if (!s
->runtime_journal
) {
1559 fn
= join("/run/log/journal/", ids
, "/system.journal", NULL
);
1563 if (s
->system_journal
) {
1565 /* Try to open the runtime journal, but only
1566 * if it already exists, so that we can flush
1567 * it into the system journal */
1569 r
= journal_file_open(fn
, O_RDWR
, 0640, NULL
, &s
->runtime_journal
);
1574 log_warning("Failed to open runtime journal: %s", strerror(-r
));
1581 /* OK, we really need the runtime journal, so create
1582 * it if necessary. */
1584 (void) mkdir_parents(fn
, 0755);
1585 r
= journal_file_open(fn
, O_RDWR
|O_CREAT
, 0640, NULL
, &s
->runtime_journal
);
1589 log_error("Failed to open runtime journal: %s", strerror(-r
));
1594 if (s
->runtime_journal
) {
1595 journal_default_metrics(&s
->runtime_metrics
, s
->runtime_journal
->fd
);
1597 s
->runtime_journal
->metrics
= s
->runtime_metrics
;
1598 s
->runtime_journal
->compress
= s
->compress
;
1600 fix_perms(s
->runtime_journal
, 0);
1607 static int server_flush_to_var(Server
*s
) {
1608 char path
[] = "/run/log/journal/xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx";
1617 if (!s
->runtime_journal
)
1620 ts
= now(CLOCK_MONOTONIC
);
1621 if (s
->var_available_timestamp
+ RECHECK_VAR_AVAILABLE_USEC
> ts
)
1624 s
->var_available_timestamp
= ts
;
1626 system_journal_open(s
);
1628 if (!s
->system_journal
)
1631 r
= sd_id128_get_machine(&machine
);
1633 log_error("Failed to get machine id: %s", strerror(-r
));
1637 r
= sd_journal_open(&j
, SD_JOURNAL_RUNTIME_ONLY
);
1639 log_error("Failed to read runtime journal: %s", strerror(-r
));
1643 SD_JOURNAL_FOREACH(j
) {
1646 f
= j
->current_file
;
1647 assert(f
&& f
->current_offset
> 0);
1649 r
= journal_file_move_to_object(f
, OBJECT_ENTRY
, f
->current_offset
, &o
);
1651 log_error("Can't read entry: %s", strerror(-r
));
1655 r
= journal_file_copy_entry(f
, s
->system_journal
, o
, f
->current_offset
, NULL
, NULL
, NULL
);
1657 log_info("Allocation limit reached.");
1659 journal_file_post_change(s
->system_journal
);
1663 r
= journal_file_copy_entry(f
, s
->system_journal
, o
, f
->current_offset
, NULL
, NULL
, NULL
);
1667 log_error("Can't write entry: %s", strerror(-r
));
1673 journal_file_post_change(s
->system_journal
);
1675 journal_file_close(s
->runtime_journal
);
1676 s
->runtime_journal
= NULL
;
1679 sd_id128_to_string(machine
, path
+ 17);
1680 rm_rf(path
, false, true, false);
/* process_event: handle a single epoll event by comparing ev->data.fd with
 * the server's well-known file descriptors.
 *
 *   - s->signal_fd: read one struct signalfd_siginfo; SIGUSR1 triggers
 *     server_flush_to_var(), and a "Received SIG%s" debug message is logged.
 *   - s->native_fd / s->syslog_fd: query the pending datagram size with
 *     SIOCINQ, grow s->buffer if it is too small, receive the datagram with
 *     recvmsg(MSG_DONTWAIT), pick the sender credentials and the timestamp
 *     out of the control messages, and hand the payload to
 *     process_syslog_message() or process_native_message().
 *   - s->stdout_fd: accept a new stream via stdout_stream_new().
 *   - anything else: ev->data.ptr is taken to be a StdoutStream.
 *
 * Every branch rejects unexpected event masks with "Got invalid event from
 * epoll.".
 *
 * NOTE(review): return statements, loop headers and several declarations
 * are elided in this listing, so the return value convention is not
 * documented here. */
1686 static int process_event(Server
*s
, struct epoll_event
*ev
) {
1689 if (ev
->data
.fd
== s
->signal_fd
) {
1690 struct signalfd_siginfo sfsi
;
1693 if (ev
->events
!= EPOLLIN
) {
1694 log_info("Got invalid event from epoll.");
1698 n
= read(s
->signal_fd
, &sfsi
, sizeof(sfsi
));
/* Anything other than one complete siginfo record is handled specially. */
1699 if (n
!= sizeof(sfsi
)) {
1704 if (errno
== EINTR
|| errno
== EAGAIN
)
1710 if (sfsi
.ssi_signo
== SIGUSR1
) {
1711 server_flush_to_var(s
);
1715 log_debug("Received SIG%s", signal_to_string(sfsi
.ssi_signo
));
1718 } else if (ev
->data
.fd
== s
->native_fd
||
1719 ev
->data
.fd
== s
->syslog_fd
) {
1721 if (ev
->events
!= EPOLLIN
) {
1722 log_info("Got invalid event from epoll.");
1727 struct msghdr msghdr
;
1729 struct ucred
*ucred
= NULL
;
1730 struct timeval
*tv
= NULL
;
1731 struct cmsghdr
*cmsg
;
/* Control buffer with room for one credentials and one timestamp message. */
1733 struct cmsghdr cmsghdr
;
1734 uint8_t buf
[CMSG_SPACE(sizeof(struct ucred
)) +
1735 CMSG_SPACE(sizeof(struct timeval
))];
/* Ask the socket how many bytes the next datagram holds. */
1740 if (ioctl(ev
->data
.fd
, SIOCINQ
, &v
) < 0) {
1741 log_error("SIOCINQ failed: %m");
1748 if (s
->buffer_size
< (size_t) v
) {
/* Grow to at least LINE_MAX + v, or double the current size, whichever is
 * larger; one extra byte is allocated on top of that. */
1752 l
= MAX(LINE_MAX
+ (size_t) v
, s
->buffer_size
* 2);
1753 b
= realloc(s
->buffer
, l
+1);
1756 log_error("Couldn't increase buffer.");
1765 iovec
.iov_base
= s
->buffer
;
1766 iovec
.iov_len
= s
->buffer_size
;
1770 msghdr
.msg_iov
= &iovec
;
1771 msghdr
.msg_iovlen
= 1;
1772 msghdr
.msg_control
= &control
;
1773 msghdr
.msg_controllen
= sizeof(control
);
1775 n
= recvmsg(ev
->data
.fd
, &msghdr
, MSG_DONTWAIT
);
1778 if (errno
== EINTR
|| errno
== EAGAIN
)
1781 log_error("recvmsg() failed: %m");
/* Walk the ancillary data; only entries whose level, type and exact length
 * match are accepted. */
1785 for (cmsg
= CMSG_FIRSTHDR(&msghdr
); cmsg
; cmsg
= CMSG_NXTHDR(&msghdr
, cmsg
)) {
1787 if (cmsg
->cmsg_level
== SOL_SOCKET
&&
1788 cmsg
->cmsg_type
== SCM_CREDENTIALS
&&
1789 cmsg
->cmsg_len
== CMSG_LEN(sizeof(struct ucred
)))
1790 ucred
= (struct ucred
*) CMSG_DATA(cmsg
);
1791 else if (cmsg
->cmsg_level
== SOL_SOCKET
&&
1792 cmsg
->cmsg_type
== SO_TIMESTAMP
&&
1793 cmsg
->cmsg_len
== CMSG_LEN(sizeof(struct timeval
)))
1794 tv
= (struct timeval
*) CMSG_DATA(cmsg
);
1797 if (ev
->data
.fd
== s
->syslog_fd
) {
/* Look for the first newline within the n received bytes. */
1800 e
= memchr(s
->buffer
, '\n', n
);
1806 process_syslog_message(s
, strstrip(s
->buffer
), ucred
, tv
);
1808 process_native_message(s
, s
->buffer
, n
, ucred
, tv
);
1813 } else if (ev
->data
.fd
== s
->stdout_fd
) {
1815 if (ev
->events
!= EPOLLIN
) {
1816 log_info("Got invalid event from epoll.");
1820 stdout_stream_new(s
);
1824 StdoutStream
*stream
;
/* Only EPOLLIN and EPOLLHUP bits may be set for stream fds. */
1826 if ((ev
->events
|EPOLLIN
|EPOLLHUP
) != (EPOLLIN
|EPOLLHUP
)) {
1827 log_info("Got invalid event from epoll.");
1831 /* If it is none of the well-known fds, it must be an
1832 * stdout stream fd. Note that this is a bit ugly here
1833 * (since we rely that none of the well-known fds
1834 * could be interpreted as pointer), but nonetheless
1835 * safe, since the well-known fds would never get an
1836 * fd > 4096, i.e. beyond the first memory page */
1838 stream
= ev
->data
.ptr
;
/* A result of zero or less from the stream processor releases the stream. */
1840 if (stdout_stream_process(stream
) <= 0)
1841 stdout_stream_free(stream
);
1846 log_error("Unknown event.");
/* open_syslog_socket: prepare the /dev/log datagram socket and register it
 * with the server's epoll instance.
 *
 * When s->syslog_fd is negative a new AF_UNIX, SOCK_DGRAM|SOCK_CLOEXEC
 * socket is created, any existing /dev/log node is unlinked, the socket is
 * bound to that path and the node is chmod()ed to 0666.
 *
 * The function also enables SO_PASSCRED and SO_TIMESTAMP on the socket,
 * sets SO_SNDTIMEO from SYSLOG_TIMEOUT_USEC, and finally adds the fd to
 * s->epoll_fd for EPOLLIN.
 *
 * NOTE(review): closing braces and return statements are elided in this
 * listing, so it is not visible whether the socket options are applied only
 * to a freshly created socket or to an inherited one as well; the in-body
 * comment about the send timeout is also cut short here. Confirm against
 * the full file. */
1850 static int open_syslog_socket(Server
*s
) {
1851 union sockaddr_union sa
;
1853 struct epoll_event ev
;
1858 if (s
->syslog_fd
< 0) {
1860 s
->syslog_fd
= socket(AF_UNIX
, SOCK_DGRAM
|SOCK_CLOEXEC
, 0);
1861 if (s
->syslog_fd
< 0) {
1862 log_error("socket() failed: %m");
1867 sa
.un
.sun_family
= AF_UNIX
;
1868 strncpy(sa
.un
.sun_path
, "/dev/log", sizeof(sa
.un
.sun_path
));
1870 unlink(sa
.un
.sun_path
);
1872 r
= bind(s
->syslog_fd
, &sa
.sa
, offsetof(union sockaddr_union
, un
.sun_path
) + strlen(sa
.un
.sun_path
));
1874 log_error("bind() failed: %m");
1878 chmod(sa
.un
.sun_path
, 0666);
1882 r
= setsockopt(s
->syslog_fd
, SOL_SOCKET
, SO_PASSCRED
, &one
, sizeof(one
));
1884 log_error("SO_PASSCRED failed: %m");
1889 r
= setsockopt(s
->syslog_fd
, SOL_SOCKET
, SO_TIMESTAMP
, &one
, sizeof(one
));
1891 log_error("SO_TIMESTAMP failed: %m");
1895 /* Since we use the same socket for forwarding this to some
1896 * other syslog implementation, make sure we don't hang
1898 timeval_store(&tv
, SYSLOG_TIMEOUT_USEC
);
1899 if (setsockopt(s
->syslog_fd
, SOL_SOCKET
, SO_SNDTIMEO
, &tv
, sizeof(tv
)) < 0) {
1900 log_error("SO_SNDTIMEO failed: %m");
1905 ev
.events
= EPOLLIN
;
1906 ev
.data
.fd
= s
->syslog_fd
;
1907 if (epoll_ctl(s
->epoll_fd
, EPOLL_CTL_ADD
, s
->syslog_fd
, &ev
) < 0) {
1908 log_error("Failed to add syslog server fd to epoll object: %m");
/* open_native_socket: prepare the datagram socket for the native journal
 * protocol and register it with the server's epoll instance.
 *
 * When s->native_fd is negative a new AF_UNIX, SOCK_DGRAM|SOCK_CLOEXEC
 * socket is created, any existing /run/systemd/journal node is unlinked,
 * the socket is bound to that path and the node is chmod()ed to 0666.
 *
 * SO_PASSCRED and SO_TIMESTAMP are enabled so that received datagrams carry
 * sender credentials and a receive timestamp as control messages, and the
 * fd is added to s->epoll_fd for EPOLLIN.
 *
 * NOTE(review): closing braces and return statements are elided in this
 * listing; the error paths presumably return a negative errno value. */
1915 static int open_native_socket(Server
*s
) {
1916 union sockaddr_union sa
;
1918 struct epoll_event ev
;
1922 if (s
->native_fd
< 0) {
1924 s
->native_fd
= socket(AF_UNIX
, SOCK_DGRAM
|SOCK_CLOEXEC
, 0);
1925 if (s
->native_fd
< 0) {
1926 log_error("socket() failed: %m");
1931 sa
.un
.sun_family
= AF_UNIX
;
1932 strncpy(sa
.un
.sun_path
, "/run/systemd/journal", sizeof(sa
.un
.sun_path
));
/* Remove a stale socket node so that bind() does not fail on it. */
1934 unlink(sa
.un
.sun_path
);
/* Address length covers the header plus the path without its terminator. */
1936 r
= bind(s
->native_fd
, &sa
.sa
, offsetof(union sockaddr_union
, un
.sun_path
) + strlen(sa
.un
.sun_path
));
1938 log_error("bind() failed: %m");
1942 chmod(sa
.un
.sun_path
, 0666);
1946 r
= setsockopt(s
->native_fd
, SOL_SOCKET
, SO_PASSCRED
, &one
, sizeof(one
));
1948 log_error("SO_PASSCRED failed: %m");
1953 r
= setsockopt(s
->native_fd
, SOL_SOCKET
, SO_TIMESTAMP
, &one
, sizeof(one
));
1955 log_error("SO_TIMESTAMP failed: %m");
1960 ev
.events
= EPOLLIN
;
1961 ev
.data
.fd
= s
->native_fd
;
1962 if (epoll_ctl(s
->epoll_fd
, EPOLL_CTL_ADD
, s
->native_fd
, &ev
) < 0) {
1963 log_error("Failed to add native server fd to epoll object: %m");
1970 static int open_stdout_socket(Server
*s
) {
1971 union sockaddr_union sa
;
1973 struct epoll_event ev
;
1977 if (s
->stdout_fd
< 0) {
1979 s
->stdout_fd
= socket(AF_UNIX
, SOCK_STREAM
|SOCK_CLOEXEC
, 0);
1980 if (s
->stdout_fd
< 0) {
1981 log_error("socket() failed: %m");
1986 sa
.un
.sun_family
= AF_UNIX
;
1987 strncpy(sa
.un
.sun_path
, "/run/systemd/stdout", sizeof(sa
.un
.sun_path
));
1989 unlink(sa
.un
.sun_path
);
1991 r
= bind(s
->stdout_fd
, &sa
.sa
, offsetof(union sockaddr_union
, un
.sun_path
) + strlen(sa
.un
.sun_path
));
1993 log_error("bind() failed: %m");
1997 chmod(sa
.un
.sun_path
, 0666);
1999 if (listen(s
->stdout_fd
, SOMAXCONN
) < 0) {
2000 log_error("liste() failed: %m");
2006 ev
.events
= EPOLLIN
;
2007 ev
.data
.fd
= s
->stdout_fd
;
2008 if (epoll_ctl(s
->epoll_fd
, EPOLL_CTL_ADD
, s
->stdout_fd
, &ev
) < 0) {
2009 log_error("Failed to add stdout server fd to epoll object: %m");
/* open_signalfd: route SIGINT, SIGTERM and SIGUSR1 through a signalfd that
 * is watched by the server's epoll instance.
 *
 * The process signal mask is replaced (SIG_SETMASK) by a set holding exactly
 * those three signals, a non-blocking, close-on-exec signalfd is created for
 * the same set and stored in s->signal_fd, and the fd is added to
 * s->epoll_fd for EPOLLIN.
 *
 * NOTE(review): declarations, closing braces and return statements are
 * elided in this listing; the error paths presumably return a negative
 * errno value. */
2016 static int open_signalfd(Server
*s
) {
2018 struct epoll_event ev
;
2022 assert_se(sigemptyset(&mask
) == 0);
/* The argument list is terminated by -1. */
2023 sigset_add_many(&mask
, SIGINT
, SIGTERM
, SIGUSR1
, -1);
2024 assert_se(sigprocmask(SIG_SETMASK
, &mask
, NULL
) == 0);
2026 s
->signal_fd
= signalfd(-1, &mask
, SFD_NONBLOCK
|SFD_CLOEXEC
);
2027 if (s
->signal_fd
< 0) {
2028 log_error("signalfd(): %m");
2033 ev
.events
= EPOLLIN
;
2034 ev
.data
.fd
= s
->signal_fd
;
2036 if (epoll_ctl(s
->epoll_fd
, EPOLL_CTL_ADD
, s
->signal_fd
, &ev
) < 0) {
2037 log_error("epoll_ctl(): %m");
/* server_parse_config_file: load /etc/systemd/systemd-journald.conf into
 * the server object.
 *
 * The file is opened with mode "re" and passed to config_parse() for the
 * "Journal" section, using the gperf-generated lookup table; s is handed
 * through as user data. A missing file (ENOENT) is distinguished from other
 * open failures, which are logged as warnings, as are parse failures.
 *
 * NOTE(review): declarations, return statements and the stream cleanup are
 * elided in this listing; presumably ENOENT is treated as success and the
 * stream is closed before returning. Confirm against the full file. */
2044 static int server_parse_config_file(Server
*s
) {
2051 fn
= "/etc/systemd/systemd-journald.conf";
2052 f
= fopen(fn
, "re");
2054 if (errno
== ENOENT
)
2057 log_warning("Failed to open configuration file %s: %m", fn
);
2061 r
= config_parse(fn
, f
, "Journal\0", config_item_perf_lookup
, (void*) journald_gperf_lookup
, false, s
);
2063 log_warning("Failed to parse configuration file: %s", strerror(-r
));
/* server_init: bring a Server object into its running state.
 *
 * Visible sequence:
 *   - mark all file descriptors as unset (-1);
 *   - install the default rate limit interval and burst and enable
 *     forwarding to syslog;
 *   - fill both metrics structures with 0xFF bytes;
 *   - read the configuration file (its result is not checked);
 *   - allocate the per-user journal hashmap and the epoll instance;
 *   - classify the file descriptors passed in by socket activation as
 *     native, stdout or /dev/log socket, rejecting duplicates and unknown
 *     sockets;
 *   - open the syslog, native and stdout sockets, the system journal and
 *     the signalfd;
 *   - create the rate limiter from the configured interval and burst.
 *
 * NOTE(review): the activation check for the native socket matches the path
 * "/run/systemd/native", whereas open_native_socket() binds
 * "/run/systemd/journal". One of the two is presumably wrong; verify which
 * path the socket unit and the clients use.
 *
 * NOTE(review): declarations, return statements and the assignments of the
 * passed fds are elided in this listing. */
2070 static int server_init(Server
*s
) {
2076 s
->syslog_fd
= s
->native_fd
= s
->stdout_fd
= s
->signal_fd
= s
->epoll_fd
= -1;
2079 s
->rate_limit_interval
= DEFAULT_RATE_LIMIT_INTERVAL
;
2080 s
->rate_limit_burst
= DEFAULT_RATE_LIMIT_BURST
;
2082 s
->forward_to_syslog
= true;
/* All bytes set to 0xFF; presumably the "not configured" marker for the
 * metrics fields - TODO confirm. */
2084 memset(&s
->system_metrics
, 0xFF, sizeof(s
->system_metrics
));
2085 memset(&s
->runtime_metrics
, 0xFF, sizeof(s
->runtime_metrics
));
2087 server_parse_config_file(s
);
2089 s
->user_journals
= hashmap_new(trivial_hash_func
, trivial_compare_func
);
2090 if (!s
->user_journals
) {
2091 log_error("Out of memory.");
2095 s
->epoll_fd
= epoll_create1(EPOLL_CLOEXEC
);
2096 if (s
->epoll_fd
< 0) {
2097 log_error("Failed to create epoll object: %m");
2101 n
= sd_listen_fds(true);
2103 log_error("Failed to read listening file descriptors from environment: %s", strerror(-n
));
/* Inspect each passed fd and sort it into one of the three socket slots. */
2107 for (fd
= SD_LISTEN_FDS_START
; fd
< SD_LISTEN_FDS_START
+ n
; fd
++) {
2109 if (sd_is_socket_unix(fd
, SOCK_DGRAM
, -1, "/run/systemd/native", 0) > 0) {
2111 if (s
->native_fd
>= 0) {
2112 log_error("Too many native sockets passed.");
2118 } else if (sd_is_socket_unix(fd
, SOCK_STREAM
, 1, "/run/systemd/stdout", 0) > 0) {
2120 if (s
->stdout_fd
>= 0) {
2121 log_error("Too many stdout sockets passed.");
2127 } else if (sd_is_socket_unix(fd
, SOCK_DGRAM
, -1, "/dev/log", 0) > 0) {
2129 if (s
->syslog_fd
>= 0) {
2130 log_error("Too many /dev/log sockets passed.");
2137 log_error("Unknown socket passed.");
2142 r
= open_syslog_socket(s
);
2146 r
= open_native_socket(s
);
2150 r
= open_stdout_socket(s
);
2154 r
= system_journal_open(s
);
2158 r
= open_signalfd(s
);
2162 s
->rate_limit
= journal_rate_limit_new(s
->rate_limit_interval
, s
->rate_limit_burst
);
/* server_done: release everything a Server object owns.
 *
 * Frees all stdout streams, closes the system and runtime journals if they
 * are open, closes every per-user journal and frees the hashmap that held
 * them, closes each of the five file descriptors that is set (>= 0), and
 * frees the rate limiter.
 *
 * NOTE(review): some lines are elided in this listing; the rate limiter
 * release may be guarded by a check that is not visible here. */
2169 static void server_done(Server
*s
) {
/* stdout_stream_free() is expected to unlink the stream from the list head,
 * otherwise this loop would not terminate - TODO confirm. */
2173 while (s
->stdout_streams
)
2174 stdout_stream_free(s
->stdout_streams
);
2176 if (s
->system_journal
)
2177 journal_file_close(s
->system_journal
);
2179 if (s
->runtime_journal
)
2180 journal_file_close(s
->runtime_journal
);
/* Drain the map entry by entry so each journal file gets closed. */
2182 while ((f
= hashmap_steal_first(s
->user_journals
)))
2183 journal_file_close(f
);
2185 hashmap_free(s
->user_journals
);
2187 if (s
->epoll_fd
>= 0)
2188 close_nointr_nofail(s
->epoll_fd
);
2190 if (s
->signal_fd
>= 0)
2191 close_nointr_nofail(s
->signal_fd
);
2193 if (s
->syslog_fd
>= 0)
2194 close_nointr_nofail(s
->syslog_fd
);
2196 if (s
->native_fd
>= 0)
2197 close_nointr_nofail(s
->native_fd
);
2199 if (s
->stdout_fd
>= 0)
2200 close_nointr_nofail(s
->stdout_fd
);
2203 journal_rate_limit_free(s
->rate_limit
);
/* main: entry point of the journal daemon.
 *
 * Rejects command line arguments, sets up logging to the console,
 * initialises the server, vacuums old journals and attempts a first flush
 * of the runtime journal, announces the start, and then waits on the epoll
 * instance one event at a time, passing each event to process_event().
 * After the loop it announces the stop, tears the server down with
 * server_done() and maps a negative result to EXIT_FAILURE.
 *
 * NOTE(review): the loop header, the exit conditions and the calls that
 * receive the "STATUS=..." strings are elided in this listing; the latter
 * are presumably sd_notify() calls. */
2208 int main(int argc
, char *argv
[]) {
2212 /* if (getppid() != 1) { */
2213 /* log_error("This program should be invoked by init only."); */
2214 /* return EXIT_FAILURE; */
2218 log_error("This program does not take arguments.");
2219 return EXIT_FAILURE
;
2222 log_set_target(LOG_TARGET_CONSOLE
);
2223 log_parse_environment();
2228 r
= server_init(&server
);
2232 server_vacuum(&server
);
2233 server_flush_to_var(&server
);
2235 log_debug("systemd-journald running as pid %lu", (unsigned long) getpid());
2236 driver_message(&server
, SD_MESSAGE_JOURNAL_START
, "Journal started");
2240 "STATUS=Processing requests...");
2243 struct epoll_event event
;
/* Block without timeout until exactly one event is available. */
2245 r
= epoll_wait(server
.epoll_fd
, &event
, 1, -1);
2251 log_error("epoll_wait() failed: %m");
2257 r
= process_event(&server
, &event
);
2264 log_debug("systemd-journald stopped as pid %lu", (unsigned long) getpid());
2265 driver_message(&server
, SD_MESSAGE_JOURNAL_STOP
, "Journal stopped");
2269 "STATUS=Shutting down...");
2271 server_done(&server
);
2273 return r
< 0 ? EXIT_FAILURE
: EXIT_SUCCESS
;