]> git.ipfire.org Git - thirdparty/systemd.git/blame - src/coredump/coredump.c
coredump: when reconstructing original kernel coredump context, chop off trailing...
[thirdparty/systemd.git] / src / coredump / coredump.c
CommitLineData
f5e04665
LP
/***
  This file is part of systemd.

  Copyright 2012 Lennart Poettering

  systemd is free software; you can redistribute it and/or modify it
  under the terms of the GNU Lesser General Public License as published by
  the Free Software Foundation; either version 2.1 of the License, or
  (at your option) any later version.

  systemd is distributed in the hope that it will be useful, but
  WITHOUT ANY WARRANTY; without even the implied warranty of
  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  Lesser General Public License for more details.

  You should have received a copy of the GNU Lesser General Public License
  along with systemd; If not, see <http://www.gnu.org/licenses/>.
***/
19
20#include <errno.h>
803a3464
LP
21#include <stdio.h>
22#include <sys/prctl.h>
cacd6403 23#include <sys/xattr.h>
4f5dd394 24#include <unistd.h>
f5e04665 25
4d229b31 26#ifdef HAVE_ELFUTILS
3c171f0b
LP
27#include <dwarf.h>
28#include <elfutils/libdwfl.h>
4d229b31
UTL
29#endif
30
73a99163 31#include "sd-daemon.h"
f11943c5
LP
32#include "sd-journal.h"
33#include "sd-login.h"
73a99163 34#include "sd-messages.h"
4f5dd394
LP
35
36#include "acl-util.h"
b5efdb8a 37#include "alloc-util.h"
430f0182 38#include "capability-util.h"
ba1261bc 39#include "cgroup-util.h"
4f5dd394 40#include "compress.h"
34c10968
LP
41#include "conf-parser.h"
42#include "copy.h"
f11943c5 43#include "coredump-vacuum.h"
a0956174 44#include "dirent-util.h"
4f5dd394 45#include "escape.h"
3ffd4af2 46#include "fd-util.h"
4f5dd394 47#include "fileio.h"
f4f15635 48#include "fs-util.h"
afc5dbf3 49#include "io-util.h"
b18453ed 50#include "journal-importer.h"
4f5dd394
LP
51#include "log.h"
52#include "macro.h"
0c773903 53#include "missing.h"
4f5dd394 54#include "mkdir.h"
6bedfcbb 55#include "parse-util.h"
0b452006 56#include "process-util.h"
d14bcb4e 57#include "signal-util.h"
3c171f0b 58#include "socket-util.h"
4f5dd394
LP
59#include "special.h"
60#include "stacktrace.h"
8b43440b 61#include "string-table.h"
07630cea 62#include "string-util.h"
4f5dd394 63#include "strv.h"
b1d4f8e1 64#include "user-util.h"
4f5dd394 65#include "util.h"
34727273 66
34c10968 67/* The maximum size up to which we process coredumps */
59f448cf 68#define PROCESS_SIZE_MAX ((uint64_t) (2LLU*1024LLU*1024LLU*1024LLU))
34c10968 69
bdfd7b2c 70/* The maximum size up to which we leave the coredump around on disk */
34c10968
LP
71#define EXTERNAL_SIZE_MAX PROCESS_SIZE_MAX
72
bdfd7b2c 73/* The maximum size up to which we store the coredump in the journal */
34c10968 74#define JOURNAL_SIZE_MAX ((size_t) (767LU*1024LU*1024LU))
f5e04665 75
c4aa09b0 76/* Make sure to not make this larger than the maximum journal entry
874bc134
ZJS
77 * size. See DATA_SIZE_MAX in journald-native.c. */
78assert_cc(JOURNAL_SIZE_MAX <= DATA_SIZE_MAX);
f5e04665
LP
79
/* Indexes into the per-coredump "context" string array. These identify the handful of special metadata
 * fields that are used for naming coredump files and for attaching xattrs to them. */
enum {
        CONTEXT_PID,
        CONTEXT_UID,
        CONTEXT_GID,
        CONTEXT_SIGNAL,
        CONTEXT_TIMESTAMP,
        CONTEXT_RLIMIT,
        CONTEXT_COMM,
        CONTEXT_EXE,
        _CONTEXT_MAX            /* number of entries, used for sizing arrays */
};
93
34c10968
LP
/* Where a coredump ends up: nowhere, in a file on disk, or embedded in the journal entry. */
typedef enum CoredumpStorage {
        COREDUMP_STORAGE_NONE,
        COREDUMP_STORAGE_EXTERNAL,
        COREDUMP_STORAGE_JOURNAL,
        _COREDUMP_STORAGE_MAX,                  /* number of valid values */
        _COREDUMP_STORAGE_INVALID = -1
} CoredumpStorage;
101
34c10968
LP
102static const char* const coredump_storage_table[_COREDUMP_STORAGE_MAX] = {
103 [COREDUMP_STORAGE_NONE] = "none",
104 [COREDUMP_STORAGE_EXTERNAL] = "external",
105 [COREDUMP_STORAGE_JOURNAL] = "journal",
34c10968
LP
106};
107
108DEFINE_PRIVATE_STRING_TABLE_LOOKUP(coredump_storage, CoredumpStorage);
8c9571d0 109static DEFINE_CONFIG_PARSE_ENUM(config_parse_coredump_storage, coredump_storage, CoredumpStorage, "Failed to parse storage setting");
34727273
ZJS
110
111static CoredumpStorage arg_storage = COREDUMP_STORAGE_EXTERNAL;
8c9571d0 112static bool arg_compress = true;
59f448cf
LP
113static uint64_t arg_process_size_max = PROCESS_SIZE_MAX;
114static uint64_t arg_external_size_max = EXTERNAL_SIZE_MAX;
6e2b4a69 115static uint64_t arg_journal_size_max = JOURNAL_SIZE_MAX;
59f448cf
LP
116static uint64_t arg_keep_free = (uint64_t) -1;
117static uint64_t arg_max_use = (uint64_t) -1;
34c10968
LP
118
119static int parse_config(void) {
34c10968 120 static const ConfigTableItem items[] = {
8c9571d0
LP
121 { "Coredump", "Storage", config_parse_coredump_storage, 0, &arg_storage },
122 { "Coredump", "Compress", config_parse_bool, 0, &arg_compress },
59f448cf
LP
123 { "Coredump", "ProcessSizeMax", config_parse_iec_uint64, 0, &arg_process_size_max },
124 { "Coredump", "ExternalSizeMax", config_parse_iec_uint64, 0, &arg_external_size_max },
8c9571d0 125 { "Coredump", "JournalSizeMax", config_parse_iec_size, 0, &arg_journal_size_max },
59f448cf
LP
126 { "Coredump", "KeepFree", config_parse_iec_uint64, 0, &arg_keep_free },
127 { "Coredump", "MaxUse", config_parse_iec_uint64, 0, &arg_max_use },
34c10968
LP
128 {}
129 };
130
43688c49 131 return config_parse_many_nulstr(PKGSYSCONFDIR "/coredump.conf",
75eb6154 132 CONF_PATHS_NULSTR("systemd/coredump.conf.d"),
301af7e4
JT
133 "Coredump\0",
134 config_item_table_lookup, items,
135 false, NULL);
34c10968
LP
136}
137
73a99163
ZJS
138static inline uint64_t storage_size_max(void) {
139 return arg_storage == COREDUMP_STORAGE_EXTERNAL ? arg_external_size_max : arg_journal_size_max;
140}
141
34c10968
LP
/* Adds an ACL_USER entry with ACL_READ for 'uid' to the file referred to by 'fd', so that regular users
 * can read (but not write or delete) their own coredumps. Nothing is done for UIDs up to SYSTEM_UID_MAX,
 * or if ACL support is compiled out. Returns 0 on success or if there was nothing to do, otherwise the
 * result of the respective log_*_errno() call. */
static int fix_acl(int fd, uid_t uid) {

#ifdef HAVE_ACL
        _cleanup_(acl_freep) acl_t acl = NULL;
        acl_entry_t entry;
        acl_permset_t permset;
        int r;

        assert(fd >= 0);

        /* No extra entry for system users */
        if (uid <= SYSTEM_UID_MAX)
                return 0;

        /* Start from the ACL the file currently carries */
        acl = acl_get_fd(fd);
        if (!acl)
                return log_error_errno(errno, "Failed to get ACL: %m");

        /* Append a new entry, and make it refer to the user in question */
        if (acl_create_entry(&acl, &entry) < 0)
                return log_error_errno(errno, "Failed to patch ACL: %m");
        if (acl_set_tag_type(entry, ACL_USER) < 0)
                return log_error_errno(errno, "Failed to patch ACL: %m");
        if (acl_set_qualifier(entry, &uid) < 0)
                return log_error_errno(errno, "Failed to patch ACL: %m");

        /* Grant read access through the new entry */
        if (acl_get_permset(entry, &permset) < 0)
                return log_warning_errno(errno, "Failed to patch ACL: %m");
        if (acl_add_perm(permset, ACL_READ) < 0)
                return log_warning_errno(errno, "Failed to patch ACL: %m");

        r = calc_acl_mask_if_needed(&acl);
        if (r < 0)
                return log_warning_errno(r, "Failed to patch ACL: %m");

        /* And write the patched ACL back */
        if (acl_set_fd(fd, acl) < 0)
                return log_error_errno(errno, "Failed to apply ACL: %m");
#endif

        return 0;
}
181
3c171f0b 182static int fix_xattr(int fd, const char *context[_CONTEXT_MAX]) {
0cd77f97 183
3c171f0b
LP
184 static const char * const xattrs[_CONTEXT_MAX] = {
185 [CONTEXT_PID] = "user.coredump.pid",
186 [CONTEXT_UID] = "user.coredump.uid",
187 [CONTEXT_GID] = "user.coredump.gid",
188 [CONTEXT_SIGNAL] = "user.coredump.signal",
189 [CONTEXT_TIMESTAMP] = "user.coredump.timestamp",
190 [CONTEXT_COMM] = "user.coredump.comm",
191 [CONTEXT_EXE] = "user.coredump.exe",
0cd77f97
LP
192 };
193
34c10968 194 int r = 0;
0cd77f97 195 unsigned i;
34c10968 196
b59233e6
LP
197 assert(fd >= 0);
198
1eef15b1 199 /* Attach some metadata to coredumps via extended
34c10968
LP
200 * attributes. Just because we can. */
201
3c171f0b 202 for (i = 0; i < _CONTEXT_MAX; i++) {
1eef15b1
ZJS
203 int k;
204
3c171f0b 205 if (isempty(context[i]) || !xattrs[i])
0cd77f97 206 continue;
34c10968 207
3c171f0b 208 k = fsetxattr(fd, xattrs[i], context[i], strlen(context[i]), XATTR_CREATE);
1eef15b1 209 if (k < 0 && r == 0)
34c10968 210 r = -errno;
0cd77f97 211 }
34c10968
LP
212
213 return r;
214}
215
b0b21dce 216#define filename_escape(s) xescape((s), "./ ")
34c10968 217
0c773903
EV
/* Returns 's' itself if it is non-NULL, and a printable placeholder string otherwise. Used when logging
 * the name of a temporary file that may not have one. */
static inline const char *coredump_tmpfile_name(const char *s) {
        if (s)
                return s;

        return "(unnamed temporary file)";
}
221
b59233e6
LP
222static int fix_permissions(
223 int fd,
224 const char *filename,
225 const char *target,
3c171f0b 226 const char *context[_CONTEXT_MAX],
b59233e6
LP
227 uid_t uid) {
228
03532f0a
LP
229 int r;
230
b59233e6 231 assert(fd >= 0);
b59233e6 232 assert(target);
3c171f0b 233 assert(context);
cfd652ed
ZJS
234
235 /* Ignore errors on these */
3c171f0b
LP
236 (void) fchmod(fd, 0640);
237 (void) fix_acl(fd, uid);
238 (void) fix_xattr(fd, context);
cfd652ed 239
4a62c710 240 if (fsync(fd) < 0)
0c773903 241 return log_error_errno(errno, "Failed to sync coredump %s: %m", coredump_tmpfile_name(filename));
cfd652ed 242
03532f0a
LP
243 r = link_tmpfile(fd, filename, target);
244 if (r < 0)
245 return log_error_errno(r, "Failed to move coredump %s into place: %m", target);
cfd652ed
ZJS
246
247 return 0;
248}
249
59f448cf 250static int maybe_remove_external_coredump(const char *filename, uint64_t size) {
cfd652ed 251
b59233e6 252 /* Returns 1 if might remove, 0 if will not remove, < 0 on error. */
cfd652ed 253
fc6cec86 254 if (arg_storage == COREDUMP_STORAGE_EXTERNAL &&
cfd652ed
ZJS
255 size <= arg_external_size_max)
256 return 0;
257
258 if (!filename)
259 return 1;
260
4a62c710
MS
261 if (unlink(filename) < 0 && errno != ENOENT)
262 return log_error_errno(errno, "Failed to unlink %s: %m", filename);
cfd652ed
ZJS
263
264 return 1;
265}
266
3c171f0b 267static int make_filename(const char *context[_CONTEXT_MAX], char **ret) {
b59233e6 268 _cleanup_free_ char *c = NULL, *u = NULL, *p = NULL, *t = NULL;
a7f7d1bd 269 sd_id128_t boot = {};
34c10968
LP
270 int r;
271
3c171f0b 272 assert(context);
34c10968 273
3c171f0b 274 c = filename_escape(context[CONTEXT_COMM]);
34c10968 275 if (!c)
b59233e6 276 return -ENOMEM;
34c10968 277
3c171f0b 278 u = filename_escape(context[CONTEXT_UID]);
0dc5d23c 279 if (!u)
b59233e6 280 return -ENOMEM;
34c10968
LP
281
282 r = sd_id128_get_boot(&boot);
b59233e6 283 if (r < 0)
34c10968 284 return r;
34c10968 285
3c171f0b 286 p = filename_escape(context[CONTEXT_PID]);
b59233e6
LP
287 if (!p)
288 return -ENOMEM;
289
3c171f0b 290 t = filename_escape(context[CONTEXT_TIMESTAMP]);
b59233e6
LP
291 if (!t)
292 return -ENOMEM;
293
294 if (asprintf(ret,
0dc5d23c 295 "/var/lib/systemd/coredump/core.%s.%s." SD_ID128_FORMAT_STR ".%s.%s000000",
34c10968 296 c,
0dc5d23c 297 u,
34c10968
LP
298 SD_ID128_FORMAT_VAL(boot),
299 p,
b59233e6
LP
300 t) < 0)
301 return -ENOMEM;
302
303 return 0;
304}
305
306static int save_external_coredump(
3c171f0b
LP
307 const char *context[_CONTEXT_MAX],
308 int input_fd,
b59233e6 309 char **ret_filename,
5f3e0a74
HW
310 int *ret_node_fd,
311 int *ret_data_fd,
59f448cf 312 uint64_t *ret_size) {
b59233e6
LP
313
314 _cleanup_free_ char *fn = NULL, *tmp = NULL;
315 _cleanup_close_ int fd = -1;
bdfd7b2c 316 uint64_t rlimit, max_size;
b59233e6 317 struct stat st;
3c171f0b 318 uid_t uid;
b59233e6
LP
319 int r;
320
3c171f0b 321 assert(context);
b59233e6 322 assert(ret_filename);
5f3e0a74
HW
323 assert(ret_node_fd);
324 assert(ret_data_fd);
b59233e6
LP
325 assert(ret_size);
326
3c171f0b
LP
327 r = parse_uid(context[CONTEXT_UID], &uid);
328 if (r < 0)
329 return log_error_errno(r, "Failed to parse UID: %m");
330
bdfd7b2c
LP
331 r = safe_atou64(context[CONTEXT_RLIMIT], &rlimit);
332 if (r < 0)
333 return log_error_errno(r, "Failed to parse resource limit: %s", context[CONTEXT_RLIMIT]);
6998b540
ZJS
334 if (rlimit < page_size()) {
335 /* Is coredumping disabled? Then don't bother saving/processing the coredump.
336 * Anything below PAGE_SIZE cannot give a readable coredump (the kernel uses
337 * ELF_EXEC_PAGESIZE which is not easily accessible, but is usually the same as PAGE_SIZE. */
73a99163
ZJS
338 log_info("Resource limits disable core dumping for process %s (%s).",
339 context[CONTEXT_PID], context[CONTEXT_COMM]);
bdfd7b2c
LP
340 return -EBADSLT;
341 }
342
343 /* Never store more than the process configured, or than we actually shall keep or process */
73a99163 344 max_size = MIN(rlimit, MAX(arg_process_size_max, storage_size_max()));
bdfd7b2c 345
3c171f0b 346 r = make_filename(context, &fn);
23bbb0de
MS
347 if (r < 0)
348 return log_error_errno(r, "Failed to determine coredump file name: %m");
34c10968 349
d2e54fae 350 mkdir_p_label("/var/lib/systemd/coredump", 0755);
803a3464 351
03532f0a 352 fd = open_tmpfile_linkable(fn, O_RDWR|O_CLOEXEC, &tmp);
4a62c710 353 if (fd < 0)
03532f0a 354 return log_error_errno(fd, "Failed to create temporary file for coredump %s: %m", fn);
803a3464 355
bdfd7b2c 356 r = copy_bytes(input_fd, fd, max_size, false);
73a99163
ZJS
357 if (r < 0) {
358 log_error_errno(r, "Cannot store coredump of %s (%s): %m", context[CONTEXT_PID], context[CONTEXT_COMM]);
93240d3a 359 goto fail;
73a99163
ZJS
360 } else if (r == 1)
361 log_struct(LOG_INFO,
362 LOG_MESSAGE("Core file was truncated to %zu bytes.", max_size),
363 "SIZE_LIMIT=%zu", max_size,
2b044526 364 "MESSAGE_ID=" SD_MESSAGE_TRUNCATED_CORE_STR,
73a99163 365 NULL);
803a3464 366
34c10968 367 if (fstat(fd, &st) < 0) {
73a99163 368 log_error_errno(errno, "Failed to fstat core file %s: %m", coredump_tmpfile_name(tmp));
34c10968
LP
369 goto fail;
370 }
371
7849c2ac 372 if (lseek(fd, 0, SEEK_SET) == (off_t) -1) {
0c773903 373 log_error_errno(errno, "Failed to seek on %s: %m", coredump_tmpfile_name(tmp));
b59233e6 374 goto fail;
7849c2ac
TA
375 }
376
d89c8fdf 377#if defined(HAVE_XZ) || defined(HAVE_LZ4)
cfd652ed 378 /* If we will remove the coredump anyway, do not compress. */
6e9ef603 379 if (arg_compress && !maybe_remove_external_coredump(NULL, st.st_size)) {
cfd652ed 380
b59233e6
LP
381 _cleanup_free_ char *fn_compressed = NULL, *tmp_compressed = NULL;
382 _cleanup_close_ int fd_compressed = -1;
cfd652ed 383
d89c8fdf 384 fn_compressed = strappend(fn, COMPRESSED_EXT);
b59233e6 385 if (!fn_compressed) {
d89c8fdf 386 log_oom();
cfd652ed
ZJS
387 goto uncompressed;
388 }
389
03532f0a
LP
390 fd_compressed = open_tmpfile_linkable(fn_compressed, O_RDWR|O_CLOEXEC, &tmp_compressed);
391 if (fd_compressed < 0) {
392 log_error_errno(fd_compressed, "Failed to create temporary file for coredump %s: %m", fn_compressed);
b59233e6 393 goto uncompressed;
03532f0a 394 }
cfd652ed 395
d89c8fdf 396 r = compress_stream(fd, fd_compressed, -1);
b59233e6 397 if (r < 0) {
0c773903 398 log_error_errno(r, "Failed to compress %s: %m", coredump_tmpfile_name(tmp_compressed));
b59233e6
LP
399 goto fail_compressed;
400 }
401
3c171f0b 402 r = fix_permissions(fd_compressed, tmp_compressed, fn_compressed, context, uid);
cfd652ed 403 if (r < 0)
b59233e6
LP
404 goto fail_compressed;
405
406 /* OK, this worked, we can get rid of the uncompressed version now */
0c773903
EV
407 if (tmp)
408 unlink_noerrno(tmp);
cfd652ed 409
59f448cf 410 *ret_filename = fn_compressed; /* compressed */
5f3e0a74
HW
411 *ret_node_fd = fd_compressed; /* compressed */
412 *ret_data_fd = fd; /* uncompressed */
59f448cf 413 *ret_size = (uint64_t) st.st_size; /* uncompressed */
cfd652ed 414
b59233e6 415 fn_compressed = NULL;
5f3e0a74 416 fd = fd_compressed = -1;
cfd652ed
ZJS
417
418 return 0;
419
b59233e6 420 fail_compressed:
0c773903
EV
421 if (tmp_compressed)
422 (void) unlink(tmp_compressed);
34c10968 423 }
cfd652ed
ZJS
424
425uncompressed:
3b1a55e1 426#endif
5f3e0a74 427
3c171f0b 428 r = fix_permissions(fd, tmp, fn, context, uid);
cfd652ed
ZJS
429 if (r < 0)
430 goto fail;
34c10968
LP
431
432 *ret_filename = fn;
5f3e0a74
HW
433 *ret_data_fd = fd;
434 *ret_node_fd = -1;
59f448cf 435 *ret_size = (uint64_t) st.st_size;
34c10968
LP
436
437 fn = NULL;
438 fd = -1;
439
440 return 0;
441
442fail:
0c773903
EV
443 if (tmp)
444 (void) unlink(tmp);
34c10968
LP
445 return r;
446}
447
448static int allocate_journal_field(int fd, size_t size, char **ret, size_t *ret_size) {
449 _cleanup_free_ char *field = NULL;
450 ssize_t n;
451
8d4e028f 452 assert(fd >= 0);
34c10968
LP
453 assert(ret);
454 assert(ret_size);
455
4a62c710
MS
456 if (lseek(fd, 0, SEEK_SET) == (off_t) -1)
457 return log_warning_errno(errno, "Failed to seek: %m");
803a3464 458
34c10968
LP
459 field = malloc(9 + size);
460 if (!field) {
cfd652ed 461 log_warning("Failed to allocate memory for coredump, coredump will not be stored.");
34c10968
LP
462 return -ENOMEM;
463 }
464
465 memcpy(field, "COREDUMP=", 9);
466
467 n = read(fd, field + 9, size);
23bbb0de
MS
468 if (n < 0)
469 return log_error_errno((int) n, "Failed to read core data: %m");
34c10968
LP
470 if ((size_t) n < size) {
471 log_error("Core data too short.");
472 return -EIO;
473 }
474
475 *ret = field;
476 *ret_size = size + 9;
477
478 field = NULL;
479
480 return 0;
481}
803a3464 482
3f132692
JF
483/* Joins /proc/[pid]/fd/ and /proc/[pid]/fdinfo/ into the following lines:
484 * 0:/dev/pts/23
485 * pos: 0
486 * flags: 0100002
487 *
488 * 1:/dev/pts/23
489 * pos: 0
490 * flags: 0100002
491 *
492 * 2:/dev/pts/23
493 * pos: 0
494 * flags: 0100002
495 * EOF
496 */
497static int compose_open_fds(pid_t pid, char **open_fds) {
4d84bc2f
LP
498 _cleanup_closedir_ DIR *proc_fd_dir = NULL;
499 _cleanup_close_ int proc_fdinfo_fd = -1;
500 _cleanup_free_ char *buffer = NULL;
3f132692 501 _cleanup_fclose_ FILE *stream = NULL;
59059b4a 502 const char *fddelim = "", *path;
3f132692 503 struct dirent *dent = NULL;
4d84bc2f 504 size_t size = 0;
3f132692
JF
505 int r = 0;
506
507 assert(pid >= 0);
508 assert(open_fds != NULL);
509
59059b4a 510 path = procfs_file_alloca(pid, "fd");
3f132692 511 proc_fd_dir = opendir(path);
59059b4a
ZJS
512 if (!proc_fd_dir)
513 return -errno;
3f132692 514
4d84bc2f 515 proc_fdinfo_fd = openat(dirfd(proc_fd_dir), "../fdinfo", O_DIRECTORY|O_NOFOLLOW|O_CLOEXEC|O_PATH);
59059b4a
ZJS
516 if (proc_fdinfo_fd < 0)
517 return -errno;
3f132692 518
4d84bc2f 519 stream = open_memstream(&buffer, &size);
3f132692
JF
520 if (!stream)
521 return -ENOMEM;
522
4d84bc2f 523 FOREACH_DIRENT(dent, proc_fd_dir, return -errno) {
3f132692 524 _cleanup_fclose_ FILE *fdinfo = NULL;
4d84bc2f 525 _cleanup_free_ char *fdname = NULL;
59059b4a 526 char line[LINE_MAX];
4d84bc2f 527 int fd;
3f132692 528
59059b4a 529 r = readlinkat_malloc(dirfd(proc_fd_dir), dent->d_name, &fdname);
3f132692
JF
530 if (r < 0)
531 return r;
532
533 fprintf(stream, "%s%s:%s\n", fddelim, dent->d_name, fdname);
534 fddelim = "\n";
535
536 /* Use the directory entry from /proc/[pid]/fd with /proc/[pid]/fdinfo */
59059b4a
ZJS
537 fd = openat(proc_fdinfo_fd, dent->d_name, O_NOFOLLOW|O_CLOEXEC|O_RDONLY);
538 if (fd < 0)
3f132692
JF
539 continue;
540
59059b4a
ZJS
541 fdinfo = fdopen(fd, "re");
542 if (fdinfo == NULL) {
543 close(fd);
3f132692 544 continue;
59059b4a 545 }
3f132692 546
4d84bc2f
LP
547 FOREACH_LINE(line, fdinfo, break) {
548 fputs(line, stream);
549 if (!endswith(line, "\n"))
550 fputc('\n', stream);
551 }
3f132692
JF
552 }
553
4d84bc2f 554 errno = 0;
74ca738f 555 stream = safe_fclose(stream);
4d84bc2f 556
b3267152 557 if (errno > 0)
4d84bc2f
LP
558 return -errno;
559
560 *open_fds = buffer;
561 buffer = NULL;
562
3f132692
JF
563 return 0;
564}
565
7ed03ce6
JF
566static int get_process_ns(pid_t pid, const char *namespace, ino_t *ns) {
567 const char *p;
568 struct stat stbuf;
569 _cleanup_close_ int proc_ns_dir_fd;
570
571 p = procfs_file_alloca(pid, "ns");
572
573 proc_ns_dir_fd = open(p, O_DIRECTORY | O_CLOEXEC | O_RDONLY);
574 if (proc_ns_dir_fd < 0)
575 return -errno;
576
577 if (fstatat(proc_ns_dir_fd, namespace, &stbuf, /* flags */0) < 0)
578 return -errno;
579
580 *ns = stbuf.st_ino;
581 return 0;
582}
583
/* Walks up the chain of parent processes of 'pid' until it finds the first ancestor whose "mnt"
 * namespace inode differs from the one of 'pid', and stores that ancestor's PID in *container_pid.
 * Returns 0 on success, -ENOENT if PID 1 is reached while the namespace is still the same, and a negative
 * error if a parent PID or namespace cannot be determined. */
static int get_mount_namespace_leader(pid_t pid, pid_t *container_pid) {
        pid_t current = pid, parent = 0;
        ino_t own_mntns, parent_mntns;
        int r;

        r = get_process_ns(pid, "mnt", &own_mntns);
        if (r < 0)
                return r;

        for (;;) {
                r = get_process_ppid(current, &parent);
                if (r < 0)
                        return r;

                r = get_process_ns(parent, "mnt", &parent_mntns);
                if (r < 0)
                        return r;

                /* The parent lives in a different mount namespace: that's the one we are looking for */
                if (own_mntns != parent_mntns) {
                        *container_pid = parent;
                        return 0;
                }

                /* Reached the top without ever leaving our namespace */
                if (parent == 1)
                        return -ENOENT;

                current = parent;
        }
}
616
617/* Returns 1 if the parent was found.
618 * Returns 0 if there is not a process we can call the pid's
619 * container parent (the pid's process isn't 'containerized').
620 * Returns a negative number on errors.
621 */
622static int get_process_container_parent_cmdline(pid_t pid, char** cmdline) {
623 int r = 0;
624 pid_t container_pid;
625 const char *proc_root_path;
626 struct stat root_stat, proc_root_stat;
627
628 /* To compare inodes of / and /proc/[pid]/root */
629 if (stat("/", &root_stat) < 0)
630 return -errno;
631
632 proc_root_path = procfs_file_alloca(pid, "root");
633 if (stat(proc_root_path, &proc_root_stat) < 0)
634 return -errno;
635
636 /* The process uses system root. */
637 if (proc_root_stat.st_ino == root_stat.st_ino) {
638 *cmdline = NULL;
639 return 0;
640 }
641
642 r = get_mount_namespace_leader(pid, &container_pid);
643 if (r < 0)
644 return r;
645
d3cba4ea
EV
646 r = get_process_cmdline(container_pid, 0, false, cmdline);
647 if (r < 0)
648 return r;
649
650 return 1;
7ed03ce6
JF
651}
652
3c171f0b
LP
653static int change_uid_gid(const char *context[]) {
654 uid_t uid;
655 gid_t gid;
656 int r;
34c10968 657
3c171f0b
LP
658 r = parse_uid(context[CONTEXT_UID], &uid);
659 if (r < 0)
660 return r;
8c8549db 661
888e378d
LP
662 if (uid <= SYSTEM_UID_MAX) {
663 const char *user = "systemd-coredump";
664
665 r = get_user_creds(&user, &uid, &gid, NULL, NULL);
666 if (r < 0) {
667 log_warning_errno(r, "Cannot resolve %s user. Proceeding to dump core as root: %m", user);
668 uid = gid = 0;
669 }
670 } else {
671 r = parse_gid(context[CONTEXT_GID], &gid);
672 if (r < 0)
673 return r;
674 }
3c171f0b
LP
675
676 return drop_privileges(uid, gid, 0);
677}
8c8549db 678
3c171f0b
LP
679static int submit_coredump(
680 const char *context[_CONTEXT_MAX],
681 struct iovec *iovec,
682 size_t n_iovec_allocated,
683 size_t n_iovec,
684 int input_fd) {
34c10968 685
5f3e0a74 686 _cleanup_close_ int coredump_fd = -1, coredump_node_fd = -1;
3c171f0b 687 _cleanup_free_ char *core_message = NULL, *filename = NULL, *coredump_data = NULL;
a5ca3649 688 uint64_t coredump_size = UINT64_MAX;
3c171f0b 689 int r;
f5e04665 690
3c171f0b
LP
691 assert(context);
692 assert(iovec);
693 assert(n_iovec_allocated >= n_iovec + 3);
694 assert(input_fd >= 0);
f5e04665 695
3c171f0b
LP
696 /* Vacuum before we write anything again */
697 (void) coredump_vacuum(-1, arg_keep_free, arg_max_use);
803a3464 698
3c171f0b
LP
699 /* Always stream the coredump to disk, if that's possible */
700 r = save_external_coredump(context, input_fd, &filename, &coredump_node_fd, &coredump_fd, &coredump_size);
701 if (r < 0)
702 /* Skip whole core dumping part */
703 goto log;
704
705 /* If we don't want to keep the coredump on disk, remove it now, as later on we will lack the privileges for
706 * it. However, we keep the fd to it, so that we can still process it and log it. */
707 r = maybe_remove_external_coredump(filename, coredump_size);
708 if (r < 0)
709 return r;
710 if (r == 0) {
711 const char *coredump_filename;
712
713 coredump_filename = strjoina("COREDUMP_FILENAME=", filename);
714 IOVEC_SET_STRING(iovec[n_iovec++], coredump_filename);
6e9ef603 715 } else if (arg_storage == COREDUMP_STORAGE_EXTERNAL)
5206a724 716 log_info("The core will not be stored: size %"PRIu64" is greater than %"PRIu64" (the configured maximum)",
6e9ef603 717 coredump_size, arg_external_size_max);
f5e04665 718
3c171f0b
LP
719 /* Vacuum again, but exclude the coredump we just created */
720 (void) coredump_vacuum(coredump_node_fd >= 0 ? coredump_node_fd : coredump_fd, arg_keep_free, arg_max_use);
8c9571d0 721
3c171f0b
LP
722 /* Now, let's drop privileges to become the user who owns the segfaulted process and allocate the coredump
723 * memory under the user's uid. This also ensures that the credentials journald will see are the ones of the
724 * coredumping user, thus making sure the user gets access to the core dump. Let's also get rid of all
725 * capabilities, if we run as root, we won't need them anymore. */
726 r = change_uid_gid(context);
727 if (r < 0)
728 return log_error_errno(r, "Failed to drop privileges: %m");
34c10968 729
3c171f0b
LP
730#ifdef HAVE_ELFUTILS
731 /* Try to get a strack trace if we can */
732 if (coredump_size <= arg_process_size_max) {
733 _cleanup_free_ char *stacktrace = NULL;
734
735 r = coredump_make_stack_trace(coredump_fd, context[CONTEXT_EXE], &stacktrace);
736 if (r >= 0)
605405c6
ZJS
737 core_message = strjoin("MESSAGE=Process ", context[CONTEXT_PID],
738 " (", context[CONTEXT_COMM], ") of user ",
739 context[CONTEXT_UID], " dumped core.\n\n",
740 stacktrace);
3c171f0b
LP
741 else if (r == -EINVAL)
742 log_warning("Failed to generate stack trace: %s", dwfl_errmsg(dwfl_errno()));
743 else
744 log_warning_errno(r, "Failed to generate stack trace: %m");
6e9ef603 745 } else
5206a724 746 log_debug("Not generating stack trace: core size %"PRIu64" is greater than %"PRIu64" (the configured maximum)",
6e9ef603 747 coredump_size, arg_process_size_max);
803a3464 748
3c171f0b
LP
749 if (!core_message)
750#endif
751log:
605405c6
ZJS
752 core_message = strjoin("MESSAGE=Process ", context[CONTEXT_PID], " (",
753 context[CONTEXT_COMM], ") of user ",
754 context[CONTEXT_UID], " dumped core.");
3c171f0b
LP
755 if (core_message)
756 IOVEC_SET_STRING(iovec[n_iovec++], core_message);
757
758 /* Optionally store the entire coredump in the journal */
6e9ef603
ZJS
759 if (arg_storage == COREDUMP_STORAGE_JOURNAL) {
760 if (coredump_size <= arg_journal_size_max) {
761 size_t sz = 0;
762
763 /* Store the coredump itself in the journal */
764
765 r = allocate_journal_field(coredump_fd, (size_t) coredump_size, &coredump_data, &sz);
766 if (r >= 0) {
767 iovec[n_iovec].iov_base = coredump_data;
768 iovec[n_iovec].iov_len = sz;
769 n_iovec++;
770 } else
771 log_warning_errno(r, "Failed to attach the core to the journal entry: %m");
772 } else
5206a724 773 log_info("The core will not be stored: size %"PRIu64" is greater than %"PRIu64" (the configured maximum)",
6e9ef603 774 coredump_size, arg_journal_size_max);
f5e04665
LP
775 }
776
3c171f0b
LP
777 assert(n_iovec <= n_iovec_allocated);
778
779 r = sd_journal_sendv(iovec, n_iovec);
780 if (r < 0)
781 return log_error_errno(r, "Failed to log coredump: %m");
782
783 return 0;
784}
785
786static void map_context_fields(const struct iovec *iovec, const char *context[]) {
787
788 static const char * const context_field_names[_CONTEXT_MAX] = {
789 [CONTEXT_PID] = "COREDUMP_PID=",
790 [CONTEXT_UID] = "COREDUMP_UID=",
791 [CONTEXT_GID] = "COREDUMP_GID=",
792 [CONTEXT_SIGNAL] = "COREDUMP_SIGNAL=",
793 [CONTEXT_TIMESTAMP] = "COREDUMP_TIMESTAMP=",
794 [CONTEXT_COMM] = "COREDUMP_COMM=",
795 [CONTEXT_EXE] = "COREDUMP_EXE=",
bdfd7b2c 796 [CONTEXT_RLIMIT] = "COREDUMP_RLIMIT=",
3c171f0b
LP
797 };
798
799 unsigned i;
800
801 assert(iovec);
802 assert(context);
803
804 for (i = 0; i < _CONTEXT_MAX; i++) {
805 size_t l;
806
807 l = strlen(context_field_names[i]);
808 if (iovec->iov_len < l)
809 continue;
810
811 if (memcmp(iovec->iov_base, context_field_names[i], l) != 0)
812 continue;
813
814 /* Note that these strings are NUL terminated, because we made sure that a trailing NUL byte is in the
815 * buffer, though not included in the iov_len count. (see below) */
816 context[i] = (char*) iovec->iov_base + l;
817 break;
818 }
819}
820
821static int process_socket(int fd) {
822 _cleanup_close_ int coredump_fd = -1;
823 struct iovec *iovec = NULL;
80002f66 824 size_t n_iovec = 0, n_allocated = 0, i, k;
3c171f0b
LP
825 const char *context[_CONTEXT_MAX] = {};
826 int r;
827
828 assert(fd >= 0);
829
830 log_set_target(LOG_TARGET_AUTO);
831 log_parse_environment();
832 log_open();
833
988e89ee
ZJS
834 log_debug("Processing coredump received on stdin...");
835
3c171f0b
LP
836 for (;;) {
837 union {
838 struct cmsghdr cmsghdr;
839 uint8_t buf[CMSG_SPACE(sizeof(int))];
840 } control = {};
841 struct msghdr mh = {
842 .msg_control = &control,
843 .msg_controllen = sizeof(control),
844 .msg_iovlen = 1,
845 };
846 ssize_t n;
fe1ef0f8 847 ssize_t l;
3c171f0b 848
5b45a160 849 if (!GREEDY_REALLOC(iovec, n_allocated, n_iovec + 3)) {
3c171f0b
LP
850 r = log_oom();
851 goto finish;
852 }
853
fe1ef0f8
EV
854 l = next_datagram_size_fd(fd);
855 if (l < 0) {
856 r = log_error_errno(l, "Failed to determine datagram size to read: %m");
3c171f0b
LP
857 goto finish;
858 }
859
860 assert(l >= 0);
861
862 iovec[n_iovec].iov_len = l;
863 iovec[n_iovec].iov_base = malloc(l + 1);
3c171f0b
LP
864 if (!iovec[n_iovec].iov_base) {
865 r = log_oom();
866 goto finish;
867 }
868
869 mh.msg_iov = iovec + n_iovec;
870
871 n = recvmsg(fd, &mh, MSG_NOSIGNAL|MSG_CMSG_CLOEXEC);
872 if (n < 0) {
873 free(iovec[n_iovec].iov_base);
874 r = log_error_errno(errno, "Failed to receive datagram: %m");
875 goto finish;
876 }
877
878 if (n == 0) {
879 struct cmsghdr *cmsg, *found = NULL;
880 /* The final zero-length datagram carries the file descriptor and tells us that we're done. */
881
882 free(iovec[n_iovec].iov_base);
883
884 CMSG_FOREACH(cmsg, &mh) {
885 if (cmsg->cmsg_level == SOL_SOCKET &&
886 cmsg->cmsg_type == SCM_RIGHTS &&
887 cmsg->cmsg_len == CMSG_LEN(sizeof(int))) {
888 assert(!found);
889 found = cmsg;
890 }
891 }
892
893 if (!found) {
894 log_error("Coredump file descriptor missing.");
895 r = -EBADMSG;
896 goto finish;
897 }
898
899 assert(coredump_fd < 0);
900 coredump_fd = *(int*) CMSG_DATA(found);
901 break;
902 }
903
904 /* Add trailing NUL byte, in case these are strings */
905 ((char*) iovec[n_iovec].iov_base)[n] = 0;
906 iovec[n_iovec].iov_len = (size_t) n;
907
908 cmsg_close_all(&mh);
909 map_context_fields(iovec + n_iovec, context);
910 n_iovec++;
911 }
912
5b45a160 913 if (!GREEDY_REALLOC(iovec, n_allocated, n_iovec + 3)) {
3c171f0b 914 r = log_oom();
34c10968
LP
915 goto finish;
916 }
917
61233823 918 /* Make sure we got all data we really need */
3c171f0b
LP
919 assert(context[CONTEXT_PID]);
920 assert(context[CONTEXT_UID]);
921 assert(context[CONTEXT_GID]);
922 assert(context[CONTEXT_SIGNAL]);
923 assert(context[CONTEXT_TIMESTAMP]);
bdfd7b2c 924 assert(context[CONTEXT_RLIMIT]);
3c171f0b
LP
925 assert(context[CONTEXT_COMM]);
926 assert(coredump_fd >= 0);
927
80002f66
LP
928 /* Small quirk: the journal fields contain the timestamp padded with six zeroes, so that the kernel-supplied 1s
929 * granularity timestamps becomes 1µs granularity, i.e. the granularity systemd usually operates in. Since we
930 * are reconstructing the original kernel context, we chop this off again, here. */
931 k = strlen(context[CONTEXT_TIMESTAMP]);
932 if (k > 6)
933 context[CONTEXT_TIMESTAMP] = strndupa(context[CONTEXT_TIMESTAMP], k - 6);
934
5b45a160 935 r = submit_coredump(context, iovec, n_allocated, n_iovec, coredump_fd);
3c171f0b
LP
936
937finish:
938 for (i = 0; i < n_iovec; i++)
939 free(iovec[i].iov_base);
940 free(iovec);
941
942 return r;
943}
944
945static int send_iovec(const struct iovec iovec[], size_t n_iovec, int input_fd) {
946
947 static const union sockaddr_union sa = {
948 .un.sun_family = AF_UNIX,
949 .un.sun_path = "/run/systemd/coredump",
950 };
951 _cleanup_close_ int fd = -1;
952 size_t i;
953 int r;
954
955 assert(iovec || n_iovec <= 0);
956 assert(input_fd >= 0);
957
958 fd = socket(AF_UNIX, SOCK_SEQPACKET|SOCK_CLOEXEC, 0);
959 if (fd < 0)
960 return log_error_errno(errno, "Failed to create coredump socket: %m");
961
fc2fffe7 962 if (connect(fd, &sa.sa, SOCKADDR_UN_LEN(sa.un)) < 0)
3c171f0b
LP
963 return log_error_errno(errno, "Failed to connect to coredump service: %m");
964
965 for (i = 0; i < n_iovec; i++) {
fec603eb
LP
966 struct msghdr mh = {
967 .msg_iov = (struct iovec*) iovec + i,
968 .msg_iovlen = 1,
969 };
970 struct iovec copy[2];
971
972 for (;;) {
973 if (sendmsg(fd, &mh, MSG_NOSIGNAL) >= 0)
974 break;
975
976 if (errno == EMSGSIZE && mh.msg_iov[0].iov_len > 0) {
977 /* This field didn't fit? That's a pity. Given that this is just metadata,
978 * let's truncate the field at half, and try again. We append three dots, in
979 * order to show that this is truncated. */
980
981 if (mh.msg_iov != copy) {
982 /* We don't want to modify the caller's iovec, hence let's create our
983 * own array, consisting of two new iovecs, where the first is a
984 * (truncated) copy of what we want to send, and the second one
985 * contains the trailing dots. */
986 copy[0] = iovec[i];
987 copy[1] = (struct iovec) {
988 .iov_base = (char[]) { '.', '.', '.' },
989 .iov_len = 3,
990 };
991
992 mh.msg_iov = copy;
993 mh.msg_iovlen = 2;
994 }
995
996 copy[0].iov_len /= 2; /* halve it, and try again */
997 continue;
998 }
3c171f0b 999
3c171f0b 1000 return log_error_errno(errno, "Failed to send coredump datagram: %m");
fec603eb 1001 }
1eef15b1
ZJS
1002 }
1003
3c171f0b
LP
1004 r = send_one_fd(fd, input_fd, 0);
1005 if (r < 0)
1006 return log_error_errno(r, "Failed to send coredump fd: %m");
1eef15b1 1007
3c171f0b
LP
1008 return 0;
1009}
1eef15b1 1010
78f043f7 1011static int process_special_crash(const char *context[], int input_fd) {
3c171f0b
LP
1012 _cleanup_close_ int coredump_fd = -1, coredump_node_fd = -1;
1013 _cleanup_free_ char *filename = NULL;
1014 uint64_t coredump_size;
1015 int r;
803a3464 1016
3c171f0b
LP
1017 assert(context);
1018 assert(input_fd >= 0);
803a3464 1019
78f043f7 1020 /* If we are pid1 or journald, we cut things short, don't write to the journal, but still create a coredump. */
34c10968 1021
3c171f0b
LP
1022 if (arg_storage != COREDUMP_STORAGE_NONE)
1023 arg_storage = COREDUMP_STORAGE_EXTERNAL;
34c10968 1024
3c171f0b
LP
1025 r = save_external_coredump(context, input_fd, &filename, &coredump_node_fd, &coredump_fd, &coredump_size);
1026 if (r < 0)
1027 return r;
34c10968 1028
3c171f0b
LP
1029 r = maybe_remove_external_coredump(filename, coredump_size);
1030 if (r < 0)
1031 return r;
34c10968 1032
78f043f7
LP
1033 log_notice("Detected coredump of the journal daemon or PID 1, diverted to %s.", filename);
1034
3c171f0b
LP
1035 return 0;
1036}
1037
9aa82023
ZJS
/* Concatenates field and value into a newly allocated string and stores it in the next free iovec slot,
 * advancing *n_iovec. Returns the new string, or NULL if the concatenation failed (in which case neither the
 * array nor the counter is touched). */
static char* set_iovec_field(struct iovec iovec[27], size_t *n_iovec, const char *field, const char *value) {
        char *joined = strappend(field, value);

        if (!joined)
                return NULL;

        IOVEC_SET_STRING(iovec[(*n_iovec)++], joined);
        return joined;
}
3c171f0b 1046
9aa82023
ZJS
/* Same as set_iovec_field(), but takes ownership of value: it is freed in all cases, whether or not the field
 * could be added. Returns what set_iovec_field() returned. */
static char* set_iovec_field_free(struct iovec iovec[27], size_t *n_iovec, const char *field, char *value) {
        char *entry = set_iovec_field(iovec, n_iovec, field, value);

        free(value);
        return entry;
}
1054
86562420 1055static int gather_pid_metadata_and_process_special_crash(
9aa82023
ZJS
1056 const char *context[_CONTEXT_MAX],
1057 char **comm_fallback,
988e89ee 1058 char **comm_ret,
5b45a160 1059 struct iovec *iovec, size_t *n_iovec) {
d14bcb4e
LP
1060
1061 /* We need 26 empty slots in iovec!
1062 *
1063 * Note that if we fail on oom later on, we do not roll-back changes to the iovec structure. (It remains valid,
1064 * with the first n_iovec fields initialized.) */
3c171f0b
LP
1065
1066 _cleanup_free_ char *exe = NULL, *comm = NULL;
3c171f0b 1067 uid_t owner_uid;
3c171f0b
LP
1068 pid_t pid;
1069 char *t;
9aa82023 1070 const char *p;
d14bcb4e 1071 int r, signo;
3c171f0b 1072
9aa82023 1073 r = parse_pid(context[CONTEXT_PID], &pid);
3c171f0b 1074 if (r < 0)
988e89ee 1075 return log_error_errno(r, "Failed to parse PID \"%s\": %m", context[CONTEXT_PID]);
3c171f0b
LP
1076
1077 r = get_process_comm(pid, &comm);
1078 if (r < 0) {
1079 log_warning_errno(r, "Failed to get COMM, falling back to the command line: %m");
9aa82023 1080 comm = strv_join(comm_fallback, " ");
3c171f0b
LP
1081 if (!comm)
1082 return log_oom();
1083 }
1084
1085 r = get_process_exe(pid, &exe);
1086 if (r < 0)
1087 log_warning_errno(r, "Failed to get EXE, ignoring: %m");
1088
3c171f0b
LP
1089 if (cg_pid_get_unit(pid, &t) >= 0) {
1090
c8091d92
LP
1091 /* If this is PID 1 disable coredump collection, we'll unlikely be able to process it later on. */
1092 if (streq(t, SPECIAL_INIT_SCOPE)) {
1093 log_notice("Due to PID 1 having crashed coredump collection will now be turned off.");
1094 (void) write_string_file("/proc/sys/kernel/core_pattern", "|/bin/false", 0);
1095 }
1096
78f043f7
LP
1097 /* Let's avoid dead-locks when processing journald and init crashes, as socket activation and logging
1098 * are unlikely to work then. */
1099 if (STR_IN_SET(t, SPECIAL_JOURNALD_SERVICE, SPECIAL_INIT_SCOPE)) {
3c171f0b 1100 free(t);
86562420
LP
1101 r = process_special_crash(context, STDIN_FILENO);
1102 if (r < 0)
1103 return r;
1104
1105 return 1; /* > 0 means: we have already processed it, because it's a special crash */
803a3464
LP
1106 }
1107
9aa82023 1108 set_iovec_field_free(iovec, n_iovec, "COREDUMP_UNIT=", t);
8c8549db 1109 }
803a3464 1110
3c171f0b 1111 /* OK, now we know it's not the journal, hence we can make use of it now. */
803a3464
LP
1112 log_set_target(LOG_TARGET_JOURNAL_OR_KMSG);
1113 log_open();
1114
9aa82023
ZJS
1115 if (cg_pid_get_user_unit(pid, &t) >= 0)
1116 set_iovec_field_free(iovec, n_iovec, "COREDUMP_USER_UNIT=", t);
3c171f0b 1117
9aa82023
ZJS
1118 /* The next few are mandatory */
1119 if (!set_iovec_field(iovec, n_iovec, "COREDUMP_PID=", context[CONTEXT_PID]))
1120 return log_oom();
3c171f0b 1121
9aa82023
ZJS
1122 if (!set_iovec_field(iovec, n_iovec, "COREDUMP_UID=", context[CONTEXT_UID]))
1123 return log_oom();
f5e04665 1124
9aa82023
ZJS
1125 if (!set_iovec_field(iovec, n_iovec, "COREDUMP_GID=", context[CONTEXT_GID]))
1126 return log_oom();
f5e04665 1127
9aa82023
ZJS
1128 if (!set_iovec_field(iovec, n_iovec, "COREDUMP_SIGNAL=", context[CONTEXT_SIGNAL]))
1129 return log_oom();
f5e04665 1130
9aa82023
ZJS
1131 if (!set_iovec_field(iovec, n_iovec, "COREDUMP_RLIMIT=", context[CONTEXT_RLIMIT]))
1132 return log_oom();
f5e04665 1133
9aa82023
ZJS
1134 if (!set_iovec_field(iovec, n_iovec, "COREDUMP_COMM=", comm))
1135 return log_oom();
bdfd7b2c 1136
9aa82023
ZJS
1137 if (exe &&
1138 !set_iovec_field(iovec, n_iovec, "COREDUMP_EXE=", exe))
1139 return log_oom();
f5e04665 1140
9aa82023
ZJS
1141 if (sd_pid_get_session(pid, &t) >= 0)
1142 set_iovec_field_free(iovec, n_iovec, "COREDUMP_SESSION=", t);
f5e04665 1143
a035f819 1144 if (sd_pid_get_owner_uid(pid, &owner_uid) >= 0) {
9aa82023 1145 r = asprintf(&t, "COREDUMP_OWNER_UID=" UID_FMT, owner_uid);
7de80bfe 1146 if (r > 0)
9aa82023 1147 IOVEC_SET_STRING(iovec[(*n_iovec)++], t);
f5e04665
LP
1148 }
1149
9aa82023
ZJS
1150 if (sd_pid_get_slice(pid, &t) >= 0)
1151 set_iovec_field_free(iovec, n_iovec, "COREDUMP_SLICE=", t);
f5e04665 1152
9aa82023
ZJS
1153 if (get_process_cmdline(pid, 0, false, &t) >= 0)
1154 set_iovec_field_free(iovec, n_iovec, "COREDUMP_CMDLINE=", t);
a035f819 1155
9aa82023
ZJS
1156 if (cg_pid_get_path_shifted(pid, NULL, &t) >= 0)
1157 set_iovec_field_free(iovec, n_iovec, "COREDUMP_CGROUP=", t);
a035f819 1158
9aa82023
ZJS
1159 if (compose_open_fds(pid, &t) >= 0)
1160 set_iovec_field_free(iovec, n_iovec, "COREDUMP_OPEN_FDS=", t);
3f132692
JF
1161
1162 p = procfs_file_alloca(pid, "status");
9aa82023
ZJS
1163 if (read_full_file(p, &t, NULL) >= 0)
1164 set_iovec_field_free(iovec, n_iovec, "COREDUMP_PROC_STATUS=", t);
3f132692
JF
1165
1166 p = procfs_file_alloca(pid, "maps");
9aa82023
ZJS
1167 if (read_full_file(p, &t, NULL) >= 0)
1168 set_iovec_field_free(iovec, n_iovec, "COREDUMP_PROC_MAPS=", t);
3f132692
JF
1169
1170 p = procfs_file_alloca(pid, "limits");
9aa82023
ZJS
1171 if (read_full_file(p, &t, NULL) >= 0)
1172 set_iovec_field_free(iovec, n_iovec, "COREDUMP_PROC_LIMITS=", t);
3f132692
JF
1173
1174 p = procfs_file_alloca(pid, "cgroup");
9aa82023
ZJS
1175 if (read_full_file(p, &t, NULL) >=0)
1176 set_iovec_field_free(iovec, n_iovec, "COREDUMP_PROC_CGROUP=", t);
3f132692 1177
d7032b1f 1178 p = procfs_file_alloca(pid, "mountinfo");
9aa82023
ZJS
1179 if (read_full_file(p, &t, NULL) >=0)
1180 set_iovec_field_free(iovec, n_iovec, "COREDUMP_PROC_MOUNTINFO=", t);
d7032b1f 1181
9aa82023
ZJS
1182 if (get_process_cwd(pid, &t) >= 0)
1183 set_iovec_field_free(iovec, n_iovec, "COREDUMP_CWD=", t);
3f132692
JF
1184
1185 if (get_process_root(pid, &t) >= 0) {
9aa82023
ZJS
1186 bool proc_self_root_is_slash;
1187
1188 proc_self_root_is_slash = strcmp(t, "/") == 0;
3f132692 1189
9aa82023 1190 set_iovec_field_free(iovec, n_iovec, "COREDUMP_ROOT=", t);
7ed03ce6
JF
1191
1192 /* If the process' root is "/", then there is a chance it has
1193 * mounted own root and hence being containerized. */
9aa82023
ZJS
1194 if (proc_self_root_is_slash && get_process_container_parent_cmdline(pid, &t) > 0)
1195 set_iovec_field_free(iovec, n_iovec, "COREDUMP_CONTAINER_CMDLINE=", t);
3f132692
JF
1196 }
1197
9aa82023
ZJS
1198 if (get_process_environ(pid, &t) >= 0)
1199 set_iovec_field_free(iovec, n_iovec, "COREDUMP_ENVIRON=", t);
1200
1201 t = strjoin("COREDUMP_TIMESTAMP=", context[CONTEXT_TIMESTAMP], "000000", NULL);
1202 if (t)
1203 IOVEC_SET_STRING(iovec[(*n_iovec)++], t);
1204
d14bcb4e
LP
1205 if (safe_atoi(context[CONTEXT_SIGNAL], &signo) >= 0 && SIGNAL_VALID(signo))
1206 set_iovec_field(iovec, n_iovec, "COREDUMP_SIGNAL_NAME=SIG", signal_to_string(signo));
1207
988e89ee
ZJS
1208 if (comm_ret) {
1209 *comm_ret = comm;
1210 comm = NULL;
1211 }
1212
86562420 1213 return 0; /* == 0 means: we successfully acquired all metadata */
9aa82023 1214}
3f132692 1215
9aa82023
ZJS
1216static int process_kernel(int argc, char* argv[]) {
1217
1218 const char *context[_CONTEXT_MAX];
d14bcb4e 1219 struct iovec iovec[28];
988e89ee 1220 size_t i, n_iovec, n_to_free = 0;
9aa82023
ZJS
1221 int r;
1222
988e89ee
ZJS
1223 log_debug("Processing coredump received from the kernel...");
1224
9aa82023 1225 if (argc < CONTEXT_COMM + 1) {
988e89ee 1226 log_error("Not enough arguments passed by the kernel (%i, expected %i).", argc - 1, CONTEXT_COMM + 1 - 1);
9aa82023 1227 return -EINVAL;
3f132692
JF
1228 }
1229
9aa82023
ZJS
1230 context[CONTEXT_PID] = argv[CONTEXT_PID + 1];
1231 context[CONTEXT_UID] = argv[CONTEXT_UID + 1];
1232 context[CONTEXT_GID] = argv[CONTEXT_GID + 1];
1233 context[CONTEXT_SIGNAL] = argv[CONTEXT_SIGNAL + 1];
1234 context[CONTEXT_TIMESTAMP] = argv[CONTEXT_TIMESTAMP + 1];
1235 context[CONTEXT_RLIMIT] = argv[CONTEXT_RLIMIT + 1];
1236
86562420 1237 r = gather_pid_metadata_and_process_special_crash(context, argv + CONTEXT_COMM + 1, NULL, iovec, &n_to_free);
9aa82023
ZJS
1238 if (r < 0)
1239 goto finish;
86562420
LP
1240 if (r > 0) {
1241 /* This was a special crash, and has already been processed. */
1242 r = 0;
1243 goto finish;
1244 }
1245
988e89ee 1246 n_iovec = n_to_free;
f5e04665 1247
2b044526 1248 IOVEC_SET_STRING(iovec[n_iovec++], "MESSAGE_ID=" SD_MESSAGE_COREDUMP_STR);
4850d39a
LP
1249
1250 assert_cc(2 == LOG_CRIT);
3c171f0b 1251 IOVEC_SET_STRING(iovec[n_iovec++], "PRIORITY=2");
0dc5d23c 1252
3c171f0b 1253 assert(n_iovec <= ELEMENTSOF(iovec));
34c10968 1254
9aa82023
ZJS
1255 r = send_iovec(iovec, n_iovec, STDIN_FILENO);
1256
1257 finish:
1258 for (i = 0; i < n_to_free; i++)
1259 free(iovec[i].iov_base);
1260
1261 return r;
3c171f0b 1262}
34c10968 1263
988e89ee
ZJS
1264static int process_backtrace(int argc, char *argv[]) {
1265 const char *context[_CONTEXT_MAX];
5b45a160
ZJS
1266 _cleanup_free_ char *comm = NULL, *message = NULL;
1267 _cleanup_free_ struct iovec *iovec = NULL;
1268 size_t n_iovec, n_allocated, n_to_free = 0, i;
988e89ee 1269 int r;
5b45a160
ZJS
1270 JournalImporter importer = {
1271 .fd = STDIN_FILENO,
1272 };
988e89ee
ZJS
1273
1274 log_debug("Processing backtrace on stdin...");
1275
1276 if (argc < CONTEXT_COMM + 1) {
1277 log_error("Not enough arguments passed (%i, expected %i).", argc - 1, CONTEXT_COMM + 1 - 1);
1278 return -EINVAL;
1279 }
1280
1281 context[CONTEXT_PID] = argv[CONTEXT_PID + 2];
1282 context[CONTEXT_UID] = argv[CONTEXT_UID + 2];
1283 context[CONTEXT_GID] = argv[CONTEXT_GID + 2];
1284 context[CONTEXT_SIGNAL] = argv[CONTEXT_SIGNAL + 2];
1285 context[CONTEXT_TIMESTAMP] = argv[CONTEXT_TIMESTAMP + 2];
1286 context[CONTEXT_RLIMIT] = argv[CONTEXT_RLIMIT + 2];
1287
d14bcb4e 1288 n_allocated = 33; /* 25 metadata, 2 static, +unknown input, rounded up */
5b45a160
ZJS
1289 iovec = new(struct iovec, n_allocated);
1290 if (!iovec)
1291 return log_oom();
1292
86562420 1293 r = gather_pid_metadata_and_process_special_crash(context, argv + CONTEXT_COMM + 2, &comm, iovec, &n_to_free);
988e89ee
ZJS
1294 if (r < 0)
1295 goto finish;
86562420
LP
1296 if (r > 0) {
1297 /* This was a special crash, and has already been processed. */
1298 r = 0;
1299 goto finish;
1300 }
5b45a160 1301 n_iovec = n_to_free;
988e89ee 1302
86562420 1303 for (;;) {
5b45a160
ZJS
1304 r = journal_importer_process_data(&importer);
1305 if (r < 0) {
1306 log_error_errno(r, "Failed to parse journal entry on stdin: %m");
1307 goto finish;
1308 }
1309 if (r == 1)
1310 break;
988e89ee 1311 }
988e89ee 1312
5b45a160
ZJS
1313 if (!GREEDY_REALLOC(iovec, n_allocated, n_iovec + importer.iovw.count + 2))
1314 return log_oom();
1315
1316 if (journal_importer_eof(&importer)) {
1317 log_warning("Did not receive a full journal entry on stdin, ignoring message sent by reporter");
988e89ee 1318
5b45a160
ZJS
1319 message = strjoin("MESSAGE=Process ", context[CONTEXT_PID], " (", comm, ")"
1320 " of user ", context[CONTEXT_UID],
1321 " failed with ", context[CONTEXT_SIGNAL]);
1322 if (!message) {
1323 r = log_oom();
1324 goto finish;
1325 }
1326 IOVEC_SET_STRING(iovec[n_iovec++], message);
1327 } else {
1328 for (i = 0; i < importer.iovw.count; i++)
1329 iovec[n_iovec++] = importer.iovw.iovec[i];
1330 }
988e89ee 1331
2b044526 1332 IOVEC_SET_STRING(iovec[n_iovec++], "MESSAGE_ID=" SD_MESSAGE_BACKTRACE_STR);
988e89ee
ZJS
1333 assert_cc(2 == LOG_CRIT);
1334 IOVEC_SET_STRING(iovec[n_iovec++], "PRIORITY=2");
1335
5b45a160 1336 assert(n_iovec <= n_allocated);
988e89ee
ZJS
1337
1338 r = sd_journal_sendv(iovec, n_iovec);
1339 if (r < 0)
1340 log_error_errno(r, "Failed to log backtrace: %m");
1341
1342 finish:
1343 for (i = 0; i < n_to_free; i++)
1344 free(iovec[i].iov_base);
1345
1346 return r;
1347}
1348
3c171f0b
LP
1349int main(int argc, char *argv[]) {
1350 int r;
fee80f69 1351
9aa82023
ZJS
1352 /* First, log to a safe place, since we don't know what crashed and it might
1353 * be journald which we'd rather not log to then. */
8d4e028f 1354
3c171f0b
LP
1355 log_set_target(LOG_TARGET_KMSG);
1356 log_open();
8d4e028f 1357
3c171f0b
LP
1358 /* Make sure we never enter a loop */
1359 (void) prctl(PR_SET_DUMPABLE, 0);
8d4e028f 1360
3c171f0b
LP
1361 /* Ignore all parse errors */
1362 (void) parse_config();
fee80f69 1363
3c171f0b
LP
1364 log_debug("Selected storage '%s'.", coredump_storage_to_string(arg_storage));
1365 log_debug("Selected compression %s.", yes_no(arg_compress));
fee80f69 1366
3c171f0b
LP
1367 r = sd_listen_fds(false);
1368 if (r < 0) {
1369 log_error_errno(r, "Failed to determine number of file descriptor: %m");
1370 goto finish;
fee80f69
LP
1371 }
1372
9aa82023
ZJS
1373 /* If we got an fd passed, we are running in coredumpd mode. Otherwise we
1374 * are invoked from the kernel as coredump handler. */
988e89ee
ZJS
1375 if (r == 0) {
1376 if (streq_ptr(argv[1], "--backtrace"))
1377 r = process_backtrace(argc, argv);
1378 else
1379 r = process_kernel(argc, argv);
1380 } else if (r == 1)
3c171f0b
LP
1381 r = process_socket(SD_LISTEN_FDS_START);
1382 else {
1383 log_error("Received unexpected number of file descriptors.");
1384 r = -EINVAL;
1385 }
f5e04665
LP
1386
1387finish:
f5e04665
LP
1388 return r < 0 ? EXIT_FAILURE : EXIT_SUCCESS;
1389}