]> git.ipfire.org Git - thirdparty/systemd.git/blame - src/libsystemd/sd-netlink/sd-netlink.c
sd-netlink: introduce netlink_queue_received_message() and friend
[thirdparty/systemd.git] / src / libsystemd / sd-netlink / sd-netlink.c
CommitLineData
db9ecf05 1/* SPDX-License-Identifier: LGPL-2.1-or-later */
65f568bb 2
65f568bb 3#include <poll.h>
65f568bb 4
1c4baffc 5#include "sd-netlink.h"
07630cea 6
b5efdb8a 7#include "alloc-util.h"
3ffd4af2 8#include "fd-util.h"
07630cea 9#include "hashmap.h"
0f2d351f 10#include "io-util.h"
07630cea 11#include "macro.h"
56fdc16d 12#include "netlink-genl.h"
1c4baffc 13#include "netlink-internal.h"
ee38400b 14#include "netlink-slot.h"
84e10015 15#include "netlink-util.h"
dccca82b 16#include "process-util.h"
2583fbea 17#include "socket-util.h"
8190a388 18#include "string-util.h"
65f568bb 19
b522c4b9
LP
20/* Some really high limit, to catch programming errors */
21#define REPLY_CALLBACKS_MAX UINT16_MAX
22
409856d3
YW
23static int netlink_new(sd_netlink **ret) {
24 _cleanup_(sd_netlink_unrefp) sd_netlink *nl = NULL;
65f568bb
TG
25
26 assert_return(ret, -EINVAL);
27
409856d3
YW
28 nl = new(sd_netlink, 1);
29 if (!nl)
65f568bb
TG
30 return -ENOMEM;
31
409856d3 32 *nl = (sd_netlink) {
f23ab4dc 33 .n_ref = 1,
2fea6090
YW
34 .fd = -1,
35 .sockaddr.nl.nl_family = AF_NETLINK,
36 .original_pid = getpid_cached(),
37 .protocol = -1,
adf412b9 38
ac3bc1b8
LP
39 /* Kernel change notification messages have sequence number 0. We want to avoid that with our
40 * own serials, in order not to get confused when matching up kernel replies to our earlier
41 * requests.
42 *
43 * Moreover, when using netlink socket activation (i.e. where PID 1 binds an AF_NETLINK
44 * socket for us and passes it to us across execve()) and we get restarted multiple times
45 * while the socket sticks around we might get confused by replies from earlier runs coming
46 * in late — which is pretty likely if we'd start our sequence numbers always from 1. Hence,
47 * let's start with a value based on the system clock. This should make collisions much less
48 * likely (though still theoretically possible). We use a 32 bit µs counter starting at boot
49 * for this (and explicitly exclude the zero, see above). This counter will wrap around after
50 * a bit more than 1h, but that's hopefully OK as the kernel shouldn't take that long to
51 * reply to our requests.
52 *
53 * We only pick the initial start value this way. For each message we simply increase the
54 * sequence number by 1. This means we could enqueue 1 netlink message per µs without risking
55 * collisions, which should be OK.
56 *
57 * Note this means the serials will be in the range 1…UINT32_MAX here.
58 *
59 * (In an ideal world we'd attach the current serial counter to the netlink socket itself
60 * somehow, to avoid all this, but I couldn't come up with a nice way to do this) */
61 .serial = (uint32_t) (now(CLOCK_MONOTONIC) % UINT32_MAX) + 1,
2fea6090 62 };
8cec01b9 63
409856d3 64 *ret = TAKE_PTR(nl);
65f568bb
TG
65 return 0;
66}
67
dd35a61c 68int sd_netlink_open_fd(sd_netlink **ret, int fd) {
409856d3 69 _cleanup_(sd_netlink_unrefp) sd_netlink *nl = NULL;
13ec9f10 70 int r, protocol;
65f568bb 71
9d0db178 72 assert_return(ret, -EINVAL);
8ac43fee 73 assert_return(fd >= 0, -EBADF);
9d0db178 74
409856d3 75 r = netlink_new(&nl);
65f568bb
TG
76 if (r < 0)
77 return r;
78
13ec9f10 79 r = getsockopt_int(fd, SOL_SOCKET, SO_PROTOCOL, &protocol);
05d0c2e3
JT
80 if (r < 0)
81 return r;
82
409856d3
YW
83 nl->fd = fd;
84 nl->protocol = protocol;
65f568bb 85
d7418b3b 86 r = setsockopt_int(fd, SOL_NETLINK, NETLINK_EXT_ACK, true);
e4a1e68d
YW
87 if (r < 0)
88 log_debug_errno(r, "sd-netlink: Failed to enable NETLINK_EXT_ACK option, ignoring: %m");
89
d7418b3b
YW
90 r = setsockopt_int(fd, SOL_NETLINK, NETLINK_GET_STRICT_CHK, true);
91 if (r < 0)
92 log_debug_errno(r, "sd-netlink: Failed to enable NETLINK_GET_STRICT_CHK option, ignoring: %m");
93
409856d3 94 r = socket_bind(nl);
5c60db87 95 if (r < 0) {
409856d3
YW
96 nl->fd = -1; /* on failure, the caller remains owner of the fd, hence don't close it here */
97 nl->protocol = -1;
b95cc756 98 return r;
5c60db87 99 }
6d0b55c2 100
409856d3 101 *ret = TAKE_PTR(nl);
65f568bb
TG
102
103 return 0;
104}
105
dd35a61c 106int sd_netlink_open(sd_netlink **ret) {
05d0c2e3
JT
107 return netlink_open_family(ret, NETLINK_ROUTE);
108}
109
dd35a61c 110int sd_netlink_increase_rxbuf(sd_netlink *nl, size_t size) {
409856d3
YW
111 assert_return(nl, -EINVAL);
112 assert_return(!netlink_pid_changed(nl), -ECHILD);
75f8a779 113
28e7e934 114 return fd_increase_rxbuf(nl->fd, size);
be660c37
AR
115}
116
409856d3 117static sd_netlink *netlink_free(sd_netlink *nl) {
ee38400b 118 sd_netlink_slot *s;
1c71f7f3 119 unsigned i;
8c578303 120
409856d3 121 assert(nl);
4555ec72 122
409856d3
YW
123 for (i = 0; i < nl->rqueue_size; i++)
124 sd_netlink_message_unref(nl->rqueue[i]);
125 free(nl->rqueue);
8cec01b9 126
409856d3
YW
127 for (i = 0; i < nl->rqueue_partial_size; i++)
128 sd_netlink_message_unref(nl->rqueue_partial[i]);
129 free(nl->rqueue_partial);
4e996881 130
409856d3 131 free(nl->rbuffer);
a88f77c4 132
409856d3 133 while ((s = nl->slots)) {
ee38400b
YW
134 assert(s->floating);
135 netlink_slot_disconnect(s, true);
545bab1f 136 }
409856d3
YW
137 hashmap_free(nl->reply_callbacks);
138 prioq_free(nl->reply_callbacks_prioq);
22fdeadc 139
409856d3
YW
140 sd_event_source_unref(nl->io_event_source);
141 sd_event_source_unref(nl->time_event_source);
142 sd_event_unref(nl->event);
22fdeadc 143
409856d3 144 hashmap_free(nl->broadcast_group_refs);
9c5a882b 145
56fdc16d 146 genl_clear_family(nl);
4e8f0ef9 147
409856d3
YW
148 safe_close(nl->fd);
149 return mfree(nl);
65f568bb
TG
150}
151
f23ab4dc 152DEFINE_TRIVIAL_REF_UNREF_FUNC(sd_netlink, sd_netlink, netlink_free);
1c71f7f3 153
dd35a61c 154int sd_netlink_send(
409856d3
YW
155 sd_netlink *nl,
156 sd_netlink_message *message,
157 uint32_t *serial) {
158
4555ec72 159 int r;
65f568bb
TG
160
161 assert_return(nl, -EINVAL);
409856d3 162 assert_return(!netlink_pid_changed(nl), -ECHILD);
65f568bb 163 assert_return(message, -EINVAL);
3dd215e0 164 assert_return(!message->sealed, -EPERM);
65f568bb 165
409856d3 166 netlink_seal_message(nl, message);
65f568bb 167
bbe181b4
TG
168 r = socket_write_message(nl, message);
169 if (r < 0)
170 return r;
65f568bb 171
4555ec72 172 if (serial)
409856d3 173 *serial = message_get_serial(message);
65f568bb 174
4555ec72
TG
175 return 1;
176}
65f568bb 177
409856d3 178static int dispatch_rqueue(sd_netlink *nl, sd_netlink_message **message) {
4555ec72 179 int r;
65f568bb 180
409856d3 181 assert(nl);
4555ec72
TG
182 assert(message);
183
409856d3 184 if (nl->rqueue_size <= 0) {
1b89cf56 185 /* Try to read a new message */
409856d3 186 r = socket_read_message(nl);
71994cff 187 if (r == -ENOBUFS) { /* FIXME: ignore buffer overruns for now */
409856d3 188 log_debug_errno(r, "sd-netlink: Got ENOBUFS from netlink socket, ignoring.");
71994cff
LP
189 return 1;
190 }
1b89cf56
TG
191 if (r <= 0)
192 return r;
4555ec72
TG
193 }
194
1b89cf56 195 /* Dispatch a queued message */
409856d3
YW
196 *message = nl->rqueue[0];
197 nl->rqueue_size--;
198 memmove(nl->rqueue, nl->rqueue + 1, sizeof(sd_netlink_message*) * nl->rqueue_size);
4555ec72
TG
199
200 return 1;
201}
202
409856d3 203static int process_timeout(sd_netlink *nl) {
4afd3348 204 _cleanup_(sd_netlink_message_unrefp) sd_netlink_message *m = NULL;
e16bcf98 205 struct reply_callback *c;
ee38400b 206 sd_netlink_slot *slot;
e16bcf98
TG
207 usec_t n;
208 int r;
209
409856d3 210 assert(nl);
e16bcf98 211
409856d3 212 c = prioq_peek(nl->reply_callbacks_prioq);
e16bcf98
TG
213 if (!c)
214 return 0;
215
216 n = now(CLOCK_MONOTONIC);
217 if (c->timeout > n)
218 return 0;
219
409856d3 220 r = message_new_synthetic_error(nl, -ETIMEDOUT, c->serial, &m);
e16bcf98
TG
221 if (r < 0)
222 return r;
223
409856d3 224 assert_se(prioq_pop(nl->reply_callbacks_prioq) == c);
ee38400b 225 c->timeout = 0;
409856d3 226 hashmap_remove(nl->reply_callbacks, UINT32_TO_PTR(c->serial));
e16bcf98 227
ee38400b
YW
228 slot = container_of(c, sd_netlink_slot, reply_callback);
229
409856d3 230 r = c->callback(nl, m, slot->userdata);
233ba5c3 231 if (r < 0)
8190a388
YW
232 log_debug_errno(r, "sd-netlink: timedout callback %s%s%sfailed: %m",
233 slot->description ? "'" : "",
234 strempty(slot->description),
235 slot->description ? "' " : "");
233ba5c3 236
ee38400b
YW
237 if (slot->floating)
238 netlink_slot_disconnect(slot, true);
e16bcf98 239
233ba5c3 240 return 1;
e16bcf98
TG
241}
242
409856d3 243static int process_reply(sd_netlink *nl, sd_netlink_message *m) {
ee38400b
YW
244 struct reply_callback *c;
245 sd_netlink_slot *slot;
b522c4b9 246 uint32_t serial;
ea342a99 247 uint16_t type;
e16bcf98
TG
248 int r;
249
409856d3 250 assert(nl);
e16bcf98
TG
251 assert(m);
252
409856d3
YW
253 serial = message_get_serial(m);
254 c = hashmap_remove(nl->reply_callbacks, UINT32_TO_PTR(serial));
e16bcf98
TG
255 if (!c)
256 return 0;
257
ee38400b 258 if (c->timeout != 0) {
409856d3 259 prioq_remove(nl->reply_callbacks_prioq, c, &c->prioq_idx);
ee38400b
YW
260 c->timeout = 0;
261 }
e16bcf98 262
1c4baffc 263 r = sd_netlink_message_get_type(m, &type);
ea342a99 264 if (r < 0)
ee38400b 265 return r;
ea342a99
AR
266
267 if (type == NLMSG_DONE)
268 m = NULL;
269
ee38400b
YW
270 slot = container_of(c, sd_netlink_slot, reply_callback);
271
409856d3 272 r = c->callback(nl, m, slot->userdata);
233ba5c3 273 if (r < 0)
8190a388
YW
274 log_debug_errno(r, "sd-netlink: reply callback %s%s%sfailed: %m",
275 slot->description ? "'" : "",
276 strempty(slot->description),
277 slot->description ? "' " : "");
233ba5c3 278
ee38400b
YW
279 if (slot->floating)
280 netlink_slot_disconnect(slot, true);
545bab1f 281
233ba5c3 282 return 1;
e16bcf98
TG
283}
284
409856d3 285static int process_match(sd_netlink *nl, sd_netlink_message *m) {
8cec01b9 286 uint16_t type;
e1578f60 287 uint8_t cmd;
8cec01b9
TG
288 int r;
289
409856d3 290 assert(nl);
8cec01b9
TG
291 assert(m);
292
1c4baffc 293 r = sd_netlink_message_get_type(m, &type);
8cec01b9
TG
294 if (r < 0)
295 return r;
296
e1578f60
YW
297 if (m->protocol == NETLINK_GENERIC) {
298 r = sd_genl_message_get_command(nl, m, &cmd);
299 if (r < 0)
300 return r;
301 } else
302 cmd = 0;
303
409856d3 304 LIST_FOREACH(match_callbacks, c, nl->match_callbacks) {
e1578f60 305 sd_netlink_slot *slot;
4d4d898a 306 bool found = false;
e1578f60
YW
307
308 if (c->type != type)
309 continue;
310 if (c->cmd != 0 && c->cmd != cmd)
baf78f1a
LP
311 continue;
312
4d4d898a
YW
313 for (size_t i = 0; i < c->n_groups; i++)
314 if (c->groups[i] == m->multicast_group) {
315 found = true;
316 break;
317 }
318
319 if (!found)
320 continue;
321
baf78f1a
LP
322 slot = container_of(c, sd_netlink_slot, match_callback);
323
409856d3 324 r = c->callback(nl, m, slot->userdata);
baf78f1a
LP
325 if (r < 0)
326 log_debug_errno(r, "sd-netlink: match callback %s%s%sfailed: %m",
327 slot->description ? "'" : "",
328 strempty(slot->description),
329 slot->description ? "' " : "");
330 if (r != 0)
331 break;
8cec01b9
TG
332 }
333
233ba5c3 334 return 1;
8cec01b9
TG
335}
336
409856d3 337static int process_running(sd_netlink *nl, sd_netlink_message **ret) {
4afd3348 338 _cleanup_(sd_netlink_message_unrefp) sd_netlink_message *m = NULL;
4555ec72
TG
339 int r;
340
409856d3 341 assert(nl);
9d0db178 342
409856d3 343 r = process_timeout(nl);
e16bcf98
TG
344 if (r != 0)
345 goto null_message;
346
409856d3 347 r = dispatch_rqueue(nl, &m);
4555ec72
TG
348 if (r < 0)
349 return r;
350 if (!m)
351 goto null_message;
352
52888279 353 if (sd_netlink_message_is_broadcast(m))
409856d3 354 r = process_match(nl, m);
52888279 355 else
409856d3 356 r = process_reply(nl, m);
52888279
YW
357 if (r != 0)
358 goto null_message;
8cec01b9 359
4555ec72 360 if (ret) {
1cc6c93a 361 *ret = TAKE_PTR(m);
4555ec72
TG
362
363 return 1;
364 }
365
366 return 1;
367
368null_message:
369 if (r >= 0 && ret)
370 *ret = NULL;
371
372 return r;
373}
e16bcf98 374
409856d3
YW
375int sd_netlink_process(sd_netlink *nl, sd_netlink_message **ret) {
376 NETLINK_DONT_DESTROY(nl);
4555ec72
TG
377 int r;
378
409856d3
YW
379 assert_return(nl, -EINVAL);
380 assert_return(!netlink_pid_changed(nl), -ECHILD);
381 assert_return(!nl->processing, -EBUSY);
4555ec72 382
409856d3
YW
383 nl->processing = true;
384 r = process_running(nl, ret);
385 nl->processing = false;
4555ec72
TG
386
387 return r;
388}
389
390static usec_t calc_elapse(uint64_t usec) {
f5fbe71d 391 if (usec == UINT64_MAX)
4555ec72
TG
392 return 0;
393
394 if (usec == 0)
409856d3 395 usec = NETLINK_DEFAULT_TIMEOUT_USEC;
4555ec72 396
496db330 397 return usec_add(now(CLOCK_MONOTONIC), usec);
4555ec72
TG
398}
399
409856d3 400static int netlink_poll(sd_netlink *nl, bool need_more, usec_t timeout_usec) {
3a43da28 401 usec_t m = USEC_INFINITY;
b4f2a5b1
TG
402 int r, e;
403
409856d3 404 assert(nl);
4555ec72 405
409856d3 406 e = sd_netlink_get_events(nl);
b4f2a5b1
TG
407 if (e < 0)
408 return e;
4555ec72 409
b4f2a5b1
TG
410 if (need_more)
411 /* Caller wants more data, and doesn't care about
412 * what's been read or any other timeouts. */
f55dc7c9 413 e |= POLLIN;
b4f2a5b1
TG
414 else {
415 usec_t until;
11537375 416
b4f2a5b1
TG
417 /* Caller wants to process if there is something to
418 * process, but doesn't care otherwise */
419
409856d3 420 r = sd_netlink_get_timeout(nl, &until);
b4f2a5b1
TG
421 if (r < 0)
422 return r;
65f568bb 423
11537375
YW
424 m = usec_sub_unsigned(until, now(CLOCK_MONOTONIC));
425 }
b4f2a5b1 426
409856d3 427 r = fd_wait_for_event(nl->fd, e, MIN(m, timeout_usec));
8d16f29b 428 if (r <= 0)
0f2d351f 429 return r;
4555ec72 430
dad28bff 431 return 1;
4555ec72
TG
432}
433
1c4baffc 434int sd_netlink_wait(sd_netlink *nl, uint64_t timeout_usec) {
69858785
LP
435 int r;
436
4555ec72 437 assert_return(nl, -EINVAL);
409856d3 438 assert_return(!netlink_pid_changed(nl), -ECHILD);
4555ec72
TG
439
440 if (nl->rqueue_size > 0)
441 return 0;
442
69858785
LP
443 r = netlink_poll(nl, false, timeout_usec);
444 if (r < 0 && ERRNO_IS_TRANSIENT(r)) /* Convert EINTR to "something happened" and give user a chance to run some code before calling back into us */
445 return 1;
446 return r;
4555ec72
TG
447}
448
e16bcf98
TG
449static int timeout_compare(const void *a, const void *b) {
450 const struct reply_callback *x = a, *y = b;
451
452 if (x->timeout != 0 && y->timeout == 0)
453 return -1;
454
455 if (x->timeout == 0 && y->timeout != 0)
456 return 1;
457
9c57a73b 458 return CMP(x->timeout, y->timeout);
e16bcf98
TG
459}
460
dd35a61c 461int sd_netlink_call_async(
545bab1f 462 sd_netlink *nl,
ee38400b 463 sd_netlink_slot **ret_slot,
545bab1f
YW
464 sd_netlink_message *m,
465 sd_netlink_message_handler_t callback,
466 sd_netlink_destroy_t destroy_callback,
467 void *userdata,
8190a388
YW
468 uint64_t usec,
469 const char *description) {
2b012288 470
ee38400b 471 _cleanup_free_ sd_netlink_slot *slot = NULL;
e16bcf98
TG
472 int r, k;
473
474 assert_return(nl, -EINVAL);
475 assert_return(m, -EINVAL);
476 assert_return(callback, -EINVAL);
409856d3 477 assert_return(!netlink_pid_changed(nl), -ECHILD);
e16bcf98 478
b522c4b9
LP
479 if (hashmap_size(nl->reply_callbacks) >= REPLY_CALLBACKS_MAX)
480 return -ERANGE;
481
482 r = hashmap_ensure_allocated(&nl->reply_callbacks, &trivial_hash_ops);
e16bcf98
TG
483 if (r < 0)
484 return r;
485
f5fbe71d 486 if (usec != UINT64_MAX) {
e16bcf98
TG
487 r = prioq_ensure_allocated(&nl->reply_callbacks_prioq, timeout_compare);
488 if (r < 0)
489 return r;
490 }
491
5cd67116 492 r = netlink_slot_allocate(nl, !ret_slot, NETLINK_REPLY_CALLBACK, sizeof(struct reply_callback), userdata, description, &slot);
8190a388
YW
493 if (r < 0)
494 return r;
e16bcf98 495
ee38400b
YW
496 slot->reply_callback.callback = callback;
497 slot->reply_callback.timeout = calc_elapse(usec);
e16bcf98 498
b522c4b9 499 k = sd_netlink_send(nl, m, &slot->reply_callback.serial);
545bab1f 500 if (k < 0)
e16bcf98 501 return k;
e16bcf98 502
b522c4b9 503 r = hashmap_put(nl->reply_callbacks, UINT32_TO_PTR(slot->reply_callback.serial), &slot->reply_callback);
545bab1f 504 if (r < 0)
e16bcf98 505 return r;
e16bcf98 506
ee38400b
YW
507 if (slot->reply_callback.timeout != 0) {
508 r = prioq_put(nl->reply_callbacks_prioq, &slot->reply_callback, &slot->reply_callback.prioq_idx);
f6bdbd9e 509 if (r < 0) {
b522c4b9 510 (void) hashmap_remove(nl->reply_callbacks, UINT32_TO_PTR(slot->reply_callback.serial));
e16bcf98
TG
511 return r;
512 }
513 }
514
40c864af 515 /* Set this at last. Otherwise, some failures in above would call destroy_callback but some would not. */
5cd67116
YW
516 slot->destroy_callback = destroy_callback;
517
ee38400b
YW
518 if (ret_slot)
519 *ret_slot = slot;
e16bcf98 520
ee38400b 521 TAKE_PTR(slot);
545bab1f 522
e16bcf98
TG
523 return k;
524}
525
dd35a61c 526int sd_netlink_read(
409856d3 527 sd_netlink *nl,
2b012288
YW
528 uint32_t serial,
529 uint64_t usec,
530 sd_netlink_message **ret) {
531
4555ec72 532 usec_t timeout;
4555ec72
TG
533 int r;
534
409856d3
YW
535 assert_return(nl, -EINVAL);
536 assert_return(!netlink_pid_changed(nl), -ECHILD);
4555ec72
TG
537
538 timeout = calc_elapse(usec);
539
65f568bb 540 for (;;) {
4555ec72 541 usec_t left;
65f568bb 542
409856d3 543 for (unsigned i = 0; i < nl->rqueue_size; i++) {
2b012288 544 _cleanup_(sd_netlink_message_unrefp) sd_netlink_message *incoming = NULL;
1b89cf56 545 uint32_t received_serial;
2b012288 546 uint16_t type;
65f568bb 547
409856d3 548 received_serial = message_get_serial(nl->rqueue[i]);
2b012288
YW
549 if (received_serial != serial)
550 continue;
65f568bb 551
409856d3 552 incoming = nl->rqueue[i];
ea342a99 553
2b012288 554 /* found a match, remove from rqueue and return it */
409856d3
YW
555 memmove(nl->rqueue + i, nl->rqueue + i + 1,
556 sizeof(sd_netlink_message*) * (nl->rqueue_size - i - 1));
557 nl->rqueue_size--;
ea342a99 558
2b012288
YW
559 r = sd_netlink_message_get_errno(incoming);
560 if (r < 0)
561 return r;
1b89cf56 562
2b012288
YW
563 r = sd_netlink_message_get_type(incoming, &type);
564 if (r < 0)
565 return r;
ea342a99 566
2b012288 567 if (type == NLMSG_DONE) {
766417bd
YW
568 if (ret)
569 *ret = NULL;
2b012288 570 return 0;
65f568bb 571 }
2b012288
YW
572
573 if (ret)
574 *ret = TAKE_PTR(incoming);
575 return 1;
65f568bb 576 }
1b89cf56 577
409856d3 578 r = socket_read_message(nl);
1b89cf56
TG
579 if (r < 0)
580 return r;
581 if (r > 0)
6ff8806e 582 /* received message, so try to process straight away */
4555ec72 583 continue;
65f568bb 584
4555ec72
TG
585 if (timeout > 0) {
586 usec_t n;
587
588 n = now(CLOCK_MONOTONIC);
589 if (n >= timeout)
590 return -ETIMEDOUT;
591
11537375 592 left = usec_sub_unsigned(timeout, n);
4555ec72 593 } else
11537375 594 left = USEC_INFINITY;
4555ec72 595
409856d3 596 r = netlink_poll(nl, true, left);
4555ec72
TG
597 if (r < 0)
598 return r;
2b012288 599 if (r == 0)
b551ddd3 600 return -ETIMEDOUT;
b4f2a5b1
TG
601 }
602}
603
dd35a61c 604int sd_netlink_call(
409856d3 605 sd_netlink *nl,
4df42cd9
FW
606 sd_netlink_message *message,
607 uint64_t usec,
608 sd_netlink_message **ret) {
2b012288 609
4df42cd9
FW
610 uint32_t serial;
611 int r;
612
409856d3
YW
613 assert_return(nl, -EINVAL);
614 assert_return(!netlink_pid_changed(nl), -ECHILD);
4df42cd9
FW
615 assert_return(message, -EINVAL);
616
409856d3 617 r = sd_netlink_send(nl, message, &serial);
4df42cd9
FW
618 if (r < 0)
619 return r;
620
409856d3 621 return sd_netlink_read(nl, serial, usec, ret);
4df42cd9
FW
622}
623
dd35a61c 624int sd_netlink_get_events(sd_netlink *nl) {
409856d3
YW
625 assert_return(nl, -EINVAL);
626 assert_return(!netlink_pid_changed(nl), -ECHILD);
b4f2a5b1 627
409856d3 628 return nl->rqueue_size == 0 ? POLLIN : 0;
b4f2a5b1
TG
629}
630
dd35a61c 631int sd_netlink_get_timeout(sd_netlink *nl, uint64_t *timeout_usec) {
b4f2a5b1
TG
632 struct reply_callback *c;
633
409856d3 634 assert_return(nl, -EINVAL);
b4f2a5b1 635 assert_return(timeout_usec, -EINVAL);
409856d3 636 assert_return(!netlink_pid_changed(nl), -ECHILD);
b4f2a5b1 637
409856d3 638 if (nl->rqueue_size > 0) {
b4f2a5b1
TG
639 *timeout_usec = 0;
640 return 1;
641 }
642
409856d3 643 c = prioq_peek(nl->reply_callbacks_prioq);
b4f2a5b1 644 if (!c) {
f5fbe71d 645 *timeout_usec = UINT64_MAX;
b4f2a5b1
TG
646 return 0;
647 }
648
649 *timeout_usec = c->timeout;
650
651 return 1;
652}
653
654static int io_callback(sd_event_source *s, int fd, uint32_t revents, void *userdata) {
99534007 655 sd_netlink *nl = ASSERT_PTR(userdata);
b4f2a5b1
TG
656 int r;
657
409856d3 658 r = sd_netlink_process(nl, NULL);
b4f2a5b1
TG
659 if (r < 0)
660 return r;
661
662 return 1;
663}
664
665static int time_callback(sd_event_source *s, uint64_t usec, void *userdata) {
99534007 666 sd_netlink *nl = ASSERT_PTR(userdata);
b4f2a5b1
TG
667 int r;
668
409856d3 669 r = sd_netlink_process(nl, NULL);
b4f2a5b1
TG
670 if (r < 0)
671 return r;
672
673 return 1;
674}
675
676static int prepare_callback(sd_event_source *s, void *userdata) {
99534007 677 sd_netlink *nl = ASSERT_PTR(userdata);
40c864af 678 int r, enabled;
b4f2a5b1
TG
679 usec_t until;
680
681 assert(s);
b4f2a5b1 682
40c864af 683 r = sd_netlink_get_events(nl);
b4f2a5b1
TG
684 if (r < 0)
685 return r;
686
40c864af 687 r = sd_event_source_set_io_events(nl->io_event_source, r);
b4f2a5b1
TG
688 if (r < 0)
689 return r;
b4f2a5b1 690
40c864af
ZJS
691 enabled = sd_netlink_get_timeout(nl, &until);
692 if (enabled < 0)
693 return enabled;
694 if (enabled > 0) {
695 r = sd_event_source_set_time(nl->time_event_source, until);
696 if (r < 0)
697 return r;
b4f2a5b1
TG
698 }
699
93c0a5ec
ZJS
700 r = sd_event_source_set_enabled(nl->time_event_source,
701 enabled > 0 ? SD_EVENT_ONESHOT : SD_EVENT_OFF);
b4f2a5b1
TG
702 if (r < 0)
703 return r;
704
705 return 1;
706}
707
dd35a61c 708int sd_netlink_attach_event(sd_netlink *nl, sd_event *event, int64_t priority) {
b4f2a5b1
TG
709 int r;
710
409856d3
YW
711 assert_return(nl, -EINVAL);
712 assert_return(!nl->event, -EBUSY);
b4f2a5b1 713
409856d3
YW
714 assert(!nl->io_event_source);
715 assert(!nl->time_event_source);
b4f2a5b1
TG
716
717 if (event)
409856d3 718 nl->event = sd_event_ref(event);
b4f2a5b1 719 else {
409856d3 720 r = sd_event_default(&nl->event);
b4f2a5b1
TG
721 if (r < 0)
722 return r;
723 }
724
409856d3 725 r = sd_event_add_io(nl->event, &nl->io_event_source, nl->fd, 0, io_callback, nl);
b4f2a5b1
TG
726 if (r < 0)
727 goto fail;
728
409856d3 729 r = sd_event_source_set_priority(nl->io_event_source, priority);
b4f2a5b1
TG
730 if (r < 0)
731 goto fail;
732
409856d3 733 r = sd_event_source_set_description(nl->io_event_source, "netlink-receive-message");
9021bb9f
TG
734 if (r < 0)
735 goto fail;
736
409856d3 737 r = sd_event_source_set_prepare(nl->io_event_source, prepare_callback);
b4f2a5b1
TG
738 if (r < 0)
739 goto fail;
740
409856d3 741 r = sd_event_add_time(nl->event, &nl->time_event_source, CLOCK_MONOTONIC, 0, 0, time_callback, nl);
b4f2a5b1
TG
742 if (r < 0)
743 goto fail;
744
409856d3 745 r = sd_event_source_set_priority(nl->time_event_source, priority);
b4f2a5b1
TG
746 if (r < 0)
747 goto fail;
748
409856d3 749 r = sd_event_source_set_description(nl->time_event_source, "netlink-timer");
9021bb9f
TG
750 if (r < 0)
751 goto fail;
752
b4f2a5b1
TG
753 return 0;
754
755fail:
409856d3 756 sd_netlink_detach_event(nl);
b4f2a5b1
TG
757 return r;
758}
759
dd35a61c 760int sd_netlink_detach_event(sd_netlink *nl) {
409856d3
YW
761 assert_return(nl, -EINVAL);
762 assert_return(nl->event, -ENXIO);
b4f2a5b1 763
409856d3 764 nl->io_event_source = sd_event_source_unref(nl->io_event_source);
b4f2a5b1 765
409856d3 766 nl->time_event_source = sd_event_source_unref(nl->time_event_source);
b4f2a5b1 767
409856d3 768 nl->event = sd_event_unref(nl->event);
b4f2a5b1
TG
769
770 return 0;
771}
8cec01b9 772
3f60e448
YW
773int netlink_add_match_internal(
774 sd_netlink *nl,
ee38400b 775 sd_netlink_slot **ret_slot,
3f60e448
YW
776 const uint32_t *groups,
777 size_t n_groups,
ee38400b 778 uint16_t type,
e1578f60 779 uint8_t cmd,
ee38400b
YW
780 sd_netlink_message_handler_t callback,
781 sd_netlink_destroy_t destroy_callback,
8190a388
YW
782 void *userdata,
783 const char *description) {
409856d3 784
ee38400b 785 _cleanup_free_ sd_netlink_slot *slot = NULL;
31710be5 786 int r;
8cec01b9 787
3f60e448
YW
788 assert(groups);
789 assert(n_groups > 0);
790
791 for (size_t i = 0; i < n_groups; i++) {
792 r = socket_broadcast_group_ref(nl, groups[i]);
793 if (r < 0)
794 return r;
795 }
8cec01b9 796
3f60e448
YW
797 r = netlink_slot_allocate(nl, !ret_slot, NETLINK_MATCH_CALLBACK, sizeof(struct match_callback),
798 userdata, description, &slot);
8190a388
YW
799 if (r < 0)
800 return r;
8cec01b9 801
3f60e448
YW
802 slot->match_callback.groups = newdup(uint32_t, groups, n_groups);
803 if (!slot->match_callback.groups)
804 return -ENOMEM;
805
806 slot->match_callback.n_groups = n_groups;
ee38400b
YW
807 slot->match_callback.callback = callback;
808 slot->match_callback.type = type;
e1578f60 809 slot->match_callback.cmd = cmd;
8cec01b9 810
3f60e448
YW
811 LIST_PREPEND(match_callbacks, nl->match_callbacks, &slot->match_callback);
812
813 /* Set this at last. Otherwise, some failures in above call the destroy callback but some do not. */
814 slot->destroy_callback = destroy_callback;
815
816 if (ret_slot)
817 *ret_slot = slot;
818
819 TAKE_PTR(slot);
820 return 0;
821}
822
dd35a61c 823int sd_netlink_add_match(
3f60e448
YW
824 sd_netlink *rtnl,
825 sd_netlink_slot **ret_slot,
826 uint16_t type,
827 sd_netlink_message_handler_t callback,
828 sd_netlink_destroy_t destroy_callback,
829 void *userdata,
830 const char *description) {
831
832 static const uint32_t
833 address_groups[] = { RTNLGRP_IPV4_IFADDR, RTNLGRP_IPV6_IFADDR, },
834 link_groups[] = { RTNLGRP_LINK, },
835 neighbor_groups[] = { RTNLGRP_NEIGH, },
836 nexthop_groups[] = { RTNLGRP_NEXTHOP, },
837 route_groups[] = { RTNLGRP_IPV4_ROUTE, RTNLGRP_IPV6_ROUTE, },
27e93a4b
YW
838 rule_groups[] = { RTNLGRP_IPV4_RULE, RTNLGRP_IPV6_RULE, },
839 tc_groups[] = { RTNLGRP_TC };
3f60e448
YW
840 const uint32_t *groups;
841 size_t n_groups;
842
843 assert_return(rtnl, -EINVAL);
844 assert_return(callback, -EINVAL);
845 assert_return(!netlink_pid_changed(rtnl), -ECHILD);
846
31710be5
TG
847 switch (type) {
848 case RTM_NEWLINK:
31710be5 849 case RTM_DELLINK:
3f60e448
YW
850 groups = link_groups;
851 n_groups = ELEMENTSOF(link_groups);
31710be5
TG
852 break;
853 case RTM_NEWADDR:
31710be5 854 case RTM_DELADDR:
3f60e448
YW
855 groups = address_groups;
856 n_groups = ELEMENTSOF(address_groups);
d1bdafd2
WKI
857 break;
858 case RTM_NEWNEIGH:
859 case RTM_DELNEIGH:
3f60e448
YW
860 groups = neighbor_groups;
861 n_groups = ELEMENTSOF(neighbor_groups);
31710be5 862 break;
87e4c847
TG
863 case RTM_NEWROUTE:
864 case RTM_DELROUTE:
3f60e448
YW
865 groups = route_groups;
866 n_groups = ELEMENTSOF(route_groups);
87e4c847 867 break;
bce67bbe
SS
868 case RTM_NEWRULE:
869 case RTM_DELRULE:
3f60e448
YW
870 groups = rule_groups;
871 n_groups = ELEMENTSOF(rule_groups);
bce67bbe 872 break;
c16c7808
SS
873 case RTM_NEWNEXTHOP:
874 case RTM_DELNEXTHOP:
3f60e448
YW
875 groups = nexthop_groups;
876 n_groups = ELEMENTSOF(nexthop_groups);
877 break;
27e93a4b
YW
878 case RTM_NEWQDISC:
879 case RTM_DELQDISC:
880 case RTM_NEWTCLASS:
881 case RTM_DELTCLASS:
882 groups = tc_groups;
883 n_groups = ELEMENTSOF(tc_groups);
884 break;
31710be5
TG
885 default:
886 return -EOPNOTSUPP;
887 }
888
e1578f60 889 return netlink_add_match_internal(rtnl, ret_slot, groups, n_groups, type, 0, callback,
3f60e448 890 destroy_callback, userdata, description);
8cec01b9 891}
dc317a9a 892
dd35a61c 893int sd_netlink_attach_filter(sd_netlink *nl, size_t len, const struct sock_filter *filter) {
dc317a9a
YW
894 assert_return(nl, -EINVAL);
895 assert_return(len == 0 || filter, -EINVAL);
896
897 if (setsockopt(nl->fd, SOL_SOCKET,
898 len == 0 ? SO_DETACH_FILTER : SO_ATTACH_FILTER,
899 &(struct sock_fprog) {
900 .len = len,
f4f81a6b 901 .filter = (struct sock_filter*) filter,
dc317a9a
YW
902 }, sizeof(struct sock_fprog)) < 0)
903 return -errno;
904
905 return 0;
906}