/***
  This file is part of systemd.

  Copyright 2013 Tom Gundersen <teg@jklm.no>

  systemd is free software; you can redistribute it and/or modify it
  under the terms of the GNU Lesser General Public License as published by
  the Free Software Foundation; either version 2.1 of the License, or
  (at your option) any later version.

  systemd is distributed in the hope that it will be useful, but
  WITHOUT ANY WARRANTY; without even the implied warranty of
  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  Lesser General Public License for more details.

  You should have received a copy of the GNU Lesser General Public License
  along with systemd; If not, see <http://www.gnu.org/licenses/>.
***/
#include <alloca.h>
#include <errno.h>
#include <string.h>

#include "alloc-util.h"
#include "conf-files.h"
#include "conf-parser.h"
#include "netlink-util.h"
#include "network-internal.h"
#include "netdev/netdev.h"
#include "siphash24.h"
#include "stat-util.h"
#include "string-table.h"
#include "string-util.h"
36 const NetDevVTable
* const netdev_vtable
[_NETDEV_KIND_MAX
] = {
37 [NETDEV_KIND_BRIDGE
] = &bridge_vtable
,
38 [NETDEV_KIND_BOND
] = &bond_vtable
,
39 [NETDEV_KIND_VLAN
] = &vlan_vtable
,
40 [NETDEV_KIND_MACVLAN
] = &macvlan_vtable
,
41 [NETDEV_KIND_MACVTAP
] = &macvtap_vtable
,
42 [NETDEV_KIND_IPVLAN
] = &ipvlan_vtable
,
43 [NETDEV_KIND_VXLAN
] = &vxlan_vtable
,
44 [NETDEV_KIND_IPIP
] = &ipip_vtable
,
45 [NETDEV_KIND_GRE
] = &gre_vtable
,
46 [NETDEV_KIND_GRETAP
] = &gretap_vtable
,
47 [NETDEV_KIND_IP6GRE
] = &ip6gre_vtable
,
48 [NETDEV_KIND_IP6GRETAP
] = &ip6gretap_vtable
,
49 [NETDEV_KIND_SIT
] = &sit_vtable
,
50 [NETDEV_KIND_VTI
] = &vti_vtable
,
51 [NETDEV_KIND_VTI6
] = &vti6_vtable
,
52 [NETDEV_KIND_VETH
] = &veth_vtable
,
53 [NETDEV_KIND_DUMMY
] = &dummy_vtable
,
54 [NETDEV_KIND_TUN
] = &tun_vtable
,
55 [NETDEV_KIND_TAP
] = &tap_vtable
,
56 [NETDEV_KIND_IP6TNL
] = &ip6tnl_vtable
,
57 [NETDEV_KIND_VRF
] = &vrf_vtable
,
58 [NETDEV_KIND_VCAN
] = &vcan_vtable
,
61 static const char* const netdev_kind_table
[_NETDEV_KIND_MAX
] = {
62 [NETDEV_KIND_BRIDGE
] = "bridge",
63 [NETDEV_KIND_BOND
] = "bond",
64 [NETDEV_KIND_VLAN
] = "vlan",
65 [NETDEV_KIND_MACVLAN
] = "macvlan",
66 [NETDEV_KIND_MACVTAP
] = "macvtap",
67 [NETDEV_KIND_IPVLAN
] = "ipvlan",
68 [NETDEV_KIND_VXLAN
] = "vxlan",
69 [NETDEV_KIND_IPIP
] = "ipip",
70 [NETDEV_KIND_GRE
] = "gre",
71 [NETDEV_KIND_GRETAP
] = "gretap",
72 [NETDEV_KIND_IP6GRE
] = "ip6gre",
73 [NETDEV_KIND_IP6GRETAP
] = "ip6gretap",
74 [NETDEV_KIND_SIT
] = "sit",
75 [NETDEV_KIND_VETH
] = "veth",
76 [NETDEV_KIND_VTI
] = "vti",
77 [NETDEV_KIND_VTI6
] = "vti6",
78 [NETDEV_KIND_DUMMY
] = "dummy",
79 [NETDEV_KIND_TUN
] = "tun",
80 [NETDEV_KIND_TAP
] = "tap",
81 [NETDEV_KIND_IP6TNL
] = "ip6tnl",
82 [NETDEV_KIND_VRF
] = "vrf",
83 [NETDEV_KIND_VCAN
] = "vcan",
86 DEFINE_STRING_TABLE_LOOKUP(netdev_kind
, NetDevKind
);
87 DEFINE_CONFIG_PARSE_ENUM(config_parse_netdev_kind
, netdev_kind
, NetDevKind
, "Failed to parse netdev kind");
89 static void netdev_cancel_callbacks(NetDev
*netdev
) {
90 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*m
= NULL
;
91 netdev_join_callback
*callback
;
96 rtnl_message_new_synthetic_error(-ENODEV
, 0, &m
);
98 while ((callback
= netdev
->callbacks
)) {
100 assert(callback
->link
);
101 assert(callback
->callback
);
102 assert(netdev
->manager
);
103 assert(netdev
->manager
->rtnl
);
105 callback
->callback(netdev
->manager
->rtnl
, m
, callback
->link
);
108 LIST_REMOVE(callbacks
, netdev
->callbacks
, callback
);
109 link_unref(callback
->link
);
114 static void netdev_free(NetDev
*netdev
) {
118 netdev_cancel_callbacks(netdev
);
121 hashmap_remove(netdev
->manager
->netdevs
, netdev
->ifname
);
123 free(netdev
->filename
);
125 free(netdev
->description
);
126 free(netdev
->ifname
);
129 condition_free_list(netdev
->match_host
);
130 condition_free_list(netdev
->match_virt
);
131 condition_free_list(netdev
->match_kernel
);
132 condition_free_list(netdev
->match_arch
);
134 if (NETDEV_VTABLE(netdev
) &&
135 NETDEV_VTABLE(netdev
)->done
)
136 NETDEV_VTABLE(netdev
)->done(netdev
);
141 NetDev
*netdev_unref(NetDev
*netdev
) {
142 if (netdev
&& (-- netdev
->n_ref
<= 0))
148 NetDev
*netdev_ref(NetDev
*netdev
) {
150 assert_se(++ netdev
->n_ref
>= 2);
155 void netdev_drop(NetDev
*netdev
) {
156 if (!netdev
|| netdev
->state
== NETDEV_STATE_LINGER
)
159 netdev
->state
= NETDEV_STATE_LINGER
;
161 log_netdev_debug(netdev
, "netdev removed");
163 netdev_cancel_callbacks(netdev
);
165 netdev_unref(netdev
);
170 int netdev_get(Manager
*manager
, const char *name
, NetDev
**ret
) {
177 netdev
= hashmap_get(manager
->netdevs
, name
);
188 static int netdev_enter_failed(NetDev
*netdev
) {
189 netdev
->state
= NETDEV_STATE_FAILED
;
191 netdev_cancel_callbacks(netdev
);
196 static int netdev_enslave_ready(NetDev
*netdev
, Link
* link
, sd_netlink_message_handler_t callback
) {
197 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*req
= NULL
;
201 assert(netdev
->state
== NETDEV_STATE_READY
);
202 assert(netdev
->manager
);
203 assert(netdev
->manager
->rtnl
);
204 assert(IN_SET(netdev
->kind
, NETDEV_KIND_BRIDGE
, NETDEV_KIND_BOND
, NETDEV_KIND_VRF
));
208 r
= sd_rtnl_message_new_link(netdev
->manager
->rtnl
, &req
, RTM_SETLINK
, link
->ifindex
);
210 return log_netdev_error_errno(netdev
, r
, "Could not allocate RTM_SETLINK message: %m");
212 r
= sd_netlink_message_append_u32(req
, IFLA_MASTER
, netdev
->ifindex
);
214 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_MASTER attribute: %m");
216 r
= sd_netlink_call_async(netdev
->manager
->rtnl
, req
, callback
, link
, 0, NULL
);
218 return log_netdev_error(netdev
, "Could not send rtnetlink message: %m");
222 log_netdev_debug(netdev
, "Enslaving link '%s'", link
->ifname
);
227 static int netdev_enter_ready(NetDev
*netdev
) {
228 netdev_join_callback
*callback
, *callback_next
;
232 assert(netdev
->ifname
);
234 if (netdev
->state
!= NETDEV_STATE_CREATING
)
237 netdev
->state
= NETDEV_STATE_READY
;
239 log_netdev_info(netdev
, "netdev ready");
241 LIST_FOREACH_SAFE(callbacks
, callback
, callback_next
, netdev
->callbacks
) {
242 /* enslave the links that were attempted to be enslaved before the
244 r
= netdev_enslave_ready(netdev
, callback
->link
, callback
->callback
);
248 LIST_REMOVE(callbacks
, netdev
->callbacks
, callback
);
249 link_unref(callback
->link
);
253 if (NETDEV_VTABLE(netdev
)->post_create
)
254 NETDEV_VTABLE(netdev
)->post_create(netdev
, NULL
, NULL
);
259 /* callback for netdev's created without a backing Link */
260 static int netdev_create_handler(sd_netlink
*rtnl
, sd_netlink_message
*m
, void *userdata
) {
261 _cleanup_netdev_unref_ NetDev
*netdev
= userdata
;
264 assert(netdev
->state
!= _NETDEV_STATE_INVALID
);
266 r
= sd_netlink_message_get_errno(m
);
268 log_netdev_info(netdev
, "netdev exists, using existing without changing its parameters");
270 log_netdev_warning_errno(netdev
, r
, "netdev could not be created: %m");
276 log_netdev_debug(netdev
, "Created");
281 int netdev_enslave(NetDev
*netdev
, Link
*link
, sd_netlink_message_handler_t callback
) {
285 assert(netdev
->manager
);
286 assert(netdev
->manager
->rtnl
);
287 assert(IN_SET(netdev
->kind
, NETDEV_KIND_BRIDGE
, NETDEV_KIND_BOND
, NETDEV_KIND_VRF
));
289 if (netdev
->state
== NETDEV_STATE_READY
) {
290 r
= netdev_enslave_ready(netdev
, link
, callback
);
293 } else if (IN_SET(netdev
->state
, NETDEV_STATE_LINGER
, NETDEV_STATE_FAILED
)) {
294 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*m
= NULL
;
296 r
= rtnl_message_new_synthetic_error(-ENODEV
, 0, &m
);
298 callback(netdev
->manager
->rtnl
, m
, link
);
300 /* the netdev is not yet read, save this request for when it is */
301 netdev_join_callback
*cb
;
303 cb
= new0(netdev_join_callback
, 1);
307 cb
->callback
= callback
;
311 LIST_PREPEND(callbacks
, netdev
->callbacks
, cb
);
313 log_netdev_debug(netdev
, "Will enslave '%s', when ready", link
->ifname
);
319 int netdev_set_ifindex(NetDev
*netdev
, sd_netlink_message
*message
) {
322 const char *received_kind
;
323 const char *received_name
;
329 r
= sd_netlink_message_get_type(message
, &type
);
331 return log_netdev_error_errno(netdev
, r
, "Could not get rtnl message type: %m");
333 if (type
!= RTM_NEWLINK
) {
334 log_netdev_error(netdev
, "Cannot set ifindex from unexpected rtnl message type.");
338 r
= sd_rtnl_message_link_get_ifindex(message
, &ifindex
);
340 log_netdev_error_errno(netdev
, r
, "Could not get ifindex: %m");
341 netdev_enter_failed(netdev
);
343 } else if (ifindex
<= 0) {
344 log_netdev_error(netdev
, "Got invalid ifindex: %d", ifindex
);
345 netdev_enter_failed(netdev
);
349 if (netdev
->ifindex
> 0) {
350 if (netdev
->ifindex
!= ifindex
) {
351 log_netdev_error(netdev
, "Could not set ifindex to %d, already set to %d",
352 ifindex
, netdev
->ifindex
);
353 netdev_enter_failed(netdev
);
356 /* ifindex already set to the same for this netdev */
360 r
= sd_netlink_message_read_string(message
, IFLA_IFNAME
, &received_name
);
362 return log_netdev_error_errno(netdev
, r
, "Could not get IFNAME: %m");
364 if (!streq(netdev
->ifname
, received_name
)) {
365 log_netdev_error(netdev
, "Received newlink with wrong IFNAME %s", received_name
);
366 netdev_enter_failed(netdev
);
370 r
= sd_netlink_message_enter_container(message
, IFLA_LINKINFO
);
372 return log_netdev_error_errno(netdev
, r
, "Could not get LINKINFO: %m");
374 r
= sd_netlink_message_read_string(message
, IFLA_INFO_KIND
, &received_kind
);
376 return log_netdev_error_errno(netdev
, r
, "Could not get KIND: %m");
378 r
= sd_netlink_message_exit_container(message
);
380 return log_netdev_error_errno(netdev
, r
, "Could not exit container: %m");
382 if (netdev
->kind
== NETDEV_KIND_TAP
)
383 /* the kernel does not distinguish between tun and tap */
386 kind
= netdev_kind_to_string(netdev
->kind
);
388 log_netdev_error(netdev
, "Could not get kind");
389 netdev_enter_failed(netdev
);
394 if (!streq(kind
, received_kind
)) {
395 log_netdev_error(netdev
,
396 "Received newlink with wrong KIND %s, "
397 "expected %s", received_kind
, kind
);
398 netdev_enter_failed(netdev
);
402 netdev
->ifindex
= ifindex
;
404 log_netdev_debug(netdev
, "netdev has index %d", netdev
->ifindex
);
406 netdev_enter_ready(netdev
);
411 #define HASH_KEY SD_ID128_MAKE(52,e1,45,bd,00,6f,29,96,21,c6,30,6d,83,71,04,48)
413 int netdev_get_mac(const char *ifname
, struct ether_addr
**ret
) {
414 _cleanup_free_
struct ether_addr
*mac
= NULL
;
423 mac
= new0(struct ether_addr
, 1);
428 sz
= sizeof(sd_id128_t
) + l
;
431 /* fetch some persistent data unique to the machine */
432 r
= sd_id128_get_machine((sd_id128_t
*) v
);
436 /* combine with some data unique (on this machine) to this
438 memcpy(v
+ sizeof(sd_id128_t
), ifname
, l
);
440 /* Let's hash the host machine ID plus the container name. We
441 * use a fixed, but originally randomly created hash key here. */
442 result
= siphash24(v
, sz
, HASH_KEY
.bytes
);
444 assert_cc(ETH_ALEN
<= sizeof(result
));
445 memcpy(mac
->ether_addr_octet
, &result
, ETH_ALEN
);
447 /* see eth_random_addr in the kernel */
448 mac
->ether_addr_octet
[0] &= 0xfe; /* clear multicast bit */
449 mac
->ether_addr_octet
[0] |= 0x02; /* set local assignment bit (IEEE802) */
457 static int netdev_create(NetDev
*netdev
, Link
*link
,
458 sd_netlink_message_handler_t callback
) {
462 assert(!link
|| callback
);
465 if (NETDEV_VTABLE(netdev
)->create
) {
468 r
= NETDEV_VTABLE(netdev
)->create(netdev
);
472 log_netdev_debug(netdev
, "Created");
474 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*m
= NULL
;
476 r
= sd_rtnl_message_new_link(netdev
->manager
->rtnl
, &m
, RTM_NEWLINK
, 0);
478 return log_netdev_error_errno(netdev
, r
, "Could not allocate RTM_NEWLINK message: %m");
480 r
= sd_netlink_message_append_string(m
, IFLA_IFNAME
, netdev
->ifname
);
482 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_IFNAME, attribute: %m");
485 r
= sd_netlink_message_append_ether_addr(m
, IFLA_ADDRESS
, netdev
->mac
);
487 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_ADDRESS attribute: %m");
491 r
= sd_netlink_message_append_u32(m
, IFLA_MTU
, netdev
->mtu
);
493 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_MTU attribute: %m");
497 r
= sd_netlink_message_append_u32(m
, IFLA_LINK
, link
->ifindex
);
499 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_LINK attribute: %m");
502 r
= sd_netlink_message_open_container(m
, IFLA_LINKINFO
);
504 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_LINKINFO attribute: %m");
506 r
= sd_netlink_message_open_container_union(m
, IFLA_INFO_DATA
, netdev_kind_to_string(netdev
->kind
));
508 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_INFO_DATA attribute: %m");
510 if (NETDEV_VTABLE(netdev
)->fill_message_create
) {
511 r
= NETDEV_VTABLE(netdev
)->fill_message_create(netdev
, link
, m
);
516 r
= sd_netlink_message_close_container(m
);
518 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_INFO_DATA attribute: %m");
520 r
= sd_netlink_message_close_container(m
);
522 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_LINKINFO attribute: %m");
525 r
= sd_netlink_call_async(netdev
->manager
->rtnl
, m
, callback
, link
, 0, NULL
);
527 return log_netdev_error_errno(netdev
, r
, "Could not send rtnetlink message: %m");
531 r
= sd_netlink_call_async(netdev
->manager
->rtnl
, m
, netdev_create_handler
, netdev
, 0, NULL
);
533 return log_netdev_error_errno(netdev
, r
, "Could not send rtnetlink message: %m");
538 netdev
->state
= NETDEV_STATE_CREATING
;
540 log_netdev_debug(netdev
, "Creating");
546 /* the callback must be called, possibly after a timeout, as otherwise the Link will hang */
547 int netdev_join(NetDev
*netdev
, Link
*link
, sd_netlink_message_handler_t callback
) {
551 assert(netdev
->manager
);
552 assert(netdev
->manager
->rtnl
);
553 assert(NETDEV_VTABLE(netdev
));
555 switch (NETDEV_VTABLE(netdev
)->create_type
) {
556 case NETDEV_CREATE_MASTER
:
557 r
= netdev_enslave(netdev
, link
, callback
);
562 case NETDEV_CREATE_STACKED
:
563 r
= netdev_create(netdev
, link
, callback
);
569 assert_not_reached("Can not join independent netdev");
575 static int netdev_load_one(Manager
*manager
, const char *filename
) {
576 _cleanup_netdev_unref_ NetDev
*netdev
= NULL
;
577 _cleanup_free_ NetDev
*netdev_raw
= NULL
;
578 _cleanup_fclose_
FILE *file
= NULL
;
579 const char *dropin_dirname
;
585 file
= fopen(filename
, "re");
593 if (null_or_empty_fd(fileno(file
))) {
594 log_debug("Skipping empty file: %s", filename
);
598 netdev_raw
= new0(NetDev
, 1);
602 netdev_raw
->kind
= _NETDEV_KIND_INVALID
;
603 dropin_dirname
= strjoina(basename(filename
), ".d");
605 r
= config_parse_many(filename
, network_dirs
, dropin_dirname
,
607 config_item_perf_lookup
, network_netdev_gperf_lookup
,
612 r
= fseek(file
, 0, SEEK_SET
);
616 /* skip out early if configuration does not match the environment */
617 if (net_match_config(NULL
, NULL
, NULL
, NULL
, NULL
,
618 netdev_raw
->match_host
, netdev_raw
->match_virt
,
619 netdev_raw
->match_kernel
, netdev_raw
->match_arch
,
620 NULL
, NULL
, NULL
, NULL
, NULL
, NULL
) <= 0)
623 if (netdev_raw
->kind
== _NETDEV_KIND_INVALID
) {
624 log_warning("NetDev has no Kind configured in %s. Ignoring", filename
);
628 if (!netdev_raw
->ifname
) {
629 log_warning("NetDev without Name configured in %s. Ignoring", filename
);
633 netdev
= malloc0(NETDEV_VTABLE(netdev_raw
)->object_size
);
638 netdev
->manager
= manager
;
639 netdev
->state
= _NETDEV_STATE_INVALID
;
640 netdev
->kind
= netdev_raw
->kind
;
641 netdev
->ifname
= netdev_raw
->ifname
;
643 if (NETDEV_VTABLE(netdev
)->init
)
644 NETDEV_VTABLE(netdev
)->init(netdev
);
646 r
= config_parse(NULL
, filename
, file
,
647 NETDEV_VTABLE(netdev
)->sections
,
648 config_item_perf_lookup
, network_netdev_gperf_lookup
,
649 false, false, false, netdev
);
653 /* verify configuration */
654 if (NETDEV_VTABLE(netdev
)->config_verify
) {
655 r
= NETDEV_VTABLE(netdev
)->config_verify(netdev
, filename
);
660 netdev
->filename
= strdup(filename
);
661 if (!netdev
->filename
)
664 if (!netdev
->mac
&& netdev
->kind
!= NETDEV_KIND_VLAN
) {
665 r
= netdev_get_mac(netdev
->ifname
, &netdev
->mac
);
667 return log_error_errno(r
, "Failed to generate predictable MAC address for %s: %m", netdev
->ifname
);
670 r
= hashmap_put(netdev
->manager
->netdevs
, netdev
->ifname
, netdev
);
674 LIST_HEAD_INIT(netdev
->callbacks
);
676 log_netdev_debug(netdev
, "loaded %s", netdev_kind_to_string(netdev
->kind
));
678 switch (NETDEV_VTABLE(netdev
)->create_type
) {
679 case NETDEV_CREATE_MASTER
:
680 case NETDEV_CREATE_INDEPENDENT
:
681 r
= netdev_create(netdev
, NULL
, NULL
);
695 int netdev_load(Manager
*manager
) {
696 _cleanup_strv_free_
char **files
= NULL
;
703 while ((netdev
= hashmap_first(manager
->netdevs
)))
704 netdev_unref(netdev
);
706 r
= conf_files_list_strv(&files
, ".netdev", NULL
, network_dirs
);
708 return log_error_errno(r
, "Failed to enumerate netdev files: %m");
710 STRV_FOREACH_BACKWARDS(f
, files
) {
711 r
= netdev_load_one(manager
, *f
);