2 This file is part of systemd.
4 Copyright 2013 Tom Gundersen <teg@jklm.no>
6 systemd is free software; you can redistribute it and/or modify it
7 under the terms of the GNU Lesser General Public License as published by
8 the Free Software Foundation; either version 2.1 of the License, or
9 (at your option) any later version.
11 systemd is distributed in the hope that it will be useful, but
12 WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
16 You should have received a copy of the GNU Lesser General Public License
17 along with systemd; If not, see <http://www.gnu.org/licenses/>.
22 #include "alloc-util.h"
23 #include "conf-files.h"
24 #include "conf-parser.h"
27 #include "netlink-util.h"
28 #include "network-internal.h"
29 #include "networkd-netdev.h"
31 #include "siphash24.h"
32 #include "stat-util.h"
33 #include "string-table.h"
34 #include "string-util.h"
/* Dispatch table: maps every NetDevKind value to the vtable implementing
 * that kind of virtual network device. The array is indexed by
 * NETDEV_KIND_* and sized by _NETDEV_KIND_MAX; any kind without a
 * designated initializer below is left as a NULL entry.
 * NOTE(review): the *_vtable objects are declared elsewhere (not visible
 * in this excerpt). */
36 const NetDevVTable
* const netdev_vtable
[_NETDEV_KIND_MAX
] = {
38 [NETDEV_KIND_BRIDGE
] = &bridge_vtable
,
39 [NETDEV_KIND_BOND
] = &bond_vtable
,
40 [NETDEV_KIND_VLAN
] = &vlan_vtable
,
41 [NETDEV_KIND_MACVLAN
] = &macvlan_vtable
,
42 [NETDEV_KIND_MACVTAP
] = &macvtap_vtable
,
43 [NETDEV_KIND_IPVLAN
] = &ipvlan_vtable
,
44 [NETDEV_KIND_VXLAN
] = &vxlan_vtable
,
45 [NETDEV_KIND_IPIP
] = &ipip_vtable
,
46 [NETDEV_KIND_GRE
] = &gre_vtable
,
47 [NETDEV_KIND_GRETAP
] = &gretap_vtable
,
48 [NETDEV_KIND_IP6GRE
] = &ip6gre_vtable
,
49 [NETDEV_KIND_IP6GRETAP
] = &ip6gretap_vtable
,
50 [NETDEV_KIND_SIT
] = &sit_vtable
,
51 [NETDEV_KIND_VTI
] = &vti_vtable
,
52 [NETDEV_KIND_VTI6
] = &vti6_vtable
,
53 [NETDEV_KIND_VETH
] = &veth_vtable
,
54 [NETDEV_KIND_DUMMY
] = &dummy_vtable
,
55 [NETDEV_KIND_TUN
] = &tun_vtable
,
56 [NETDEV_KIND_TAP
] = &tap_vtable
,
57 [NETDEV_KIND_IP6TNL
] = &ip6tnl_vtable
,
58 [NETDEV_KIND_VRF
] = &vrf_vtable
,
59 [NETDEV_KIND_VCAN
] = &vcan_vtable
,
/* Textual name of each NetDevKind, indexed by NETDEV_KIND_*.
 * netdev_set_ifindex() further down compares the string obtained via
 * netdev_kind_to_string() against the IFLA_INFO_KIND value received from
 * the kernel, so these presumably have to match the kernel's kind names
 * -- TODO confirm. */
62 static const char* const netdev_kind_table
[_NETDEV_KIND_MAX
] = {
63 [NETDEV_KIND_BRIDGE
] = "bridge",
64 [NETDEV_KIND_BOND
] = "bond",
65 [NETDEV_KIND_VLAN
] = "vlan",
66 [NETDEV_KIND_MACVLAN
] = "macvlan",
67 [NETDEV_KIND_MACVTAP
] = "macvtap",
68 [NETDEV_KIND_IPVLAN
] = "ipvlan",
69 [NETDEV_KIND_VXLAN
] = "vxlan",
70 [NETDEV_KIND_IPIP
] = "ipip",
71 [NETDEV_KIND_GRE
] = "gre",
72 [NETDEV_KIND_GRETAP
] = "gretap",
73 [NETDEV_KIND_IP6GRE
] = "ip6gre",
74 [NETDEV_KIND_IP6GRETAP
] = "ip6gretap",
75 [NETDEV_KIND_SIT
] = "sit",
76 [NETDEV_KIND_VETH
] = "veth",
77 [NETDEV_KIND_VTI
] = "vti",
78 [NETDEV_KIND_VTI6
] = "vti6",
79 [NETDEV_KIND_DUMMY
] = "dummy",
80 [NETDEV_KIND_TUN
] = "tun",
81 [NETDEV_KIND_TAP
] = "tap",
82 [NETDEV_KIND_IP6TNL
] = "ip6tnl",
83 [NETDEV_KIND_VRF
] = "vrf",
84 [NETDEV_KIND_VCAN
] = "vcan",
/* Instantiate the lookup helpers for the table above and the config-file
 * parser for the NetDevKind setting. NOTE(review): what exactly these
 * macros generate is defined outside this excerpt; netdev_kind_to_string(),
 * used later in this file, is presumably one of the generated functions. */
87 DEFINE_STRING_TABLE_LOOKUP(netdev_kind
, NetDevKind
);
88 DEFINE_CONFIG_PARSE_ENUM(config_parse_netdev_kind
, netdev_kind
, NetDevKind
, "Failed to parse netdev kind");
/* Fail every join request still queued on netdev->callbacks.
 *
 * A synthetic netlink error message carrying -ENODEV is built once, then
 * each queued entry has its handler invoked with that message and its
 * link as userdata, is unlinked from the list, and has its link reference
 * dropped. The loop always takes the current list head, so it ends when
 * the list is empty. */
90 static void netdev_cancel_callbacks(NetDev
*netdev
) {
91 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*m
= NULL
;
92 netdev_join_callback
*callback
;
/* NOTE(review): as visible here the return value of this call is not
 * stored or checked, so 'm' may still be NULL when handed to the
 * handlers below -- confirm handlers tolerate that. */
97 rtnl_message_new_synthetic_error(-ENODEV
, 0, &m
);
99 while ((callback
= netdev
->callbacks
)) {
101 assert(callback
->link
);
102 assert(callback
->callback
);
103 assert(netdev
->manager
);
104 assert(netdev
->manager
->rtnl
);
106 callback
->callback(netdev
->manager
->rtnl
, m
, callback
->link
);
109 LIST_REMOVE(callbacks
, netdev
->callbacks
, callback
);
110 link_unref(callback
->link
);
/* Tear down a NetDev.
 *
 * In order: pending join callbacks are cancelled, the entry keyed by
 * ifname is removed from the manager's netdevs hashmap, the filename,
 * description and ifname strings are freed, the four match condition
 * lists (host, virt, kernel, arch) are freed, and the kind-specific
 * done() hook is called when the kind has a vtable that provides one. */
115 static void netdev_free(NetDev
*netdev
) {
119 netdev_cancel_callbacks(netdev
);
/* must happen before ifname is freed below: ifname is the hashmap key */
122 hashmap_remove(netdev
->manager
->netdevs
, netdev
->ifname
);
124 free(netdev
->filename
);
126 free(netdev
->description
);
127 free(netdev
->ifname
);
130 condition_free_list(netdev
->match_host
);
131 condition_free_list(netdev
->match_virt
);
132 condition_free_list(netdev
->match_kernel
);
133 condition_free_list(netdev
->match_arch
);
/* both the vtable and its done() member are optional */
135 if (NETDEV_VTABLE(netdev
) &&
136 NETDEV_VTABLE(netdev
)->done
)
137 NETDEV_VTABLE(netdev
)->done(netdev
);
/* Drop one reference from 'netdev'; a NULL argument is accepted.
 * The guarded action runs once the decremented count is zero or less.
 * NOTE(review): the statement under this condition and the return value
 * are not visible in this excerpt; presumably the object is released via
 * netdev_free() -- confirm. */
142 NetDev
*netdev_unref(NetDev
*netdev
) {
143 if (netdev
&& (-- netdev
->n_ref
<= 0))
/* Take an additional reference on 'netdev'.
 * The increment is performed inside the assertion, which requires the new
 * count to be at least 2, i.e. the caller must already hold a reference.
 * NOTE(review): this relies on assert_se() always evaluating its argument
 * -- confirm against its definition. */
149 NetDev
*netdev_ref(NetDev
*netdev
) {
151 assert_se(++ netdev
->n_ref
>= 2);
/* Mark a netdev as removed.
 * The first condition guards against a NULL netdev or one that is already
 * in NETDEV_STATE_LINGER (the statement it guards is not visible in this
 * excerpt; presumably an early return). Otherwise the state becomes
 * LINGER, the removal is logged, pending join callbacks are cancelled and
 * one reference is dropped. */
156 void netdev_drop(NetDev
*netdev
) {
157 if (!netdev
|| netdev
->state
== NETDEV_STATE_LINGER
)
160 netdev
->state
= NETDEV_STATE_LINGER
;
162 log_netdev_debug(netdev
, "netdev removed");
164 netdev_cancel_callbacks(netdev
);
166 netdev_unref(netdev
);
/* Look up a netdev by interface name in manager->netdevs.
 * NOTE(review): only the hashmap lookup is visible in this excerpt; how
 * the result is stored in *ret and which value is returned for a miss is
 * not shown here. */
171 int netdev_get(Manager
*manager
, const char *name
, NetDev
**ret
) {
178 netdev
= hashmap_get(manager
->netdevs
, name
);
/* Put the netdev into NETDEV_STATE_FAILED and fail all join requests
 * that are still queued on it. */
189 static int netdev_enter_failed(NetDev
*netdev
) {
190 netdev
->state
= NETDEV_STATE_FAILED
;
192 netdev_cancel_callbacks(netdev
);
/* Ask the kernel to attach 'link' to the master device 'netdev'.
 *
 * Preconditions (asserted): the netdev is in NETDEV_STATE_READY, has a
 * manager with an rtnl connection, and is a bridge, bond or VRF.
 *
 * Builds an RTM_SETLINK message for link->ifindex, sets IFLA_MASTER to
 * netdev->ifindex and sends it asynchronously; 'callback' is invoked with
 * 'link' as userdata when the reply arrives. Each failing step is logged
 * together with the error code held in 'r'. */
197 static int netdev_enslave_ready(NetDev
*netdev
, Link
* link
, sd_netlink_message_handler_t callback
) {
198 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*req
= NULL
;
202 assert(netdev
->state
== NETDEV_STATE_READY
);
203 assert(netdev
->manager
);
204 assert(netdev
->manager
->rtnl
);
205 assert(IN_SET(netdev
->kind
, NETDEV_KIND_BRIDGE
, NETDEV_KIND_BOND
, NETDEV_KIND_VRF
));
209 r
= sd_rtnl_message_new_link(netdev
->manager
->rtnl
, &req
, RTM_SETLINK
, link
->ifindex
);
211 return log_netdev_error_errno(netdev
, r
, "Could not allocate RTM_SETLINK message: %m");
213 r
= sd_netlink_message_append_u32(req
, IFLA_MASTER
, netdev
->ifindex
);
215 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_MASTER attribute: %m");
217 r
= sd_netlink_call_async(netdev
->manager
->rtnl
, req
, callback
, link
, 0, NULL
);
/* Use the _errno variant like the other error paths in this function:
 * the failure code is in 'r', and the message's %m needs it to print
 * the right error text. */
219 return log_netdev_error_errno(netdev
, r
, "Could not send rtnetlink message: %m");
223 log_netdev_debug(netdev
, "Enslaving link '%s'", link
->ifname
);
/* Move a netdev from NETDEV_STATE_CREATING to NETDEV_STATE_READY.
 *
 * The state check at the top guards against any state other than
 * CREATING (the guarded statement is not visible in this excerpt).
 * Once ready, every join request queued on netdev->callbacks is replayed
 * through netdev_enslave_ready(), removed from the list and its link
 * reference dropped; the SAFE list iterator is used because entries are
 * removed while iterating. Finally the kind's optional post_create() hook
 * is invoked with NULL for its last two arguments. */
228 static int netdev_enter_ready(NetDev
*netdev
) {
229 netdev_join_callback
*callback
, *callback_next
;
233 assert(netdev
->ifname
);
235 if (netdev
->state
!= NETDEV_STATE_CREATING
)
238 netdev
->state
= NETDEV_STATE_READY
;
240 log_netdev_info(netdev
, "netdev ready");
242 LIST_FOREACH_SAFE(callbacks
, callback
, callback_next
, netdev
->callbacks
) {
243 /* enslave the links that were attempted to be enslaved before the
245 r
= netdev_enslave_ready(netdev
, callback
->link
, callback
->callback
);
249 LIST_REMOVE(callbacks
, netdev
->callbacks
, callback
);
250 link_unref(callback
->link
);
254 if (NETDEV_VTABLE(netdev
)->post_create
)
255 NETDEV_VTABLE(netdev
)->post_create(netdev
, NULL
, NULL
);
260 /* callback for netdev's created without a backing Link */
/* 'userdata' is the NetDev the create request was sent for. It is held in
 * a _cleanup_netdev_unref_ variable, so a reference is presumably dropped
 * when this handler returns -- confirm against the sender. The reply's
 * errno is read from 'm'; the three log calls below cover the "already
 * exists", "creation failed" and "created" outcomes (the conditions that
 * select between them are not visible in this excerpt). */
261 static int netdev_create_handler(sd_netlink
*rtnl
, sd_netlink_message
*m
, void *userdata
) {
262 _cleanup_netdev_unref_ NetDev
*netdev
= userdata
;
265 assert(netdev
->state
!= _NETDEV_STATE_INVALID
);
267 r
= sd_netlink_message_get_errno(m
);
269 log_netdev_info(netdev
, "netdev exists, using existing without changing its parameters");
271 log_netdev_warning_errno(netdev
, r
, "netdev could not be created: %m");
277 log_netdev_debug(netdev
, "Created");
/* Request that 'link' be attached to the master device 'netdev'
 * (asserted to be a bridge, bond or VRF with a usable rtnl connection).
 *
 * Behaviour depends on the netdev's state:
 *  - READY: the request is sent right away via netdev_enslave_ready().
 *  - LINGER or FAILED: a synthetic -ENODEV netlink error is built and
 *    'callback' is invoked immediately with it and 'link'.
 *  - anything else: the request is recorded in a newly allocated
 *    netdev_join_callback and prepended to netdev->callbacks, to be
 *    replayed once the netdev becomes ready. */
282 int netdev_enslave(NetDev
*netdev
, Link
*link
, sd_netlink_message_handler_t callback
) {
286 assert(netdev
->manager
);
287 assert(netdev
->manager
->rtnl
);
288 assert(IN_SET(netdev
->kind
, NETDEV_KIND_BRIDGE
, NETDEV_KIND_BOND
, NETDEV_KIND_VRF
));
290 if (netdev
->state
== NETDEV_STATE_READY
) {
291 r
= netdev_enslave_ready(netdev
, link
, callback
);
294 } else if (IN_SET(netdev
->state
, NETDEV_STATE_LINGER
, NETDEV_STATE_FAILED
)) {
295 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*m
= NULL
;
297 r
= rtnl_message_new_synthetic_error(-ENODEV
, 0, &m
);
299 callback(netdev
->manager
->rtnl
, m
, link
);
301 /* the netdev is not yet ready, save this request for when it is */
302 netdev_join_callback
*cb
;
304 cb
= new0(netdev_join_callback
, 1);
308 cb
->callback
= callback
;
312 LIST_PREPEND(callbacks
, netdev
->callbacks
, cb
);
314 log_netdev_debug(netdev
, "Will enslave '%s', when ready", link
->ifname
);
/* Bind a netdev to the kernel interface described by an rtnl 'message'.
 *
 * The message is validated step by step before the ifindex is accepted:
 *  1. its type must be RTM_NEWLINK;
 *  2. it must carry a positive ifindex;
 *  3. if the netdev already has an ifindex, it must be the same one;
 *  4. IFLA_IFNAME must equal netdev->ifname;
 *  5. IFLA_INFO_KIND (inside the IFLA_LINKINFO container) must equal the
 *     expected kind string for netdev->kind.
 * Most mismatches are logged and move the netdev to the failed state via
 * netdev_enter_failed(). On success the ifindex is stored and
 * netdev_enter_ready() is called.
 * NOTE(review): the conditions and return statements between the calls
 * below are not visible in this excerpt. */
320 int netdev_set_ifindex(NetDev
*netdev
, sd_netlink_message
*message
) {
323 const char *received_kind
;
324 const char *received_name
;
330 r
= sd_netlink_message_get_type(message
, &type
);
332 return log_netdev_error_errno(netdev
, r
, "Could not get rtnl message type: %m");
334 if (type
!= RTM_NEWLINK
) {
335 log_netdev_error(netdev
, "Cannot set ifindex from unexpected rtnl message type.");
339 r
= sd_rtnl_message_link_get_ifindex(message
, &ifindex
);
341 log_netdev_error_errno(netdev
, r
, "Could not get ifindex: %m");
342 netdev_enter_failed(netdev
);
344 } else if (ifindex
<= 0) {
345 log_netdev_error(netdev
, "Got invalid ifindex: %d", ifindex
);
346 netdev_enter_failed(netdev
);
350 if (netdev
->ifindex
> 0) {
351 if (netdev
->ifindex
!= ifindex
) {
352 log_netdev_error(netdev
, "Could not set ifindex to %d, already set to %d",
353 ifindex
, netdev
->ifindex
);
354 netdev_enter_failed(netdev
);
357 /* ifindex already set to the same for this netdev */
361 r
= sd_netlink_message_read_string(message
, IFLA_IFNAME
, &received_name
);
363 return log_netdev_error_errno(netdev
, r
, "Could not get IFNAME: %m");
365 if (!streq(netdev
->ifname
, received_name
)) {
366 log_netdev_error(netdev
, "Received newlink with wrong IFNAME %s", received_name
);
367 netdev_enter_failed(netdev
);
/* IFLA_INFO_KIND is nested inside IFLA_LINKINFO, hence enter/exit */
371 r
= sd_netlink_message_enter_container(message
, IFLA_LINKINFO
);
373 return log_netdev_error_errno(netdev
, r
, "Could not get LINKINFO: %m");
375 r
= sd_netlink_message_read_string(message
, IFLA_INFO_KIND
, &received_kind
);
377 return log_netdev_error_errno(netdev
, r
, "Could not get KIND: %m");
379 r
= sd_netlink_message_exit_container(message
);
381 return log_netdev_error_errno(netdev
, r
, "Could not exit container: %m");
383 if (netdev
->kind
== NETDEV_KIND_TAP
)
384 /* the kernel does not distinguish between tun and tap */
387 kind
= netdev_kind_to_string(netdev
->kind
);
389 log_netdev_error(netdev
, "Could not get kind");
390 netdev_enter_failed(netdev
);
395 if (!streq(kind
, received_kind
)) {
396 log_netdev_error(netdev
,
397 "Received newlink with wrong KIND %s, "
398 "expected %s", received_kind
, kind
);
399 netdev_enter_failed(netdev
);
403 netdev
->ifindex
= ifindex
;
405 log_netdev_debug(netdev
, "netdev has index %d", netdev
->ifindex
);
407 netdev_enter_ready(netdev
);
/* Fixed 128-bit key handed to siphash24() in netdev_get_mac() below. */
412 #define HASH_KEY SD_ID128_MAKE(52,e1,45,bd,00,6f,29,96,21,c6,30,6d,83,71,04,48)
/* Derive a MAC address for 'ifname' that is stable on this machine.
 *
 * A buffer 'v' of sizeof(sd_id128_t) + l bytes is filled with the machine
 * ID followed by l bytes of 'ifname', hashed with siphash24() under
 * HASH_KEY, and the first ETH_ALEN bytes of the hash become the address.
 * Bit 0 of the first octet is then cleared and bit 1 set, so the result
 * is a unicast, locally administered address.
 * NOTE(review): the declarations of 'l' and 'v' (presumably the length of
 * ifname and a scratch buffer), the error checks and the hand-over of the
 * result through *ret are not visible in this excerpt. */
414 int netdev_get_mac(const char *ifname
, struct ether_addr
**ret
) {
415 _cleanup_free_
struct ether_addr
*mac
= NULL
;
424 mac
= new0(struct ether_addr
, 1);
429 sz
= sizeof(sd_id128_t
) + l
;
432 /* fetch some persistent data unique to the machine */
433 r
= sd_id128_get_machine((sd_id128_t
*) v
);
437 /* combine with some data unique (on this machine) to this
439 memcpy(v
+ sizeof(sd_id128_t
), ifname
, l
);
441 /* Let's hash the host machine ID plus the container name. We
442 * use a fixed, but originally randomly created hash key here. */
443 result
= siphash24(v
, sz
, HASH_KEY
.bytes
);
445 assert_cc(ETH_ALEN
<= sizeof(result
));
446 memcpy(mac
->ether_addr_octet
, &result
, ETH_ALEN
);
448 /* see eth_random_addr in the kernel */
449 mac
->ether_addr_octet
[0] &= 0xfe; /* clear multicast bit */
450 mac
->ether_addr_octet
[0] |= 0x02; /* set local assignment bit (IEEE802) */
/* Create the kernel device for 'netdev'.
 *
 * 'link' is the underlying link for stacked devices and may be NULL; when
 * it is given, 'callback' must be given too (asserted).
 *
 * If the kind's vtable provides create(), creation is delegated to it.
 * Otherwise an RTM_NEWLINK message is assembled here: IFLA_IFNAME,
 * IFLA_ADDRESS, IFLA_MTU and IFLA_LINK attributes, then an IFLA_LINKINFO
 * container holding an IFLA_INFO_DATA union container keyed by the kind
 * name, which the kind's optional fill_message_create() hook populates.
 * The message is sent asynchronously, either with the caller's callback
 * and 'link' as userdata, or with netdev_create_handler and the netdev
 * itself. Afterwards the netdev is put into NETDEV_STATE_CREATING.
 * NOTE(review): the conditions selecting the optional attributes and the
 * two send paths are not visible in this excerpt. */
458 static int netdev_create(NetDev
*netdev
, Link
*link
,
459 sd_netlink_message_handler_t callback
) {
463 assert(!link
|| callback
);
466 if (NETDEV_VTABLE(netdev
)->create
) {
469 r
= NETDEV_VTABLE(netdev
)->create(netdev
);
473 log_netdev_debug(netdev
, "Created");
475 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*m
= NULL
;
477 r
= sd_rtnl_message_new_link(netdev
->manager
->rtnl
, &m
, RTM_NEWLINK
, 0);
479 return log_netdev_error_errno(netdev
, r
, "Could not allocate RTM_NEWLINK message: %m");
481 r
= sd_netlink_message_append_string(m
, IFLA_IFNAME
, netdev
->ifname
);
483 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_IFNAME attribute: %m");
486 r
= sd_netlink_message_append_ether_addr(m
, IFLA_ADDRESS
, netdev
->mac
);
488 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_ADDRESS attribute: %m");
492 r
= sd_netlink_message_append_u32(m
, IFLA_MTU
, netdev
->mtu
);
494 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_MTU attribute: %m");
498 r
= sd_netlink_message_append_u32(m
, IFLA_LINK
, link
->ifindex
);
500 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_LINK attribute: %m");
503 r
= sd_netlink_message_open_container(m
, IFLA_LINKINFO
);
505 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_LINKINFO attribute: %m");
507 r
= sd_netlink_message_open_container_union(m
, IFLA_INFO_DATA
, netdev_kind_to_string(netdev
->kind
));
509 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_INFO_DATA attribute: %m");
511 if (NETDEV_VTABLE(netdev
)->fill_message_create
) {
512 r
= NETDEV_VTABLE(netdev
)->fill_message_create(netdev
, link
, m
);
/* containers close in reverse order: IFLA_INFO_DATA first ... */
517 r
= sd_netlink_message_close_container(m
);
519 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_INFO_DATA attribute: %m");
/* ... then the enclosing IFLA_LINKINFO */
521 r
= sd_netlink_message_close_container(m
);
523 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_LINKINFO attribute: %m");
526 r
= sd_netlink_call_async(netdev
->manager
->rtnl
, m
, callback
, link
, 0, NULL
);
528 return log_netdev_error_errno(netdev
, r
, "Could not send rtnetlink message: %m");
532 r
= sd_netlink_call_async(netdev
->manager
->rtnl
, m
, netdev_create_handler
, netdev
, 0, NULL
);
534 return log_netdev_error_errno(netdev
, r
, "Could not send rtnetlink message: %m");
539 netdev
->state
= NETDEV_STATE_CREATING
;
541 log_netdev_debug(netdev
, "Creating");
547 /* the callback must be called, possibly after a timeout, as otherwise the Link will hang */
/* Join 'link' to 'netdev' according to the kind's create_type:
 *  - NETDEV_CREATE_MASTER: the link is enslaved via netdev_enslave();
 *  - NETDEV_CREATE_STACKED: the netdev is created on top of the link via
 *    netdev_create().
 * Any other create type is a programming error and hits
 * assert_not_reached(). */
548 int netdev_join(NetDev
*netdev
, Link
*link
, sd_netlink_message_handler_t callback
) {
552 assert(netdev
->manager
);
553 assert(netdev
->manager
->rtnl
);
554 assert(NETDEV_VTABLE(netdev
));
556 switch (NETDEV_VTABLE(netdev
)->create_type
) {
557 case NETDEV_CREATE_MASTER
:
558 r
= netdev_enslave(netdev
, link
, callback
);
563 case NETDEV_CREATE_STACKED
:
564 r
= netdev_create(netdev
, link
, callback
);
570 assert_not_reached("Can not join independent netdev");
/* Load one .netdev configuration file and register the resulting NetDev.
 *
 * The file is parsed twice:
 *  1. into a temporary plain NetDev ('netdev_raw') to learn the kind, the
 *     name and the match conditions; files that are empty, do not match
 *     the environment, have an invalid kind or lack a name are skipped;
 *  2. after rewinding the file, into the real object, which is allocated
 *     with the kind-specific object_size and parsed with the kind's own
 *     section list.
 * After the optional init() and config_verify() hooks, the filename is
 * recorded, a MAC address is generated for non-VLAN kinds that did not
 * configure one, and the netdev is inserted into manager->netdevs under
 * its ifname. Kinds whose create_type is MASTER or INDEPENDENT are created
 * immediately, without a backing link.
 * NOTE(review): error checks and return statements between the calls are
 * not visible in this excerpt. */
576 static int netdev_load_one(Manager
*manager
, const char *filename
) {
577 _cleanup_netdev_unref_ NetDev
*netdev
= NULL
;
578 _cleanup_free_ NetDev
*netdev_raw
= NULL
;
579 _cleanup_fclose_
FILE *file
= NULL
;
585 file
= fopen(filename
, "re");
593 if (null_or_empty_fd(fileno(file
))) {
594 log_debug("Skipping empty file: %s", filename
);
598 netdev_raw
= new0(NetDev
, 1);
602 netdev_raw
->kind
= _NETDEV_KIND_INVALID
;
/* first pass: only to discover kind, name and match conditions */
604 r
= config_parse(NULL
, filename
, file
,
606 config_item_perf_lookup
, network_netdev_gperf_lookup
,
607 true, false, true, netdev_raw
);
/* rewind so the same stream can be parsed again below */
611 r
= fseek(file
, 0, SEEK_SET
);
615 /* skip out early if configuration does not match the environment */
616 if (net_match_config(NULL
, NULL
, NULL
, NULL
, NULL
,
617 netdev_raw
->match_host
, netdev_raw
->match_virt
,
618 netdev_raw
->match_kernel
, netdev_raw
->match_arch
,
619 NULL
, NULL
, NULL
, NULL
, NULL
, NULL
) <= 0)
622 if (netdev_raw
->kind
== _NETDEV_KIND_INVALID
) {
623 log_warning("NetDev with invalid Kind configured in %s. Ignoring", filename
);
627 if (!netdev_raw
->ifname
) {
628 log_warning("NetDev without Name configured in %s. Ignoring", filename
);
/* the real object is sized per kind, as given by the kind's vtable */
632 netdev
= malloc0(NETDEV_VTABLE(netdev_raw
)->object_size
);
637 netdev
->manager
= manager
;
638 netdev
->state
= _NETDEV_STATE_INVALID
;
639 netdev
->kind
= netdev_raw
->kind
;
/* the name string is taken over from netdev_raw, not copied */
640 netdev
->ifname
= netdev_raw
->ifname
;
642 if (NETDEV_VTABLE(netdev
)->init
)
643 NETDEV_VTABLE(netdev
)->init(netdev
);
/* second pass: full parse using the kind's own section list */
645 r
= config_parse(NULL
, filename
, file
,
646 NETDEV_VTABLE(netdev
)->sections
,
647 config_item_perf_lookup
, network_netdev_gperf_lookup
,
648 false, false, false, netdev
);
652 /* verify configuration */
653 if (NETDEV_VTABLE(netdev
)->config_verify
) {
654 r
= NETDEV_VTABLE(netdev
)->config_verify(netdev
, filename
);
659 netdev
->filename
= strdup(filename
);
660 if (!netdev
->filename
)
663 if (!netdev
->mac
&& netdev
->kind
!= NETDEV_KIND_VLAN
) {
664 r
= netdev_get_mac(netdev
->ifname
, &netdev
->mac
);
666 return log_error_errno(r
, "Failed to generate predictable MAC address for %s: %m", netdev
->ifname
);
669 r
= hashmap_put(netdev
->manager
->netdevs
, netdev
->ifname
, netdev
);
673 LIST_HEAD_INIT(netdev
->callbacks
);
675 log_netdev_debug(netdev
, "loaded %s", netdev_kind_to_string(netdev
->kind
));
677 switch (NETDEV_VTABLE(netdev
)->create_type
) {
678 case NETDEV_CREATE_MASTER
:
679 case NETDEV_CREATE_INDEPENDENT
:
680 r
= netdev_create(netdev
, NULL
, NULL
);
/* (Re)load all netdev configuration.
 *
 * Every netdev currently in manager->netdevs is unreferenced first; the
 * loop repeatedly takes the hashmap's first entry, so it presumably relies
 * on the final unref removing the entry from the hashmap (netdev_free()
 * does call hashmap_remove()) -- confirm. Then all ".netdev" files found
 * in network_dirs are enumerated and loaded one by one with
 * netdev_load_one(), iterating the file list backwards.
 * NOTE(review): this excerpt ends inside the loop; the handling of 'r'
 * and the function's return are not visible here. */
694 int netdev_load(Manager
*manager
) {
695 _cleanup_strv_free_
char **files
= NULL
;
702 while ((netdev
= hashmap_first(manager
->netdevs
)))
703 netdev_unref(netdev
);
705 r
= conf_files_list_strv(&files
, ".netdev", NULL
, network_dirs
);
707 return log_error_errno(r
, "Failed to enumerate netdev files: %m");
709 STRV_FOREACH_BACKWARDS(f
, files
) {
710 r
= netdev_load_one(manager
, *f
);