2 This file is part of systemd.
4 Copyright 2013 Tom Gundersen <teg@jklm.no>
6 systemd is free software; you can redistribute it and/or modify it
7 under the terms of the GNU Lesser General Public License as published by
8 the Free Software Foundation; either version 2.1 of the License, or
9 (at your option) any later version.
11 systemd is distributed in the hope that it will be useful, but
12 WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Lesser General Public License for more details.
16 You should have received a copy of the GNU Lesser General Public License
17 along with systemd; If not, see <http://www.gnu.org/licenses/>.
22 #include "alloc-util.h"
23 #include "conf-files.h"
24 #include "conf-parser.h"
27 #include "netlink-util.h"
28 #include "network-internal.h"
29 #include "netdev/netdev.h"
30 #include "networkd-manager.h"
31 #include "networkd-link.h"
32 #include "siphash24.h"
33 #include "stat-util.h"
34 #include "string-table.h"
35 #include "string-util.h"
37 #include "netdev/bridge.h"
38 #include "netdev/bond.h"
39 #include "netdev/geneve.h"
40 #include "netdev/vlan.h"
41 #include "netdev/macvlan.h"
42 #include "netdev/ipvlan.h"
43 #include "netdev/vxlan.h"
44 #include "netdev/tunnel.h"
45 #include "netdev/tuntap.h"
46 #include "netdev/veth.h"
47 #include "netdev/dummy.h"
48 #include "netdev/vrf.h"
49 #include "netdev/vcan.h"
/* Per-kind dispatch table. Each NETDEV_KIND_* enumerator listed below is
 * mapped to the address of the NetDevVTable for that kind; the array is
 * sized by _NETDEV_KIND_MAX. */
51 const NetDevVTable
* const netdev_vtable
[_NETDEV_KIND_MAX
] = {
52 [NETDEV_KIND_BRIDGE
] = &bridge_vtable
,
53 [NETDEV_KIND_BOND
] = &bond_vtable
,
54 [NETDEV_KIND_VLAN
] = &vlan_vtable
,
55 [NETDEV_KIND_MACVLAN
] = &macvlan_vtable
,
56 [NETDEV_KIND_MACVTAP
] = &macvtap_vtable
,
57 [NETDEV_KIND_IPVLAN
] = &ipvlan_vtable
,
58 [NETDEV_KIND_VXLAN
] = &vxlan_vtable
,
59 [NETDEV_KIND_IPIP
] = &ipip_vtable
,
60 [NETDEV_KIND_GRE
] = &gre_vtable
,
61 [NETDEV_KIND_GRETAP
] = &gretap_vtable
,
62 [NETDEV_KIND_IP6GRE
] = &ip6gre_vtable
,
63 [NETDEV_KIND_IP6GRETAP
] = &ip6gretap_vtable
,
64 [NETDEV_KIND_SIT
] = &sit_vtable
,
65 [NETDEV_KIND_VTI
] = &vti_vtable
,
66 [NETDEV_KIND_VTI6
] = &vti6_vtable
,
67 [NETDEV_KIND_VETH
] = &veth_vtable
,
68 [NETDEV_KIND_DUMMY
] = &dummy_vtable
,
69 [NETDEV_KIND_TUN
] = &tun_vtable
,
70 [NETDEV_KIND_TAP
] = &tap_vtable
,
71 [NETDEV_KIND_IP6TNL
] = &ip6tnl_vtable
,
72 [NETDEV_KIND_VRF
] = &vrf_vtable
,
73 [NETDEV_KIND_VCAN
] = &vcan_vtable
,
74 [NETDEV_KIND_GENEVE
] = &geneve_vtable
,
/* String name of every NetDevKind, indexed by the NETDEV_KIND_* enumerators.
 * This table is the input of the DEFINE_STRING_TABLE_LOOKUP(netdev_kind, ...)
 * expansion that follows it in this file. */
77 static const char* const netdev_kind_table
[_NETDEV_KIND_MAX
] = {
78 [NETDEV_KIND_BRIDGE
] = "bridge",
79 [NETDEV_KIND_BOND
] = "bond",
80 [NETDEV_KIND_VLAN
] = "vlan",
81 [NETDEV_KIND_MACVLAN
] = "macvlan",
82 [NETDEV_KIND_MACVTAP
] = "macvtap",
83 [NETDEV_KIND_IPVLAN
] = "ipvlan",
84 [NETDEV_KIND_VXLAN
] = "vxlan",
85 [NETDEV_KIND_IPIP
] = "ipip",
86 [NETDEV_KIND_GRE
] = "gre",
87 [NETDEV_KIND_GRETAP
] = "gretap",
88 [NETDEV_KIND_IP6GRE
] = "ip6gre",
89 [NETDEV_KIND_IP6GRETAP
] = "ip6gretap",
90 [NETDEV_KIND_SIT
] = "sit",
91 [NETDEV_KIND_VETH
] = "veth",
92 [NETDEV_KIND_VTI
] = "vti",
93 [NETDEV_KIND_VTI6
] = "vti6",
94 [NETDEV_KIND_DUMMY
] = "dummy",
95 [NETDEV_KIND_TUN
] = "tun",
96 [NETDEV_KIND_TAP
] = "tap",
97 [NETDEV_KIND_IP6TNL
] = "ip6tnl",
98 [NETDEV_KIND_VRF
] = "vrf",
99 [NETDEV_KIND_VCAN
] = "vcan",
100 [NETDEV_KIND_GENEVE
] = "geneve",
/* Instantiate the lookup helpers for the netdev_kind string table and the
 * config_parse_netdev_kind parser built on top of them.
 * NOTE(review): presumably this is where netdev_kind_to_string(), used later
 * in this file, comes from; confirm against the macro definitions. */
103 DEFINE_STRING_TABLE_LOOKUP(netdev_kind
, NetDevKind
);
104 DEFINE_CONFIG_PARSE_ENUM(config_parse_netdev_kind
, netdev_kind
, NetDevKind
, "Failed to parse netdev kind");
/* Flush every pending join callback queued on netdev.
 *
 * A synthetic netlink error message carrying -ENODEV is built once. Each
 * queued entry has its callback invoked with the manager rtnl handle, that
 * message and the waiting link; the entry is then unlinked from
 * netdev->callbacks and its link reference is dropped. */
106 static void netdev_cancel_callbacks(NetDev
*netdev
) {
107 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*m
= NULL
;
108 netdev_join_callback
*callback
;
113 rtnl_message_new_synthetic_error(-ENODEV
, 0, &m
);
/* Always take the current list head: the loop ends once the list is empty. */
115 while ((callback
= netdev
->callbacks
)) {
117 assert(callback
->link
);
118 assert(callback
->callback
);
119 assert(netdev
->manager
);
120 assert(netdev
->manager
->rtnl
);
/* Report the cancellation to the waiter through its own handler. */
122 callback
->callback(netdev
->manager
->rtnl
, m
, callback
->link
);
125 LIST_REMOVE(callbacks
, netdev
->callbacks
, callback
);
126 link_unref(callback
->link
);
/* Tear down a NetDev: cancel its pending join callbacks, remove it from the
 * manager netdevs hashmap (keyed by ifname), free the filename, description
 * and ifname strings and the four match condition lists, and finally run the
 * kind-specific done() hook when the vtable provides one. */
131 static void netdev_free(NetDev
*netdev
) {
135 netdev_cancel_callbacks(netdev
);
138 hashmap_remove(netdev
->manager
->netdevs
, netdev
->ifname
);
140 free(netdev
->filename
);
142 free(netdev
->description
);
143 free(netdev
->ifname
);
146 condition_free_list(netdev
->match_host
);
147 condition_free_list(netdev
->match_virt
);
148 condition_free_list(netdev
->match_kernel
);
149 condition_free_list(netdev
->match_arch
);
/* Both the vtable and its done member are optional. */
151 if (NETDEV_VTABLE(netdev
) &&
152 NETDEV_VTABLE(netdev
)->done
)
153 NETDEV_VTABLE(netdev
)->done(netdev
);
/* Drop one reference on netdev. NULL is tolerated. The guarded statement
 * runs once the decremented n_ref is zero or below.
 * NOTE(review): the guarded statement and the return value are not visible
 * here; presumably the object is freed at that point. */
158 NetDev
*netdev_unref(NetDev
*netdev
) {
159 if (netdev
&& (-- netdev
->n_ref
<= 0))
/* Take an additional reference on netdev. The assert_se() requires the
 * incremented count to be at least 2, so the caller must already hold a
 * reference when calling this. */
165 NetDev
*netdev_ref(NetDev
*netdev
) {
167 assert_se(++ netdev
->n_ref
>= 2);
/* Retire a netdev: switch it to NETDEV_STATE_LINGER, log the removal, cancel
 * every pending join callback and drop one reference. The leading guard
 * singles out a NULL netdev and one that is already lingering.
 * NOTE(review): the statement under that guard is not visible here;
 * presumably an early return. */
172 void netdev_drop(NetDev
*netdev
) {
173 if (!netdev
|| netdev
->state
== NETDEV_STATE_LINGER
)
176 netdev
->state
= NETDEV_STATE_LINGER
;
178 log_netdev_debug(netdev
, "netdev removed");
180 netdev_cancel_callbacks(netdev
);
182 netdev_unref(netdev
);
/* Look up the netdev registered under name in manager->netdevs.
 * NOTE(review): how the result is handed back through ret and which value
 * is returned are not visible here. */
187 int netdev_get(Manager
*manager
, const char *name
, NetDev
**ret
) {
194 netdev
= hashmap_get(manager
->netdevs
, name
);
/* Put netdev into NETDEV_STATE_FAILED and cancel every pending join
 * callback, so that waiting links are notified instead of hanging. */
205 static int netdev_enter_failed(NetDev
*netdev
) {
206 netdev
->state
= NETDEV_STATE_FAILED
;
208 netdev_cancel_callbacks(netdev
);
/* Enslave link to a master netdev that is already in NETDEV_STATE_READY.
 * The IN_SET assertion restricts the master to bridge, bond or VRF kinds.
 *
 * A link that is still up is logged as being brought down first. Then an
 * RTM_SETLINK request for link->ifindex is allocated, IFLA_MASTER is set to
 * netdev->ifindex, and the request is sent asynchronously with callback as
 * reply handler and link as its userdata.
 *
 * Every failure path hands r to log_netdev_error_errno(), so that the %m in
 * the message refers to the actual error, and returns the value of that
 * logging call. The send failure path previously used log_netdev_error()
 * without r, unlike all of its siblings. */
213 static int netdev_enslave_ready(NetDev
*netdev
, Link
* link
, sd_netlink_message_handler_t callback
) {
214 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*req
= NULL
;
218 assert(netdev
->state
== NETDEV_STATE_READY
);
219 assert(netdev
->manager
);
220 assert(netdev
->manager
->rtnl
);
221 assert(IN_SET(netdev
->kind
, NETDEV_KIND_BRIDGE
, NETDEV_KIND_BOND
, NETDEV_KIND_VRF
));
225 if (link
->flags
& IFF_UP
) {
226 log_netdev_debug(netdev
, "Link '%s' was up when attempting to enslave it. Bringing link down.", link
->ifname
);
229 return log_netdev_error_errno(netdev
, r
, "Could not bring link down: %m");
232 r
= sd_rtnl_message_new_link(netdev
->manager
->rtnl
, &req
, RTM_SETLINK
, link
->ifindex
);
234 return log_netdev_error_errno(netdev
, r
, "Could not allocate RTM_SETLINK message: %m");
236 r
= sd_netlink_message_append_u32(req
, IFLA_MASTER
, netdev
->ifindex
);
238 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_MASTER attribute: %m");
240 r
= sd_netlink_call_async(netdev
->manager
->rtnl
, req
, callback
, link
, 0, NULL
);
/* Pass r along, as every other failure path in this function does. */
242 return log_netdev_error_errno(netdev
, r
, "Could not send rtnetlink message: %m");
246 log_netdev_debug(netdev
, "Enslaving link '%s'", link
->ifname
);
/* Move netdev to NETDEV_STATE_READY. The state check singles out a netdev
 * that is not in NETDEV_STATE_CREATING.
 *
 * After the state change every join request queued on netdev->callbacks is
 * served: the waiting link is enslaved through netdev_enslave_ready() with
 * the stored callback, then the entry is unlinked and its link reference is
 * dropped. Last, the kind-specific post_create hook is invoked with two NULL
 * arguments when the vtable provides one.
 * NOTE(review): the statement under the state check and the handling of r
 * inside the loop are not visible here. */
251 static int netdev_enter_ready(NetDev
*netdev
) {
252 netdev_join_callback
*callback
, *callback_next
;
256 assert(netdev
->ifname
);
258 if (netdev
->state
!= NETDEV_STATE_CREATING
)
261 netdev
->state
= NETDEV_STATE_READY
;
263 log_netdev_info(netdev
, "netdev ready");
265 LIST_FOREACH_SAFE(callbacks
, callback
, callback_next
, netdev
->callbacks
) {
266 /* enslave the links that were attempted to be enslaved before the
268 r
= netdev_enslave_ready(netdev
, callback
->link
, callback
->callback
);
272 LIST_REMOVE(callbacks
, netdev
->callbacks
, callback
);
273 link_unref(callback
->link
);
277 if (NETDEV_VTABLE(netdev
)->post_create
)
278 NETDEV_VTABLE(netdev
)->post_create(netdev
, NULL
, NULL
);
283 /* callback for netdevs created without a backing Link.
 *
 * userdata is the NetDev the request was sent for; it is held in a
 * _cleanup_netdev_unref_ variable, so the reference is released when the
 * handler returns. The errno carried by the reply m is read into r. The
 * visible log calls cover three outcomes: the netdev already exists and is
 * reused unchanged, creation failed (warning that includes the error), and
 * a debug message reporting Created.
 * NOTE(review): the conditions selecting between these outcomes are not
 * visible here. */
284 static int netdev_create_handler(sd_netlink
*rtnl
, sd_netlink_message
*m
, void *userdata
) {
285 _cleanup_netdev_unref_ NetDev
*netdev
= userdata
;
288 assert(netdev
->state
!= _NETDEV_STATE_INVALID
);
290 r
= sd_netlink_message_get_errno(m
);
292 log_netdev_info(netdev
, "netdev exists, using existing without changing its parameters");
294 log_netdev_warning_errno(netdev
, r
, "netdev could not be created: %m");
300 log_netdev_debug(netdev
, "Created");
/* Request that link be enslaved to the master netdev (bridge, bond or VRF,
 * per the IN_SET assertion). What happens depends on the netdev state:
 *
 *  - NETDEV_STATE_READY: the link is enslaved right away through
 *    netdev_enslave_ready().
 *  - NETDEV_STATE_LINGER or NETDEV_STATE_FAILED: a synthetic -ENODEV netlink
 *    message is built and callback is invoked with it.
 *  - remaining branch: a netdev_join_callback entry is allocated, callback is
 *    stored in it and the entry is prepended to netdev->callbacks.
 *    netdev_enter_ready() walks that list and serves its entries.
 *
 * NOTE(review): error handling around r and the allocation is not visible
 * here. */
305 int netdev_enslave(NetDev
*netdev
, Link
*link
, sd_netlink_message_handler_t callback
) {
309 assert(netdev
->manager
);
310 assert(netdev
->manager
->rtnl
);
311 assert(IN_SET(netdev
->kind
, NETDEV_KIND_BRIDGE
, NETDEV_KIND_BOND
, NETDEV_KIND_VRF
));
313 if (netdev
->state
== NETDEV_STATE_READY
) {
314 r
= netdev_enslave_ready(netdev
, link
, callback
);
317 } else if (IN_SET(netdev
->state
, NETDEV_STATE_LINGER
, NETDEV_STATE_FAILED
)) {
318 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*m
= NULL
;
320 r
= rtnl_message_new_synthetic_error(-ENODEV
, 0, &m
);
322 callback(netdev
->manager
->rtnl
, m
, link
);
324 /* the netdev is not yet ready, save this request for when it is */
325 netdev_join_callback
*cb
;
327 cb
= new0(netdev_join_callback
, 1);
331 cb
->callback
= callback
;
335 LIST_PREPEND(callbacks
, netdev
->callbacks
, cb
);
337 log_netdev_debug(netdev
, "Will enslave '%s', when ready", link
->ifname
);
/* Bind netdev to the kernel interface described by an rtnl message.
 *
 * The message type must be RTM_NEWLINK and its ifindex must be positive. If
 * the netdev already has an ifindex, a different value is an error. The
 * IFLA_IFNAME of the message has to equal netdev->ifname, and the
 * IFLA_INFO_KIND found inside the IFLA_LINKINFO container has to equal the
 * expected kind string. Validation failures are logged and, where visible,
 * move the netdev to the failed state through netdev_enter_failed(). On
 * success the ifindex is stored and netdev_enter_ready() is called.
 *
 * NOTE(review): the conditions guarding the early returns and the returned
 * values are not visible here. */
343 int netdev_set_ifindex(NetDev
*netdev
, sd_netlink_message
*message
) {
346 const char *received_kind
;
347 const char *received_name
;
353 r
= sd_netlink_message_get_type(message
, &type
);
355 return log_netdev_error_errno(netdev
, r
, "Could not get rtnl message type: %m");
357 if (type
!= RTM_NEWLINK
) {
358 log_netdev_error(netdev
, "Cannot set ifindex from unexpected rtnl message type.");
362 r
= sd_rtnl_message_link_get_ifindex(message
, &ifindex
);
364 log_netdev_error_errno(netdev
, r
, "Could not get ifindex: %m");
365 netdev_enter_failed(netdev
);
367 } else if (ifindex
<= 0) {
368 log_netdev_error(netdev
, "Got invalid ifindex: %d", ifindex
);
369 netdev_enter_failed(netdev
);
/* An ifindex recorded earlier must agree with the one just received. */
373 if (netdev
->ifindex
> 0) {
374 if (netdev
->ifindex
!= ifindex
) {
375 log_netdev_error(netdev
, "Could not set ifindex to %d, already set to %d",
376 ifindex
, netdev
->ifindex
);
377 netdev_enter_failed(netdev
);
380 /* ifindex already set to the same for this netdev */
/* The interface name reported by the kernel must be the configured one. */
384 r
= sd_netlink_message_read_string(message
, IFLA_IFNAME
, &received_name
);
386 return log_netdev_error_errno(netdev
, r
, "Could not get IFNAME: %m");
388 if (!streq(netdev
->ifname
, received_name
)) {
389 log_netdev_error(netdev
, "Received newlink with wrong IFNAME %s", received_name
);
390 netdev_enter_failed(netdev
);
/* The kind string lives inside the IFLA_LINKINFO container. */
394 r
= sd_netlink_message_enter_container(message
, IFLA_LINKINFO
);
396 return log_netdev_error_errno(netdev
, r
, "Could not get LINKINFO: %m");
398 r
= sd_netlink_message_read_string(message
, IFLA_INFO_KIND
, &received_kind
);
400 return log_netdev_error_errno(netdev
, r
, "Could not get KIND: %m");
402 r
= sd_netlink_message_exit_container(message
);
404 return log_netdev_error_errno(netdev
, r
, "Could not exit container: %m");
406 if (netdev
->kind
== NETDEV_KIND_TAP
)
407 /* the kernel does not distinguish between tun and tap */
410 kind
= netdev_kind_to_string(netdev
->kind
);
412 log_netdev_error(netdev
, "Could not get kind");
413 netdev_enter_failed(netdev
);
418 if (!streq(kind
, received_kind
)) {
419 log_netdev_error(netdev
,
420 "Received newlink with wrong KIND %s, "
421 "expected %s", received_kind
, kind
);
422 netdev_enter_failed(netdev
);
/* All checks passed: remember the index and mark the netdev ready. */
426 netdev
->ifindex
= ifindex
;
428 log_netdev_debug(netdev
, "netdev has index %d", netdev
->ifindex
);
430 netdev_enter_ready(netdev
);
/* Fixed 128-bit key for the siphash24() call in netdev_get_mac(). */
435 #define HASH_KEY SD_ID128_MAKE(52,e1,45,bd,00,6f,29,96,21,c6,30,6d,83,71,04,48)
/* Derive a MAC address for the interface name ifname.
 *
 * A buffer v of sizeof(sd_id128_t) + l bytes is filled with the machine ID
 * followed by l bytes of ifname, and hashed with siphash24() under HASH_KEY.
 * The first ETH_ALEN bytes of the hash become the address octets of a newly
 * allocated struct ether_addr; the multicast bit of the first octet is then
 * cleared and the locally-assigned bit is set.
 *
 * NOTE(review): the definitions of l and v, the error handling and the
 * hand-over of mac through ret are not visible here. */
437 int netdev_get_mac(const char *ifname
, struct ether_addr
**ret
) {
438 _cleanup_free_
struct ether_addr
*mac
= NULL
;
447 mac
= new0(struct ether_addr
, 1);
452 sz
= sizeof(sd_id128_t
) + l
;
455 /* fetch some persistent data unique to the machine */
456 r
= sd_id128_get_machine((sd_id128_t
*) v
);
460 /* combine with some data unique (on this machine) to this
462 memcpy(v
+ sizeof(sd_id128_t
), ifname
, l
);
464 /* Let's hash the host machine ID plus the container name. We
465 * use a fixed, but originally randomly created hash key here. */
466 result
= siphash24(v
, sz
, HASH_KEY
.bytes
);
/* Compile-time guarantee that the hash is wide enough for a full MAC. */
468 assert_cc(ETH_ALEN
<= sizeof(result
));
469 memcpy(mac
->ether_addr_octet
, &result
, ETH_ALEN
);
471 /* see eth_random_addr in the kernel */
472 mac
->ether_addr_octet
[0] &= 0xfe; /* clear multicast bit */
473 mac
->ether_addr_octet
[0] |= 0x02; /* set local assignment bit (IEEE802) */
/* Ask the kernel to create the device described by netdev.
 *
 * A link may only be passed together with a callback (see the assertion).
 * If the kind provides its own create() hook, that hook is used. Otherwise an
 * RTM_NEWLINK message is assembled from IFLA_IFNAME, IFLA_ADDRESS, IFLA_MTU
 * and IFLA_LINK, followed by an IFLA_LINKINFO container holding an
 * IFLA_INFO_DATA union container keyed by the kind string, which the kind can
 * populate through its fill_message_create hook. The message is sent
 * asynchronously. Two send calls are visible: one with the caller callback
 * and link as userdata, one with netdev_create_handler and the netdev itself.
 * The state then becomes NETDEV_STATE_CREATING.
 *
 * NOTE(review): the conditions guarding the optional attributes and the
 * choice between the two send calls are not visible here. */
481 static int netdev_create(NetDev
*netdev
, Link
*link
,
482 sd_netlink_message_handler_t callback
) {
486 assert(!link
|| callback
);
/* Kinds with a dedicated create() hook bypass the generic netlink path. */
489 if (NETDEV_VTABLE(netdev
)->create
) {
492 r
= NETDEV_VTABLE(netdev
)->create(netdev
);
496 log_netdev_debug(netdev
, "Created");
498 _cleanup_(sd_netlink_message_unrefp
) sd_netlink_message
*m
= NULL
;
500 r
= sd_rtnl_message_new_link(netdev
->manager
->rtnl
, &m
, RTM_NEWLINK
, 0);
502 return log_netdev_error_errno(netdev
, r
, "Could not allocate RTM_NEWLINK message: %m");
504 r
= sd_netlink_message_append_string(m
, IFLA_IFNAME
, netdev
->ifname
);
506 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_IFNAME, attribute: %m");
509 r
= sd_netlink_message_append_ether_addr(m
, IFLA_ADDRESS
, netdev
->mac
);
511 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_ADDRESS attribute: %m");
515 r
= sd_netlink_message_append_u32(m
, IFLA_MTU
, netdev
->mtu
);
517 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_MTU attribute: %m");
521 r
= sd_netlink_message_append_u32(m
, IFLA_LINK
, link
->ifindex
);
523 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_LINK attribute: %m");
/* Kind-specific attributes are nested: IFLA_LINKINFO, then IFLA_INFO_DATA. */
526 r
= sd_netlink_message_open_container(m
, IFLA_LINKINFO
);
528 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_LINKINFO attribute: %m");
530 r
= sd_netlink_message_open_container_union(m
, IFLA_INFO_DATA
, netdev_kind_to_string(netdev
->kind
));
532 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_INFO_DATA attribute: %m");
534 if (NETDEV_VTABLE(netdev
)->fill_message_create
) {
535 r
= NETDEV_VTABLE(netdev
)->fill_message_create(netdev
, link
, m
);
/* Close IFLA_INFO_DATA first, then IFLA_LINKINFO. */
540 r
= sd_netlink_message_close_container(m
);
542 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_INFO_DATA attribute: %m");
544 r
= sd_netlink_message_close_container(m
);
546 return log_netdev_error_errno(netdev
, r
, "Could not append IFLA_LINKINFO attribute: %m");
549 r
= sd_netlink_call_async(netdev
->manager
->rtnl
, m
, callback
, link
, 0, NULL
);
551 return log_netdev_error_errno(netdev
, r
, "Could not send rtnetlink message: %m");
555 r
= sd_netlink_call_async(netdev
->manager
->rtnl
, m
, netdev_create_handler
, netdev
, 0, NULL
);
557 return log_netdev_error_errno(netdev
, r
, "Could not send rtnetlink message: %m");
562 netdev
->state
= NETDEV_STATE_CREATING
;
564 log_netdev_debug(netdev
, "Creating");
/* Join link to netdev, dispatching on the create_type of the netdev vtable:
 * NETDEV_CREATE_MASTER enslaves the link through netdev_enslave(), while
 * NETDEV_CREATE_STACKED creates the netdev on top of the link through
 * netdev_create(). An assert_not_reached() covers netdevs that cannot be
 * joined.
 * NOTE(review): the handling of r and the label in front of the
 * assert_not_reached() are not visible here. */
570 /* the callback must be called, possibly after a timeout, as otherwise the Link will hang */
571 int netdev_join(NetDev
*netdev
, Link
*link
, sd_netlink_message_handler_t callback
) {
575 assert(netdev
->manager
);
576 assert(netdev
->manager
->rtnl
);
577 assert(NETDEV_VTABLE(netdev
));
579 switch (NETDEV_VTABLE(netdev
)->create_type
) {
580 case NETDEV_CREATE_MASTER
:
581 r
= netdev_enslave(netdev
, link
, callback
);
586 case NETDEV_CREATE_STACKED
:
587 r
= netdev_create(netdev
, link
, callback
);
593 assert_not_reached("Can not join independent netdev");
/* Load a single netdev configuration file and register the resulting NetDev
 * with manager.
 *
 * The file is parsed twice. A first pass into the generic netdev_raw object
 * (config_parse_many, which is also given the drop-in directory name built
 * from the file basename plus the .d suffix) yields the kind, the name and
 * the match conditions. Empty files, configurations that do not match the
 * environment, and files without Kind or Name are logged and skipped. The
 * real object is then allocated with the object_size of the kind vtable,
 * initialised through the optional init hook, and filled by a second
 * config_parse() over the same FILE, restricted to the sections of that
 * kind. The fseek() back to the start of the file precedes this second pass.
 *
 * After the optional config_verify hook the filename is duplicated, a MAC
 * address is generated through netdev_get_mac() when none is set (VLAN
 * excluded), and the netdev is stored in manager->netdevs under its ifname.
 * Master and independent kinds are created right away; for the tunnel kinds
 * listed in the second switch the per-kind independent flag is read before
 * the final netdev_create() call.
 *
 * NOTE(review): error handling, the case label enclosing the second switch
 * and the condition on independent are not visible here. */
599 static int netdev_load_one(Manager
*manager
, const char *filename
) {
600 _cleanup_netdev_unref_ NetDev
*netdev
= NULL
;
601 _cleanup_free_ NetDev
*netdev_raw
= NULL
;
602 _cleanup_fclose_
FILE *file
= NULL
;
603 const char *dropin_dirname
;
604 bool independent
= false;
610 file
= fopen(filename
, "re");
618 if (null_or_empty_fd(fileno(file
))) {
619 log_debug("Skipping empty file: %s", filename
);
/* First pass: generic object, only used to learn kind, name and matches. */
623 netdev_raw
= new0(NetDev
, 1);
627 netdev_raw
->kind
= _NETDEV_KIND_INVALID
;
628 dropin_dirname
= strjoina(basename(filename
), ".d");
630 r
= config_parse_many(filename
, network_dirs
, dropin_dirname
,
632 config_item_perf_lookup
, network_netdev_gperf_lookup
,
/* Rewind so that the same FILE can be parsed a second time further down. */
637 r
= fseek(file
, 0, SEEK_SET
);
641 /* skip out early if configuration does not match the environment */
642 if (net_match_config(NULL
, NULL
, NULL
, NULL
, NULL
,
643 netdev_raw
->match_host
, netdev_raw
->match_virt
,
644 netdev_raw
->match_kernel
, netdev_raw
->match_arch
,
645 NULL
, NULL
, NULL
, NULL
, NULL
, NULL
) <= 0)
648 if (netdev_raw
->kind
== _NETDEV_KIND_INVALID
) {
649 log_warning("NetDev has no Kind configured in %s. Ignoring", filename
);
653 if (!netdev_raw
->ifname
) {
654 log_warning("NetDev without Name configured in %s. Ignoring", filename
);
/* Second pass: allocate the kind-specific object and parse into it. */
658 netdev
= malloc0(NETDEV_VTABLE(netdev_raw
)->object_size
);
663 netdev
->manager
= manager
;
664 netdev
->state
= _NETDEV_STATE_INVALID
;
665 netdev
->kind
= netdev_raw
->kind
;
666 netdev
->ifname
= netdev_raw
->ifname
;
668 if (NETDEV_VTABLE(netdev
)->init
)
669 NETDEV_VTABLE(netdev
)->init(netdev
);
671 r
= config_parse(NULL
, filename
, file
,
672 NETDEV_VTABLE(netdev
)->sections
,
673 config_item_perf_lookup
, network_netdev_gperf_lookup
,
674 false, false, false, netdev
);
678 /* verify configuration */
679 if (NETDEV_VTABLE(netdev
)->config_verify
) {
680 r
= NETDEV_VTABLE(netdev
)->config_verify(netdev
, filename
);
685 netdev
->filename
= strdup(filename
);
686 if (!netdev
->filename
)
/* No MAC configured: generate one from the interface name (not for VLAN). */
689 if (!netdev
->mac
&& netdev
->kind
!= NETDEV_KIND_VLAN
) {
690 r
= netdev_get_mac(netdev
->ifname
, &netdev
->mac
);
692 return log_error_errno(r
, "Failed to generate predictable MAC address for %s: %m", netdev
->ifname
);
695 r
= hashmap_put(netdev
->manager
->netdevs
, netdev
->ifname
, netdev
);
699 LIST_HEAD_INIT(netdev
->callbacks
);
701 log_netdev_debug(netdev
, "loaded %s", netdev_kind_to_string(netdev
->kind
));
/* Master and independent netdevs need no underlying link: create them now. */
703 switch (NETDEV_VTABLE(netdev
)->create_type
) {
704 case NETDEV_CREATE_MASTER
:
705 case NETDEV_CREATE_INDEPENDENT
:
706 r
= netdev_create(netdev
, NULL
, NULL
);
/* Tunnel kinds carry a per-kind independent flag; fetch it by kind. */
715 switch (netdev
->kind
) {
716 case NETDEV_KIND_IPIP
:
717 independent
= IPIP(netdev
)->independent
;
719 case NETDEV_KIND_GRE
:
720 independent
= GRE(netdev
)->independent
;
722 case NETDEV_KIND_GRETAP
:
723 independent
= GRETAP(netdev
)->independent
;
725 case NETDEV_KIND_IP6GRE
:
726 independent
= IP6GRE(netdev
)->independent
;
728 case NETDEV_KIND_IP6GRETAP
:
729 independent
= IP6GRETAP(netdev
)->independent
;
731 case NETDEV_KIND_SIT
:
732 independent
= SIT(netdev
)->independent
;
734 case NETDEV_KIND_VTI
:
735 independent
= VTI(netdev
)->independent
;
737 case NETDEV_KIND_VTI6
:
738 independent
= VTI6(netdev
)->independent
;
740 case NETDEV_KIND_IP6TNL
:
741 independent
= IP6TNL(netdev
)->independent
;
748 r
= netdev_create(netdev
, NULL
, NULL
);
/* Reload every netdev known to manager: each NetDev currently stored in
 * manager->netdevs is unreferenced, then all files with the .netdev suffix
 * found in network_dirs are enumerated and passed to netdev_load_one(),
 * walking the list backwards.
 * NOTE(review): the handling of r inside the loop and the end of the
 * function are not visible here. */
758 int netdev_load(Manager
*manager
) {
759 _cleanup_strv_free_
char **files
= NULL
;
/* Drain the hashmap: keep unreferencing its first entry until none is left. */
766 while ((netdev
= hashmap_first(manager
->netdevs
)))
767 netdev_unref(netdev
);
769 r
= conf_files_list_strv(&files
, ".netdev", NULL
, 0, network_dirs
);
771 return log_error_errno(r
, "Failed to enumerate netdev files: %m");
773 STRV_FOREACH_BACKWARDS(f
, files
) {
774 r
= netdev_load_one(manager
, *f
);