]> git.ipfire.org Git - thirdparty/bird.git/blame - nest/route.h
KRT: Improve syncer code to avoid using temporary data in rtable
[thirdparty/bird.git] / nest / route.h
CommitLineData
58ef912c
MM
1/*
2 * BIRD Internet Routing Daemon -- Routing Table
3 *
50fe90ed 4 * (c) 1998--2000 Martin Mares <mj@ucw.cz>
58ef912c
MM
5 *
6 * Can be freely distributed and used under the terms of the GNU GPL.
7 */
8
9#ifndef _BIRD_ROUTE_H_
10#define _BIRD_ROUTE_H_
11
0e02abfd 12#include "lib/lists.h"
5ea39eaa 13#include "lib/bitmap.h"
1feea03e 14#include "lib/resource.h"
9b0a0ba9 15#include "lib/net.h"
58ef912c 16
f4a60a9b 17struct ea_list;
2326b001 18struct protocol;
4cc78c50 19struct proto;
f4a60a9b 20struct rte_src;
730f2e2c
MM
21struct symbol;
22struct filter;
23struct cli;
2326b001 24
58ef912c
MM
25/*
26 * Generic data structure for storing network prefixes. Also used
3ab001b9 27 * for the master routing table. Currently implemented as a hash
62aa008a 28 * table.
58ef912c
MM
29 *
30 * Available operations:
31 * - insertion of new entry
32 * - deletion of entry
62aa008a 33 * - searching for entry by network prefix
3ab001b9 34 * - asynchronous retrieval of fib contents
58ef912c
MM
35 */
36
37struct fib_node {
3ab001b9
MM
38 struct fib_node *next; /* Next in hash chain */
39 struct fib_iterator *readers; /* List of readers of this node */
fe9f1a6d 40 net_addr addr[0];
3ab001b9
MM
41};
42
43struct fib_iterator { /* See lib/slists.h for an explanation */
44 struct fib_iterator *prev, *next; /* Must be synced with struct fib_node! */
3ab001b9
MM
45 byte efef; /* 0xff to distinguish between iterator and node */
46 byte pad[3];
0ba8a614 47 struct fib_node *node; /* Or NULL if freshly merged */
ae80a2de 48 uint hash;
58ef912c
MM
49};
50
fe9f1a6d 51typedef void (*fib_init_fn)(void *);
ce4aca09 52
58ef912c 53struct fib {
62aa008a
MM
54 pool *fib_pool; /* Pool holding all our data */
55 slab *fib_slab; /* Slab holding all fib nodes */
56 struct fib_node **hash_table; /* Node hash table */
ae80a2de
PT
57 uint hash_size; /* Number of hash table entries (a power of two) */
58 uint hash_order; /* Binary logarithm of hash_size */
04632fd7 59 uint hash_shift; /* 32 - hash_order */
fe9f1a6d 60 uint addr_type; /* Type of address data stored in fib (NET_*) */
f4a60a9b
OZ
61 uint node_size; /* FIB node size, 0 for nonuniform */
62 uint node_offset; /* Offset of fib_node struct inside of user data */
ae80a2de
PT
63 uint entries; /* Number of entries */
64 uint entries_min, entries_max; /* Entry count limits (else start rehashing) */
fe9f1a6d 65 fib_init_fn init; /* Constructor */
58ef912c
MM
66};
67
600998fc
OZ
68static inline void * fib_node_to_user(struct fib *f, struct fib_node *e)
69{ return e ? (void *) ((char *) e - f->node_offset) : NULL; }
70
71static inline struct fib_node * fib_user_to_node(struct fib *f, void *e)
72{ return e ? (void *) ((char *) e + f->node_offset) : NULL; }
73
fe9f1a6d 74void fib_init(struct fib *f, pool *p, uint addr_type, uint node_size, uint node_offset, uint hash_order, fib_init_fn init);
0f7d5b1a 75void *fib_find(struct fib *, const net_addr *); /* Find or return NULL if doesn't exist */
0264ccf6 76void *fib_get_chain(struct fib *f, const net_addr *a); /* Find first node in linked list from hash table */
a82f692e 77void *fib_get(struct fib *, const net_addr *); /* Find or create new if nonexistent */
0f7d5b1a 78void *fib_route(struct fib *, const net_addr *); /* Longest-match routing lookup */
62aa008a 79void fib_delete(struct fib *, void *); /* Remove fib entry */
a8b60382 80void fib_free(struct fib *); /* Destroy the fib */
3ab001b9
MM
81void fib_check(struct fib *); /* Consistency check for debugging */
82
83void fit_init(struct fib_iterator *, struct fib *); /* Internal functions, don't call */
84struct fib_node *fit_get(struct fib *, struct fib_iterator *);
85void fit_put(struct fib_iterator *, struct fib_node *);
8465dccb
OZ
86void fit_put_next(struct fib *f, struct fib_iterator *i, struct fib_node *n, uint hpos);
87
600998fc
OZ
88
89#define FIB_WALK(fib, type, z) do { \
90 struct fib_node *fn_, **ff_ = (fib)->hash_table; \
91 uint count_ = (fib)->hash_size; \
92 type *z; \
93 while (count_--) \
94 for (fn_ = *ff_++; z = fib_node_to_user(fib, fn_); fn_=fn_->next)
236d4eb8
MM
95
96#define FIB_WALK_END } while (0)
a8b60382 97
3ab001b9
MM
98#define FIB_ITERATE_INIT(it, fib) fit_init(it, fib)
99
600998fc
OZ
100#define FIB_ITERATE_START(fib, it, type, z) do { \
101 struct fib_node *fn_ = fit_get(fib, it); \
102 uint count_ = (fib)->hash_size; \
103 uint hpos_ = (it)->hash; \
104 type *z; \
3ab001b9 105 for(;;) { \
600998fc 106 if (!fn_) \
a82f692e 107 { \
600998fc 108 if (++hpos_ >= count_) \
8abbde02 109 break; \
600998fc 110 fn_ = (fib)->hash_table[hpos_]; \
8abbde02 111 continue; \
600998fc
OZ
112 } \
113 z = fib_node_to_user(fib, fn_);
3ab001b9 114
600998fc 115#define FIB_ITERATE_END fn_ = fn_->next; } } while(0)
3ab001b9 116
600998fc 117#define FIB_ITERATE_PUT(it) fit_put(it, fn_)
3ab001b9 118
600998fc 119#define FIB_ITERATE_PUT_NEXT(it, fib) fit_put_next(fib, it, fn_, hpos_)
8465dccb
OZ
120
121#define FIB_ITERATE_UNLINK(it, fib) fit_get(fib, it)
122
123
58ef912c 124/*
08e2d625
MM
125 * Master Routing Tables. Generally speaking, each of them contains a FIB
126 * with each entry pointing to a list of route entries representing routes
127 * to given network (with the selected one at the head).
128 *
58ef912c 129 * Each of the RTE's contains variable data (the preference and protocol-dependent
62aa008a 130 * metrics) and a pointer to a route attribute block common for many routes.
08e2d625
MM
131 *
132 * It's guaranteed that there is at most one RTE for every (prefix,proto) pair.
58ef912c
MM
133 */
134
0e02abfd
MM
135struct rtable_config {
136 node n;
137 char *name;
138 struct rtable *table;
7de45ba4 139 struct proto_config *krt_attached; /* Kernel syncer attached to this table */
fe9f1a6d 140 uint addr_type; /* Type of address data stored in table (NET_*) */
b9626ec6
MM
141 int gc_max_ops; /* Maximum number of operations before GC is run */
142 int gc_min_time; /* Minimum time between two consecutive GC runs */
26822d8f 143 byte sorted; /* Routes of network are sorted according to rte_better() */
0e02abfd
MM
144};
145
62aa008a 146typedef struct rtable {
0e02abfd 147 node n; /* Node in list of all tables */
62aa008a
MM
148 struct fib fib;
149 char *name; /* Name of this table */
f4a60a9b 150 list channels; /* List of attached channels (struct channel) */
fe9f1a6d 151 uint addr_type; /* Type of address data stored in table (NET_*) */
9c11ec9e 152 int pipe_busy; /* Pipe loop detection */
50fe90ed 153 int use_count; /* Number of protocols using this table */
67d8665a 154 u32 rt_count; /* Number of routes in the table */
5ea39eaa 155 struct hmap id_map;
cfe34a31 156 struct hostcache *hostcache;
b9626ec6 157 struct rtable_config *config; /* Configuration of this table */
50fe90ed
MM
158 struct config *deleted; /* Table doesn't exist in current configuration,
159 * delete as soon as use_count becomes 0 and remove
160 * obstacle from this routing table.
161 */
cfe34a31 162 struct event *rt_event; /* Routing table event */
f047271c 163 btime gc_time; /* Time of last GC */
b9626ec6 164 int gc_counter; /* Number of operations since last GC */
9135c1f0 165 byte prune_state; /* Table prune state, 1 -> scheduled, 2-> running */
cfe34a31
OZ
166 byte hcu_scheduled; /* Hostcache update is scheduled */
167 byte nhu_state; /* Next Hop Update state */
fb829de6 168 struct fib_iterator prune_fit; /* Rtable prune FIB iterator */
cfe34a31 169 struct fib_iterator nhu_fit; /* Next Hop Update FIB iterator */
62aa008a
MM
170} rtable;
171
93f50ca3
JMM
172#define NHU_CLEAN 0
173#define NHU_SCHEDULED 1
174#define NHU_RUNNING 2
175#define NHU_DIRTY 3
176
58ef912c 177typedef struct network {
58ef912c 178 struct rte *routes; /* Available routes for this network */
fe9f1a6d 179 struct fib_node n; /* FIB flags reserved for kernel syncer */
58ef912c
MM
180} net;
181
cfe34a31 182struct hostcache {
f2b76f2c
OZ
183 slab *slab; /* Slab holding all hostentries */
184 struct hostentry **hash_table; /* Hash table for hostentries */
185 unsigned hash_order, hash_shift;
186 unsigned hash_max, hash_min;
187 unsigned hash_items;
c477f489
OZ
188 linpool *lp; /* Linpool for trie */
189 struct f_trie *trie; /* Trie of prefixes that might affect hostentries */
190 list hostentries; /* List of all hostentries */
cfe34a31
OZ
191 byte update_hostcache;
192};
193
194struct hostentry {
cfe34a31 195 node ln;
1b180121
OZ
196 ip_addr addr; /* IP address of host, part of key */
197 ip_addr link; /* (link-local) IP address of host, used as gw
198 if host is directly attached */
acb04cfd 199 struct rtable *tab; /* Dependent table, part of key */
f2b76f2c
OZ
200 struct hostentry *next; /* Next in hash chain */
201 unsigned hash_key; /* Hash key */
cfe34a31 202 unsigned uc; /* Use count */
7e95c05d 203 struct rta *src; /* Source rta entry */
cfe34a31 204 byte dest; /* Chosen route destination type (RTD_...) */
039a65d0 205 byte nexthop_linkable; /* Nexthop list is completely non-device */
d1e146f2 206 u32 igp_metric; /* Chosen route IGP metric */
cfe34a31
OZ
207};
208
58ef912c
MM
209typedef struct rte {
210 struct rte *next;
a0762910 211 net *net; /* Network this RTE belongs to */
f4a60a9b 212 struct channel *sender; /* Channel used to send the route to the routing table */
1b769b08 213 struct rta *attrs; /* Attributes of this route */
5ea39eaa 214 u32 id; /* Table specific route id */
58ef912c 215 byte flags; /* Flags (REF_...) */
481f6985 216 byte pflags; /* Protocol-specific flags */
58ef912c 217 word pref; /* Route preference */
f047271c 218 btime lastmod; /* Last modified */
58ef912c 219 union { /* Protocol-dependent data (metrics etc.) */
58ef912c
MM
220#ifdef CONFIG_RIP
221 struct {
8465dccb
OZ
222 struct iface *from; /* Incoming iface */
223 u8 metric; /* RIP metric */
481f6985 224 u16 tag; /* External route tag */
58ef912c
MM
225 } rip;
226#endif
227#ifdef CONFIG_OSPF
228 struct {
229 u32 metric1, metric2; /* OSPF Type 1 and Type 2 metrics */
481f6985 230 u32 tag; /* External route tag */
c27b2449 231 u32 router_id; /* Router that originated this route */
58ef912c 232 } ospf;
be4cd99a
OZ
233#endif
234#ifdef CONFIG_BGP
235 struct {
236 u8 suppressed; /* Used for deterministic MED comparison */
5bd73431 237 s8 stale; /* Route is LLGR_STALE, -1 if unknown */
be4cd99a 238 } bgp;
937e75d8
OZ
239#endif
240#ifdef CONFIG_BABEL
241 struct {
3b3b0910 242 u16 seqno; /* Babel seqno */
937e75d8
OZ
243 u16 metric; /* Babel metric */
244 u64 router_id; /* Babel router id */
245 } babel;
58ef912c 246#endif
c10421d3
MM
247 struct { /* Routes generated by krt sync (both temporary and inherited ones) */
248 s8 src; /* Alleged route source (see krt.h) */
249 u8 proto; /* Kernel source protocol ID */
c10421d3 250 u8 seen; /* Seen during last scan */
e86cfd41 251 u8 best; /* Best route in network, propagated to core */
c10421d3
MM
252 u32 metric; /* Kernel metric */
253 } krt;
58ef912c
MM
254 } u;
255} rte;
256
00a09f3c 257#define REF_COW 1 /* Copy this rte on write */
15550957 258#define REF_FILTERED 2 /* Route is rejected by import filter */
0c791f87
OZ
259#define REF_STALE 4 /* Route is stale in a refresh cycle */
260#define REF_DISCARD 8 /* Route is scheduled for discard */
5bd73431 261#define REF_MODIFY 16 /* Route is scheduled for modify */
cf98be7b
OZ
262
263/* Route is valid for propagation (may depend on other flags in the future), accepts NULL */
15550957 264static inline int rte_is_valid(rte *r) { return r && !(r->flags & REF_FILTERED); }
cf98be7b 265
15550957
OZ
266/* Route just has REF_FILTERED flag */
267static inline int rte_is_filtered(rte *r) { return !!(r->flags & REF_FILTERED); }
cf98be7b 268
e2dc2f30 269
23ac9e9a 270/* Types of route announcement, also used as flags */
f8aad5d5 271#define RA_UNDEF 0 /* Undefined RA type */
00a09f3c
OZ
272#define RA_OPTIMAL 1 /* Announcement of optimal route change */
273#define RA_ACCEPTED 2 /* Announcement of first accepted route */
274#define RA_ANY 3 /* Announcement of any route change */
8d9eef17 275#define RA_MERGED 4 /* Announcement of optimal route merged with next ones */
23ac9e9a 276
14375237 277/* Return value of preexport() callback */
36da2857
OZ
278#define RIC_ACCEPT 1 /* Accepted by protocol */
279#define RIC_PROCESS 0 /* Process it through import filter */
280#define RIC_REJECT -1 /* Rejected by protocol */
281#define RIC_DROP -2 /* Silently dropped by protocol */
282
863ecfc7 283extern list routing_tables;
0e02abfd 284struct config;
2326b001
MM
285
286void rt_init(void);
0e02abfd 287void rt_preconfig(struct config *);
50fe90ed
MM
288void rt_commit(struct config *new, struct config *old);
289void rt_lock_table(rtable *);
290void rt_unlock_table(rtable *);
28b3b551 291void rt_setup(pool *, rtable *, struct rtable_config *);
0264ccf6 292static inline net *net_find(rtable *tab, const net_addr *addr) { return (net *) fib_find(&tab->fib, addr); }
7ee07a3c
JMM
293static inline net *net_find_valid(rtable *tab, const net_addr *addr)
294{ net *n = net_find(tab, addr); return (n && rte_is_valid(n->routes)) ? n : NULL; }
0264ccf6 295static inline net *net_get(rtable *tab, const net_addr *addr) { return (net *) fib_get(&tab->fib, addr); }
286e2011
OZ
296void *net_route(rtable *tab, const net_addr *n);
297int net_roa_check(rtable *tab, const net_addr *n, u32 asn);
094d2bdb 298rte *rte_find(net *net, struct rte_src *src);
1b769b08 299rte *rte_get_temp(struct rta *);
65d2a88d 300void rte_update2(struct channel *c, const net_addr *n, rte *new, struct rte_src *src);
f4a60a9b 301/* rte_update() moved to protocol.h to avoid dependency conflicts */
0b39b1cb 302int rt_examine(rtable *t, net_addr *a, struct proto *p, const struct filter *filter);
13c0be19 303rte *rt_export_merged(struct channel *c, net *net, rte **rt_free, linpool *pool, int silent);
f4a60a9b
OZ
304void rt_refresh_begin(rtable *t, struct channel *c);
305void rt_refresh_end(rtable *t, struct channel *c);
5bd73431 306void rt_modify_stale(rtable *t, struct channel *c);
f4a60a9b 307void rt_schedule_prune(rtable *t);
a0762910 308void rte_dump(rte *);
04925e90 309void rte_free(rte *);
e2dc2f30
MM
310rte *rte_do_cow(rte *);
311static inline rte * rte_cow(rte *r) { return (r->flags & REF_COW) ? rte_do_cow(r) : r; }
8d9eef17 312rte *rte_cow_rta(rte *r, linpool *lp);
875cc073
OZ
313void rte_init_tmp_attrs(struct rte *r, linpool *lp, uint max);
314void rte_make_tmp_attr(struct rte *r, uint id, uint type, uintptr_t val);
315void rte_make_tmp_attrs(struct rte **r, struct linpool *pool, struct rta **old_attrs);
316uintptr_t rte_store_tmp_attr(struct rte *r, uint id);
2326b001 317void rt_dump(rtable *);
a2ccbb0b 318void rt_dump_all(void);
f4a60a9b
OZ
319int rt_feed_channel(struct channel *c);
320void rt_feed_channel_abort(struct channel *c);
682d3f7d
OZ
321int rte_update_in(struct channel *c, const net_addr *n, rte *new, struct rte_src *src);
322int rt_reload_channel(struct channel *c);
323void rt_reload_channel_abort(struct channel *c);
324void rt_prune_sync(rtable *t, int all);
b7d7599c 325int rte_update_out(struct channel *c, const net_addr *n, rte *new, rte *old0, int refeed);
fe9f1a6d 326struct rtable_config *rt_new_table(struct symbol *s, uint addr_type);
2326b001 327
682d3f7d 328
517d05df
OZ
329/* Default limit for ECMP next hops, defined in sysdep code */
330extern const int rt_default_ecmp;
0c791f87 331
2faf519c
JMM
332struct rt_show_data_rtable {
333 node n;
334 rtable *table;
b2949999 335 struct channel *export_channel;
2faf519c
JMM
336};
337
730f2e2c 338struct rt_show_data {
04632fd7 339 net_addr *addr;
b2949999
OZ
340 list tables;
341 struct rt_show_data_rtable *tab; /* Iterator over table list */
342 struct rt_show_data_rtable *last_table; /* Last table in output */
343 struct fib_iterator fit; /* Iterator over networks in table */
2faf519c 344 int verbose, tables_defined_by;
0b39b1cb 345 const struct filter *filter;
4d176e14 346 struct proto *show_protocol;
ea2ae6dd 347 struct proto *export_protocol;
f4a60a9b 348 struct channel *export_channel;
ce1da96e 349 struct config *running_on_config;
cc75b3e1 350 struct krt_proto *kernel;
b2949999
OZ
351 int export_mode, primary_only, filtered, stats, show_for;
352
353 int table_open; /* Iteration (fit) is open */
2faf519c
JMM
354 int net_counter, rt_counter, show_counter, table_counter;
355 int net_counter_last, rt_counter_last, show_counter_last;
730f2e2c 356};
b2949999 357
730f2e2c 358void rt_show(struct rt_show_data *);
b2949999 359struct rt_show_data_rtable * rt_show_add_table(struct rt_show_data *d, rtable *t);
2faf519c
JMM
360
/*
 * Value of table definition mode (tables_defined_by) in struct rt_show_data.
 *
 * RSD_TDB_DIRECT is a combination of two internal bits, so its expansion is
 * parenthesized; otherwise an expression such as `x & RSD_TDB_DIRECT' would
 * parse as `(x & RSD_TDB_SET) | RSD_TDB_NMN'.
 */
#define RSD_TDB_DEFAULT   0                             /* no table specified */
#define RSD_TDB_INDIRECT  0                             /* show route ... protocol P ... */
#define RSD_TDB_ALL       RSD_TDB_SET                   /* show route ... table all ... */
#define RSD_TDB_DIRECT    (RSD_TDB_SET | RSD_TDB_NMN)   /* show route ... table X table Y ... */

#define RSD_TDB_SET       0x1                           /* internal: show empty tables */
#define RSD_TDB_NMN       0x2                           /* internal: need matching net */
730f2e2c 369
7aa80901
OZ
370/* Value of export_mode in struct rt_show_data */
371#define RSEM_NONE 0 /* Export mode not used */
372#define RSEM_PREEXPORT 1 /* Routes ready for export, before filtering */
373#define RSEM_EXPORT 2 /* Routes accepted by export filter */
374#define RSEM_NOEXPORT 3 /* Routes rejected by export filter */
5ea39eaa 375#define RSEM_EXPORTED 4 /* Routes marked in export map */
7aa80901 376
58ef912c
MM
377/*
378 * Route Attributes
379 *
380 * Beware: All standard BGP attributes must be represented here instead
381 * of making them local to the route. This is needed to ensure proper
382 * construction of BGP route attribute lists.
383 */
384
4e276a89
JMM
385/* Nexthop structure */
386struct nexthop {
7e95c05d
OZ
387 ip_addr gw; /* Next hop */
388 struct iface *iface; /* Outgoing interface */
4e276a89 389 struct nexthop *next;
a1f5e514 390 byte flags;
e348ef01 391 byte weight;
039a65d0
JMM
392 byte labels_orig; /* Number of labels before hostentry was applied */
393 byte labels; /* Number of all labels */
ec5e5d23 394 u32 label[0];
7e95c05d
OZ
395};
396
a1f5e514
OZ
397#define RNF_ONLINK 0x1 /* Gateway is onlink regardless of IP ranges */
398
399
094d2bdb
OZ
400struct rte_src {
401 struct rte_src *next; /* Hash chain */
402 struct proto *proto; /* Protocol the source is based on */
403 u32 private_id; /* Private ID, assigned by the protocol */
404 u32 global_id; /* Globally unique ID of the source */
405 unsigned uc; /* Use count */
406};
407
408
1b769b08 409typedef struct rta {
ee76a92a 410 struct rta *next, **pprev; /* Hash chain */
9a74622c
JMM
411 u32 uc; /* Use count */
412 u32 hash_key; /* Hash over important fields */
9a74622c 413 struct ea_list *eattrs; /* Extended Attribute chain */
094d2bdb 414 struct rte_src *src; /* Route source that created the route */
9a74622c 415 struct hostentry *hostentry; /* Hostentry for recursive next-hops */
9a74622c
JMM
416 ip_addr from; /* Advertising router */
417 u32 igp_metric; /* IGP metric to next hop (for iBGP routes) */
5b208e29
JMM
418 u8 source; /* Route source (RTS_...) */
419 u8 scope; /* Route scope (SCOPE_... -- see ip.h) */
420 u8 dest; /* Route destination type (RTD_...) */
421 u8 aflags;
4e276a89 422 struct nexthop nh; /* Next hop */
58ef912c
MM
423} rta;
424
618533af 425#define RTS_DUMMY 0 /* Dummy route to be removed soon */
58ef912c
MM
426#define RTS_STATIC 1 /* Normal static route */
427#define RTS_INHERIT 2 /* Route inherited from kernel */
428#define RTS_DEVICE 3 /* Device route */
429#define RTS_STATIC_DEVICE 4 /* Static device route */
430#define RTS_REDIRECT 5 /* Learned via redirect */
431#define RTS_RIP 6 /* RIP route */
beaf86e1 432#define RTS_OSPF 7 /* OSPF route */
8bf684ec 433#define RTS_OSPF_IA 8 /* OSPF inter-area route */
98ac6176
OF
434#define RTS_OSPF_EXT1 9 /* OSPF external route type 1 */
435#define RTS_OSPF_EXT2 10 /* OSPF external route type 2 */
436#define RTS_BGP 11 /* BGP route */
437#define RTS_PIPE 12 /* Inter-table wormhole */
937e75d8 438#define RTS_BABEL 13 /* Babel route */
65d2a88d 439#define RTS_RPKI 14 /* Route Origin Authorization */
82b74253
MM
440#define RTS_PERF 15 /* Perf checker */
441#define RTS_MAX 16
58ef912c 442
58ef912c
MM
443#define RTC_UNICAST 0
444#define RTC_BROADCAST 1
445#define RTC_MULTICAST 2
446#define RTC_ANYCAST 3 /* IPv6 Anycast */
447
62e64905
OZ
448#define RTD_NONE 0 /* Undefined next hop */
449#define RTD_UNICAST 1 /* Next hop is neighbor router */
58ef912c
MM
450#define RTD_BLACKHOLE 2 /* Silently drop packets */
451#define RTD_UNREACHABLE 3 /* Reject as unreachable */
452#define RTD_PROHIBIT 4 /* Administratively prohibited */
665be7f6 453#define RTD_MAX 5
58ef912c 454
04925e90
MM
455#define RTAF_CACHED 1 /* This is a cached rta */
456
d1e146f2
OZ
457#define IGP_METRIC_UNKNOWN 0x80000000 /* Default igp_metric used when no other
458 protocol-specific metric is available */
459
8d9eef17 460
665be7f6
OZ
461const char * rta_dest_names[RTD_MAX];
462
463static inline const char *rta_dest_name(uint n)
464{ return (n < RTD_MAX) ? rta_dest_names[n] : "???"; }
465
8d9eef17
OZ
466/* Route has regular, reachable nexthop (i.e. not RTD_UNREACHABLE and like) */
467static inline int rte_is_reachable(rte *r)
62e64905 468{ return r->attrs->dest == RTD_UNICAST; }
8d9eef17
OZ
469
470
58ef912c
MM
471/*
472 * Extended Route Attributes
473 */
474
475typedef struct eattr {
ee7e2ffd 476 word id; /* EA_CODE(PROTOCOL_..., protocol-dependent ID) */
b77ae37d
MM
477 byte flags; /* Protocol-dependent flags */
478 byte type; /* Attribute type and several flags (EAF_...) */
58ef912c
MM
479 union {
480 u32 data;
4c553c5a 481 const struct adata *ptr; /* Attribute data elsewhere */
58ef912c
MM
482 } u;
483} eattr;
484
265419a3 485
/*
 * Attribute code helpers. A code packs the protocol number into the bits
 * above the low byte and the protocol-dependent ID into the low byte.
 */
#define EA_CODE(proto,id) (((proto) << 8) | (id))
#define EA_ID(ea) ((ea) & 0xff)
#define EA_PROTO(ea) ((ea) >> 8)

/*
 * Single-bit mask for the attribute ID. The shifted constant is unsigned so
 * that ID 31 produces a well-defined 0x80000000 instead of overflowing a
 * signed int. IDs of 32 and above still exceed the width of the result and
 * must not be used with this macro.
 */
#define EA_ID_FLAG(ea) (1U << EA_ID(ea))

/* Custom attributes are marked by EA_CUSTOM_BIT in the code */
#define EA_CUSTOM(id) ((id) | EA_CUSTOM_BIT)
#define EA_IS_CUSTOM(ea) ((ea) & EA_CUSTOM_BIT)
#define EA_CUSTOM_ID(ea) ((ea) & ~EA_CUSTOM_BIT)
493
494const char *ea_custom_name(uint ea);
b77ae37d 495
ee7e2ffd 496#define EA_GEN_IGP_METRIC EA_CODE(PROTOCOL_NONE, 0)
ba5e5940 497
8d24b689 498#define EA_CODE_MASK 0xffff
265419a3 499#define EA_CUSTOM_BIT 0x8000
8d24b689 500#define EA_ALLOW_UNDEF 0x10000 /* ea_find: allow EAF_TYPE_UNDEF */
315f23a0 501#define EA_BIT(n) ((n) << 24) /* Used in bitfield accessors */
25566c68 502#define EA_BIT_GET(ea) ((ea) >> 24)
8d24b689 503
66dbdbd9 504#define EAF_TYPE_MASK 0x1f /* Mask with this to get type */
315f23a0 505#define EAF_TYPE_INT 0x01 /* 32-bit unsigned integer number */
b77ae37d 506#define EAF_TYPE_OPAQUE 0x02 /* Opaque byte string (not filterable) */
ca97b489
MM
507#define EAF_TYPE_IP_ADDRESS 0x04 /* IP address */
508#define EAF_TYPE_ROUTER_ID 0x05 /* Router ID (IPv4 address) */
b475c543 509#define EAF_TYPE_AS_PATH 0x06 /* BGP AS path (encoding per RFC 1771:4.3) */
315f23a0 510#define EAF_TYPE_BITFIELD 0x09 /* 32-bit embedded bitfield */
b475c543 511#define EAF_TYPE_INT_SET 0x0a /* Set of u32's (e.g., a community list) */
42a0c054 512#define EAF_TYPE_EC_SET 0x0e /* Set of pairs of u32's - ext. community list */
66dbdbd9
OZ
513#define EAF_TYPE_LC_SET 0x12 /* Set of triplets of u32's - large community list */
514#define EAF_TYPE_UNDEF 0x1f /* `force undefined' entry */
b77ae37d 515#define EAF_EMBEDDED 0x01 /* Data stored in eattr.u.data (part of type spec) */
ca97b489 516#define EAF_VAR_LENGTH 0x02 /* Attribute length is variable (part of type spec) */
d15b0b0a
OZ
517#define EAF_ORIGINATED 0x20 /* The attribute has originated locally */
518#define EAF_FRESH 0x40 /* An uncached attribute (e.g. modified in export filter) */
58ef912c 519
d15b0b0a 520typedef struct adata {
ae80a2de 521 uint length; /* Length of data */
58ef912c 522 byte data[0];
d15b0b0a
OZ
523} adata;
524
4c553c5a
MM
525extern const adata null_adata; /* adata of length 0 */
526
d15b0b0a
OZ
527static inline struct adata *
528lp_alloc_adata(struct linpool *pool, uint len)
529{
530 struct adata *ad = lp_alloc(pool, sizeof(struct adata) + len);
531 ad->length = len;
532 return ad;
533}
58ef912c 534
4c553c5a 535static inline int adata_same(const struct adata *a, const struct adata *b)
28a10f84
OZ
536{ return (a->length == b->length && !memcmp(a->data, b->data, a->length)); }
537
538
58ef912c
MM
539typedef struct ea_list {
540 struct ea_list *next; /* In case we have an override list */
b77ae37d 541 byte flags; /* Flags: EALF_... */
58ef912c 542 byte rfu;
b77ae37d 543 word count; /* Number of attributes */
58ef912c
MM
544 eattr attrs[0]; /* Attribute definitions themselves */
545} ea_list;
546
b77ae37d
MM
547#define EALF_SORTED 1 /* Attributes are sorted by code */
548#define EALF_BISECT 2 /* Use interval bisection for searching */
549#define EALF_CACHED 4 /* Attributes belonging to cached rta */
875cc073 550#define EALF_TEMP 8 /* Temporary ea_list added by make_tmp_attrs hooks */
58ef912c 551
094d2bdb
OZ
552struct rte_src *rt_find_source(struct proto *p, u32 id);
553struct rte_src *rt_get_source(struct proto *p, u32 id);
554static inline void rt_lock_source(struct rte_src *src) { src->uc++; }
555static inline void rt_unlock_source(struct rte_src *src) { src->uc--; }
556void rt_prune_sources(void);
557
9fdf9d29
OZ
/* Iteration state handed to ea_walk() */
558struct ea_walk_state {
559 ea_list *eattrs; /* Current ea_list, initially set by caller */
560 eattr *ea; /* Current eattr, initially NULL */
561 u32 visited[4]; /* Bitfield, limiting max to 128 */
562};
094d2bdb 563
b77ae37d 564eattr *ea_find(ea_list *, unsigned ea);
9fdf9d29 565eattr *ea_walk(struct ea_walk_state *s, uint id, uint max);
c0100454 566int ea_get_int(ea_list *, unsigned ea, int def);
b77ae37d
MM
567void ea_dump(ea_list *);
568void ea_sort(ea_list *); /* Sort entries in all sub-lists */
6f57dcc0 569unsigned ea_scan(ea_list *); /* How many bytes do we need for merged ea_list */
b77ae37d 570void ea_merge(ea_list *from, ea_list *to); /* Merge sub-lists to allocated buffer */
6f57dcc0 571int ea_same(ea_list *x, ea_list *y); /* Test whether two ea_lists are identical */
ae80a2de 572uint ea_hash(ea_list *e); /* Calculate 16-bit hash value */
ce1da96e 573ea_list *ea_append(ea_list *to, ea_list *what);
315f23a0 574void ea_format_bitfield(struct eattr *a, byte *buf, int bufsize, const char **names, int min, int max);
58ef912c 575
13c0be19
JMM
/*
 * ea_normalize(ea) - merge, sort and possibly drop an attribute list
 *
 * If the list has override sub-lists (ea->next), they are merged into one
 * buffer obtained by alloca(), so the result lives only until the calling
 * function returns. The list is then sorted by ea_sort(), and @ea is set to
 * NULL when it ends up with no attributes.
 *
 * @ea must be a modifiable lvalue of type ea_list *; it is evaluated several
 * times, so it must have no side effects. The temporary uses a reserved-looking
 * name so that an argument called `t' is not captured by the macro's own local.
 */
#define ea_normalize(ea) do { \
  if ((ea)->next) { \
    ea_list *ea_norm_tmp_ = alloca(ea_scan(ea)); \
    ea_merge((ea), ea_norm_tmp_); \
    (ea) = ea_norm_tmp_; \
  } \
  ea_sort(ea); \
  if ((ea)->count == 0) \
    (ea) = NULL; \
} while(0)
586
d493d0f1
OZ
587static inline eattr *
588ea_set_attr(ea_list **to, struct linpool *pool, uint id, uint flags, uint type, uintptr_t val)
589{
590 ea_list *a = lp_alloc(pool, sizeof(ea_list) + sizeof(eattr));
591 eattr *e = &a->attrs[0];
592
593 a->flags = EALF_SORTED;
594 a->count = 1;
595 a->next = *to;
596 *to = a;
597
598 e->id = id;
599 e->type = type;
600 e->flags = flags;
601
602 if (type & EAF_EMBEDDED)
603 e->u.data = (u32) val;
604 else
605 e->u.ptr = (struct adata *) val;
606
607 return e;
608}
609
610static inline void
611ea_set_attr_u32(ea_list **to, struct linpool *pool, uint id, uint flags, uint type, u32 val)
612{ ea_set_attr(to, pool, id, flags, type, (uintptr_t) val); }
613
614static inline void
615ea_set_attr_ptr(ea_list **to, struct linpool *pool, uint id, uint flags, uint type, struct adata *val)
616{ ea_set_attr(to, pool, id, flags, type, (uintptr_t) val); }
617
618static inline void
619ea_set_attr_data(ea_list **to, struct linpool *pool, uint id, uint flags, uint type, void *data, uint len)
620{
621 struct adata *a = lp_alloc_adata(pool, len);
622 memcpy(a->data, data, len);
623 ea_set_attr(to, pool, id, flags, type, (uintptr_t) a);
624}
625
626
d14f8c3c 627#define NEXTHOP_MAX_SIZE (sizeof(struct nexthop) + sizeof(u32)*MPLS_MAX_LABEL_STACK)
ec5e5d23
JMM
628
629static inline size_t nexthop_size(const struct nexthop *nh)
630{ return sizeof(struct nexthop) + sizeof(u32)*nh->labels; }
4e276a89
JMM
631int nexthop__same(struct nexthop *x, struct nexthop *y); /* Compare multipath nexthops */
/*
 * Compare two nexthop lists. Identical pointers are equal without further
 * work; otherwise the decision is left to nexthop__same(). Returns 1 or 0.
 */
static inline int
nexthop_same(struct nexthop *x, struct nexthop *y)
{
  if (x == y)
    return 1;

  return nexthop__same(x, y) != 0;
}
634struct nexthop *nexthop_merge(struct nexthop *x, struct nexthop *y, int rx, int ry, int max, linpool *lp);
59d3a361 635struct nexthop *nexthop_sort(struct nexthop *x);
4e276a89 636static inline void nexthop_link(struct rta *a, struct nexthop *from)
ec5e5d23 637{ memcpy(&a->nh, from, nexthop_size(from)); }
62e64905 638void nexthop_insert(struct nexthop **n, struct nexthop *y);
4e276a89 639int nexthop_is_sorted(struct nexthop *x);
7e95c05d 640
2326b001 641void rta_init(void);
ec5e5d23 642static inline size_t rta_size(const rta *a) { return sizeof(rta) + sizeof(u32)*a->nh.labels; }
d14f8c3c 643#define RTA_MAX_SIZE (sizeof(rta) + sizeof(u32)*MPLS_MAX_LABEL_STACK)
2326b001 644rta *rta_lookup(rta *); /* Get rta equivalent to this one, uc++ */
094d2bdb 645static inline int rta_is_cached(rta *r) { return r->aflags & RTAF_CACHED; }
2326b001 646static inline rta *rta_clone(rta *r) { r->uc++; return r; }
b77ae37d
MM
647void rta__free(rta *r);
648static inline void rta_free(rta *r) { if (r && !--r->uc) rta__free(r); }
8d9eef17
OZ
649rta *rta_do_cow(rta *o, linpool *lp);
650static inline rta * rta_cow(rta *r, linpool *lp) { return rta_is_cached(r) ? rta_do_cow(r, lp) : r; }
2326b001
MM
651void rta_dump(rta *);
652void rta_dump_all(void);
13c0be19 653void rta_show(struct cli *, rta *);
1e37e35c 654
09ee846d 655u32 rt_get_igp_metric(rte *rt);
1e37e35c
OZ
656struct hostentry * rt_get_hostentry(rtable *tab, ip_addr a, ip_addr ll, rtable *dep);
657void rta_apply_hostentry(rta *a, struct hostentry *he, mpls_label_stack *mls);
658
659static inline void
660rta_set_recursive_next_hop(rtable *dep, rta *a, rtable *tab, ip_addr gw, ip_addr ll, mpls_label_stack *mls)
661{
662 rta_apply_hostentry(a, rt_get_hostentry(tab, gw, ll, dep), mls);
663}
cfe34a31
OZ
664
665/*
acb04cfd
OZ
666 * rta_set_recursive_next_hop() acquires hostentry from hostcache and fills
667 * rta->hostentry field. New hostentry has zero use count. Cached rta locks its
668 * hostentry (increases its use count), uncached rta does not lock it. Hostentry
669 * with zero use count is removed asynchronously during host cache update,
670 * therefore it is safe to hold such hostentry temporarily. Hostentry holds a
671 * lock for a 'source' rta, mainly to share multipath nexthops.
672 *
673 * There is no need to hold a lock for hostentry->dep table, because that table
674 * contains routes responsible for that hostentry, and therefore is non-empty if
675 * given hostentry has non-zero use count. If the hostentry has zero use count,
676 * the entry is removed before dep is referenced.
677 *
678 * The protocol responsible for routes with recursive next hops should hold a
679 * lock for a 'source' table governing those routes (argument tab to
680 * rta_set_recursive_next_hop()), because its routes reference hostentries
681 * (through rta) related to the governing table. When all such routes are
682 * removed, rtas are immediately removed achieving zero uc. Then the 'source'
683 * table lock could be immediately released, although hostentries may still
684 * exist - they will be freed together with the 'source' table.
cfe34a31
OZ
685 */
686
687static inline void rt_lock_hostentry(struct hostentry *he) { if (he) he->uc++; }
688static inline void rt_unlock_hostentry(struct hostentry *he) { if (he) he->uc--; }
689
a8b60382
MM
690/*
691 * Default protocol preferences
692 */
693
a82f692e 694#define DEF_PREF_DIRECT 240 /* Directly connected */
a8b60382 695#define DEF_PREF_STATIC 200 /* Static route */
916c8c0a 696#define DEF_PREF_OSPF 150 /* OSPF intra-area, inter-area and type 1 external routes */
937e75d8 697#define DEF_PREF_BABEL 130 /* Babel */
a8b60382
MM
698#define DEF_PREF_RIP 120 /* RIP */
699#define DEF_PREF_BGP 100 /* BGP */
65d2a88d 700#define DEF_PREF_RPKI 100 /* RPKI */
916c8c0a 701#define DEF_PREF_INHERITED 10 /* Routes inherited from other routing daemons */
a8b60382 702
af582c48
OZ
703/*
704 * Route Origin Authorization
705 */
706
650b4189
PT
707#define ROA_UNKNOWN 0
708#define ROA_VALID 1
709#define ROA_INVALID 2
af582c48 710
9656dce7 711#endif