]> git.ipfire.org Git - thirdparty/bird.git/blob - nest/route.h
eaaa5c3f643ce8dfba5ed25f1c6fa36e72ac7cd3
[thirdparty/bird.git] / nest / route.h
1 /*
2 * BIRD Internet Routing Daemon -- Routing Table
3 *
4 * (c) 1998--2000 Martin Mares <mj@ucw.cz>
5 *
6 * Can be freely distributed and used under the terms of the GNU GPL.
7 */
8
9 #ifndef _BIRD_ROUTE_H_
10 #define _BIRD_ROUTE_H_
11
12 #include "lib/lists.h"
13 #include "lib/bitmap.h"
14 #include "lib/resource.h"
15 #include "lib/net.h"
16
17 struct ea_list;
18 struct protocol;
19 struct proto;
20 struct rte_src;
21 struct symbol;
22 struct filter;
23 struct cli;
24
25 /*
26 * Generic data structure for storing network prefixes. Also used
27 * for the master routing table. Currently implemented as a hash
28 * table.
29 *
30 * Available operations:
31 * - insertion of new entry
32 * - deletion of entry
33 * - searching for entry by network prefix
34 * - asynchronous retrieval of fib contents
35 */
36
37 struct fib_node {
38 struct fib_node *next; /* Next in hash chain */
39 struct fib_iterator *readers; /* List of readers of this node */
40 byte flags; /* User-defined, will be removed */
41 net_addr addr[0];
42 };
43
44 struct fib_iterator { /* See lib/slists.h for an explanation */
45 struct fib_iterator *prev, *next; /* Must be synced with struct fib_node! */
46 byte efef; /* 0xff to distinguish between iterator and node */
47 byte pad[3];
48 struct fib_node *node; /* Or NULL if freshly merged */
49 uint hash;
50 };
51
52 typedef void (*fib_init_fn)(void *);
53
54 struct fib {
55 pool *fib_pool; /* Pool holding all our data */
56 slab *fib_slab; /* Slab holding all fib nodes */
57 struct fib_node **hash_table; /* Node hash table */
58 uint hash_size; /* Number of hash table entries (a power of two) */
59 uint hash_order; /* Binary logarithm of hash_size */
60 uint hash_shift; /* 32 - hash_order */
61 uint addr_type; /* Type of address data stored in fib (NET_*) */
62 uint node_size; /* FIB node size, 0 for nonuniform */
63 uint node_offset; /* Offset of fib_node struct inside of user data */
64 uint entries; /* Number of entries */
65 uint entries_min, entries_max; /* Entry count limits (else start rehashing) */
66 fib_init_fn init; /* Constructor */
67 };
68
69 static inline void * fib_node_to_user(struct fib *f, struct fib_node *e)
70 { return e ? (void *) ((char *) e - f->node_offset) : NULL; }
71
72 static inline struct fib_node * fib_user_to_node(struct fib *f, void *e)
73 { return e ? (void *) ((char *) e + f->node_offset) : NULL; }
74
75 void fib_init(struct fib *f, pool *p, uint addr_type, uint node_size, uint node_offset, uint hash_order, fib_init_fn init);
76 void *fib_find(struct fib *, const net_addr *); /* Find or return NULL if doesn't exist */
77 void *fib_get_chain(struct fib *f, const net_addr *a); /* Find first node in linked list from hash table */
78 void *fib_get(struct fib *, const net_addr *); /* Find or create new if nonexistent */
79 void *fib_route(struct fib *, const net_addr *); /* Longest-match routing lookup */
80 void fib_delete(struct fib *, void *); /* Remove fib entry */
81 void fib_free(struct fib *); /* Destroy the fib */
82 void fib_check(struct fib *); /* Consistency check for debugging */
83
84 void fit_init(struct fib_iterator *, struct fib *); /* Internal functions, don't call */
85 struct fib_node *fit_get(struct fib *, struct fib_iterator *);
86 void fit_put(struct fib_iterator *, struct fib_node *);
87 void fit_put_next(struct fib *f, struct fib_iterator *i, struct fib_node *n, uint hpos);
88
89
90 #define FIB_WALK(fib, type, z) do { \
91 struct fib_node *fn_, **ff_ = (fib)->hash_table; \
92 uint count_ = (fib)->hash_size; \
93 type *z; \
94 while (count_--) \
95 for (fn_ = *ff_++; z = fib_node_to_user(fib, fn_); fn_=fn_->next)
96
97 #define FIB_WALK_END } while (0)
98
99 #define FIB_ITERATE_INIT(it, fib) fit_init(it, fib)
100
101 #define FIB_ITERATE_START(fib, it, type, z) do { \
102 struct fib_node *fn_ = fit_get(fib, it); \
103 uint count_ = (fib)->hash_size; \
104 uint hpos_ = (it)->hash; \
105 type *z; \
106 for(;;) { \
107 if (!fn_) \
108 { \
109 if (++hpos_ >= count_) \
110 break; \
111 fn_ = (fib)->hash_table[hpos_]; \
112 continue; \
113 } \
114 z = fib_node_to_user(fib, fn_);
115
116 #define FIB_ITERATE_END fn_ = fn_->next; } } while(0)
117
118 #define FIB_ITERATE_PUT(it) fit_put(it, fn_)
119
120 #define FIB_ITERATE_PUT_NEXT(it, fib) fit_put_next(fib, it, fn_, hpos_)
121
122 #define FIB_ITERATE_UNLINK(it, fib) fit_get(fib, it)
123
124
125 /*
126 * Master Routing Tables. Generally speaking, each of them contains a FIB
127 * with each entry pointing to a list of route entries representing routes
128 * to given network (with the selected one at the head).
129 *
130 * Each of the RTE's contains variable data (the preference and protocol-dependent
131 * metrics) and a pointer to a route attribute block common for many routes).
132 *
133 * It's guaranteed that there is at most one RTE for every (prefix,proto) pair.
134 */
135
136 struct rtable_config {
137 node n;
138 char *name;
139 struct rtable *table;
140 struct proto_config *krt_attached; /* Kernel syncer attached to this table */
141 uint addr_type; /* Type of address data stored in table (NET_*) */
142 int gc_max_ops; /* Maximum number of operations before GC is run */
143 int gc_min_time; /* Minimum time between two consecutive GC runs */
144 byte sorted; /* Routes of network are sorted according to rte_better() */
145 };
146
147 typedef struct rtable {
148 node n; /* Node in list of all tables */
149 struct fib fib;
150 char *name; /* Name of this table */
151 list channels; /* List of attached channels (struct channel) */
152 uint addr_type; /* Type of address data stored in table (NET_*) */
153 int pipe_busy; /* Pipe loop detection */
154 int use_count; /* Number of protocols using this table */
155 u32 rt_count; /* Number of routes in the table */
156 struct hmap id_map;
157 struct hostcache *hostcache;
158 struct rtable_config *config; /* Configuration of this table */
159 struct config *deleted; /* Table doesn't exist in current configuration,
160 * delete as soon as use_count becomes 0 and remove
161 * obstacle from this routing table.
162 */
163 struct event *rt_event; /* Routing table event */
164 btime gc_time; /* Time of last GC */
165 int gc_counter; /* Number of operations since last GC */
166 byte prune_state; /* Table prune state, 1 -> scheduled, 2-> running */
167 byte hcu_scheduled; /* Hostcache update is scheduled */
168 byte nhu_state; /* Next Hop Update state */
169 struct fib_iterator prune_fit; /* Rtable prune FIB iterator */
170 struct fib_iterator nhu_fit; /* Next Hop Update FIB iterator */
171 } rtable;
172
173 #define NHU_CLEAN 0
174 #define NHU_SCHEDULED 1
175 #define NHU_RUNNING 2
176 #define NHU_DIRTY 3
177
178 typedef struct network {
179 struct rte *routes; /* Available routes for this network */
180 struct fib_node n; /* FIB flags reserved for kernel syncer */
181 } net;
182
183 struct hostcache {
184 slab *slab; /* Slab holding all hostentries */
185 struct hostentry **hash_table; /* Hash table for hostentries */
186 unsigned hash_order, hash_shift;
187 unsigned hash_max, hash_min;
188 unsigned hash_items;
189 linpool *lp; /* Linpool for trie */
190 struct f_trie *trie; /* Trie of prefixes that might affect hostentries */
191 list hostentries; /* List of all hostentries */
192 byte update_hostcache;
193 };
194
195 struct hostentry {
196 node ln;
197 ip_addr addr; /* IP address of host, part of key */
198 ip_addr link; /* (link-local) IP address of host, used as gw
199 if host is directly attached */
200 struct rtable *tab; /* Dependent table, part of key */
201 struct hostentry *next; /* Next in hash chain */
202 unsigned hash_key; /* Hash key */
203 unsigned uc; /* Use count */
204 struct rta *src; /* Source rta entry */
205 byte dest; /* Chosen route destination type (RTD_...) */
206 byte nexthop_linkable; /* Nexthop list is completely non-device */
207 u32 igp_metric; /* Chosen route IGP metric */
208 };
209
210 typedef struct rte {
211 struct rte *next;
212 net *net; /* Network this RTE belongs to */
213 struct channel *sender; /* Channel used to send the route to the routing table */
214 struct rta *attrs; /* Attributes of this route */
215 u32 id; /* Table specific route id */
216 byte flags; /* Flags (REF_...) */
217 byte pflags; /* Protocol-specific flags */
218 word pref; /* Route preference */
219 btime lastmod; /* Last modified */
220 union { /* Protocol-dependent data (metrics etc.) */
221 #ifdef CONFIG_RIP
222 struct {
223 struct iface *from; /* Incoming iface */
224 u8 metric; /* RIP metric */
225 u16 tag; /* External route tag */
226 } rip;
227 #endif
228 #ifdef CONFIG_OSPF
229 struct {
230 u32 metric1, metric2; /* OSPF Type 1 and Type 2 metrics */
231 u32 tag; /* External route tag */
232 u32 router_id; /* Router that originated this route */
233 } ospf;
234 #endif
235 #ifdef CONFIG_BGP
236 struct {
237 u8 suppressed; /* Used for deterministic MED comparison */
238 s8 stale; /* Route is LLGR_STALE, -1 if unknown */
239 } bgp;
240 #endif
241 #ifdef CONFIG_BABEL
242 struct {
243 u16 seqno; /* Babel seqno */
244 u16 metric; /* Babel metric */
245 u64 router_id; /* Babel router id */
246 } babel;
247 #endif
248 struct { /* Routes generated by krt sync (both temporary and inherited ones) */
249 s8 src; /* Alleged route source (see krt.h) */
250 u8 proto; /* Kernel source protocol ID */
251 u8 seen; /* Seen during last scan */
252 u8 best; /* Best route in network, propagated to core */
253 u32 metric; /* Kernel metric */
254 } krt;
255 } u;
256 } rte;
257
258 #define REF_COW 1 /* Copy this rte on write */
259 #define REF_FILTERED 2 /* Route is rejected by import filter */
260 #define REF_STALE 4 /* Route is stale in a refresh cycle */
261 #define REF_DISCARD 8 /* Route is scheduled for discard */
262 #define REF_MODIFY 16 /* Route is scheduled for modify */
263
264 /* Route is valid for propagation (may depend on other flags in the future), accepts NULL */
265 static inline int rte_is_valid(rte *r) { return r && !(r->flags & REF_FILTERED); }
266
267 /* Route just has REF_FILTERED flag */
268 static inline int rte_is_filtered(rte *r) { return !!(r->flags & REF_FILTERED); }
269
270
271 /* Types of route announcement, also used as flags */
272 #define RA_UNDEF 0 /* Undefined RA type */
273 #define RA_OPTIMAL 1 /* Announcement of optimal route change */
274 #define RA_ACCEPTED 2 /* Announcement of first accepted route */
275 #define RA_ANY 3 /* Announcement of any route change */
276 #define RA_MERGED 4 /* Announcement of optimal route merged with next ones */
277
278 /* Return value of preexport() callback */
279 #define RIC_ACCEPT 1 /* Accepted by protocol */
280 #define RIC_PROCESS 0 /* Process it through import filter */
281 #define RIC_REJECT -1 /* Rejected by protocol */
282 #define RIC_DROP -2 /* Silently dropped by protocol */
283
284 extern list routing_tables;
285 struct config;
286
287 void rt_init(void);
288 void rt_preconfig(struct config *);
289 void rt_commit(struct config *new, struct config *old);
290 void rt_lock_table(rtable *);
291 void rt_unlock_table(rtable *);
292 void rt_setup(pool *, rtable *, struct rtable_config *);
293 static inline net *net_find(rtable *tab, const net_addr *addr) { return (net *) fib_find(&tab->fib, addr); }
294 static inline net *net_find_valid(rtable *tab, const net_addr *addr)
295 { net *n = net_find(tab, addr); return (n && rte_is_valid(n->routes)) ? n : NULL; }
296 static inline net *net_get(rtable *tab, const net_addr *addr) { return (net *) fib_get(&tab->fib, addr); }
297 void *net_route(rtable *tab, const net_addr *n);
298 int net_roa_check(rtable *tab, const net_addr *n, u32 asn);
299 rte *rte_find(net *net, struct rte_src *src);
300 rte *rte_get_temp(struct rta *);
301 void rte_update2(struct channel *c, const net_addr *n, rte *new, struct rte_src *src);
302 /* rte_update() moved to protocol.h to avoid dependency conflicts */
303 int rt_examine(rtable *t, net_addr *a, struct proto *p, const struct filter *filter);
304 rte *rt_export_merged(struct channel *c, net *net, rte **rt_free, linpool *pool, int silent);
305 void rt_refresh_begin(rtable *t, struct channel *c);
306 void rt_refresh_end(rtable *t, struct channel *c);
307 void rt_modify_stale(rtable *t, struct channel *c);
308 void rt_schedule_prune(rtable *t);
309 void rte_dump(rte *);
310 void rte_free(rte *);
311 rte *rte_do_cow(rte *);
312 static inline rte * rte_cow(rte *r) { return (r->flags & REF_COW) ? rte_do_cow(r) : r; }
313 rte *rte_cow_rta(rte *r, linpool *lp);
314 void rte_init_tmp_attrs(struct rte *r, linpool *lp, uint max);
315 void rte_make_tmp_attr(struct rte *r, uint id, uint type, uintptr_t val);
316 void rte_make_tmp_attrs(struct rte **r, struct linpool *pool, struct rta **old_attrs);
317 uintptr_t rte_store_tmp_attr(struct rte *r, uint id);
318 void rt_dump(rtable *);
319 void rt_dump_all(void);
320 int rt_feed_channel(struct channel *c);
321 void rt_feed_channel_abort(struct channel *c);
322 int rte_update_in(struct channel *c, const net_addr *n, rte *new, struct rte_src *src);
323 int rt_reload_channel(struct channel *c);
324 void rt_reload_channel_abort(struct channel *c);
325 void rt_prune_sync(rtable *t, int all);
326 int rte_update_out(struct channel *c, const net_addr *n, rte *new, rte *old0, int refeed);
327 struct rtable_config *rt_new_table(struct symbol *s, uint addr_type);
328
329
330 /* Default limit for ECMP next hops, defined in sysdep code */
331 extern const int rt_default_ecmp;
332
333 struct rt_show_data_rtable {
334 node n;
335 rtable *table;
336 struct channel *export_channel;
337 };
338
339 struct rt_show_data {
340 net_addr *addr;
341 list tables;
342 struct rt_show_data_rtable *tab; /* Iterator over table list */
343 struct rt_show_data_rtable *last_table; /* Last table in output */
344 struct fib_iterator fit; /* Iterator over networks in table */
345 int verbose, tables_defined_by;
346 const struct filter *filter;
347 struct proto *show_protocol;
348 struct proto *export_protocol;
349 struct channel *export_channel;
350 struct config *running_on_config;
351 struct krt_proto *kernel;
352 int export_mode, primary_only, filtered, stats, show_for;
353
354 int table_open; /* Iteration (fit) is open */
355 int net_counter, rt_counter, show_counter, table_counter;
356 int net_counter_last, rt_counter_last, show_counter_last;
357 };
358
359 void rt_show(struct rt_show_data *);
360 struct rt_show_data_rtable * rt_show_add_table(struct rt_show_data *d, rtable *t);
361
362 /* Value of table definition mode in struct rt_show_data */
363 #define RSD_TDB_DEFAULT 0 /* no table specified */
364 #define RSD_TDB_INDIRECT 0 /* show route ... protocol P ... */
365 #define RSD_TDB_ALL RSD_TDB_SET /* show route ... table all ... */
366 #define RSD_TDB_DIRECT RSD_TDB_SET | RSD_TDB_NMN /* show route ... table X table Y ... */
367
368 #define RSD_TDB_SET 0x1 /* internal: show empty tables */
369 #define RSD_TDB_NMN 0x2 /* internal: need matching net */
370
371 /* Value of export_mode in struct rt_show_data */
372 #define RSEM_NONE 0 /* Export mode not used */
373 #define RSEM_PREEXPORT 1 /* Routes ready for export, before filtering */
374 #define RSEM_EXPORT 2 /* Routes accepted by export filter */
375 #define RSEM_NOEXPORT 3 /* Routes rejected by export filter */
376 #define RSEM_EXPORTED 4 /* Routes marked in export map */
377
378 /*
379 * Route Attributes
380 *
381 * Beware: All standard BGP attributes must be represented here instead
382 * of making them local to the route. This is needed to ensure proper
383 * construction of BGP route attribute lists.
384 */
385
386 /* Nexthop structure */
387 struct nexthop {
388 ip_addr gw; /* Next hop */
389 struct iface *iface; /* Outgoing interface */
390 struct nexthop *next;
391 byte flags;
392 byte weight;
393 byte labels_orig; /* Number of labels before hostentry was applied */
394 byte labels; /* Number of all labels */
395 u32 label[0];
396 };
397
398 #define RNF_ONLINK 0x1 /* Gateway is onlink regardless of IP ranges */
399
400
401 struct rte_src {
402 struct rte_src *next; /* Hash chain */
403 struct proto *proto; /* Protocol the source is based on */
404 u32 private_id; /* Private ID, assigned by the protocol */
405 u32 global_id; /* Globally unique ID of the source */
406 unsigned uc; /* Use count */
407 };
408
409
410 typedef struct rta {
411 struct rta *next, **pprev; /* Hash chain */
412 u32 uc; /* Use count */
413 u32 hash_key; /* Hash over important fields */
414 struct ea_list *eattrs; /* Extended Attribute chain */
415 struct rte_src *src; /* Route source that created the route */
416 struct hostentry *hostentry; /* Hostentry for recursive next-hops */
417 ip_addr from; /* Advertising router */
418 u32 igp_metric; /* IGP metric to next hop (for iBGP routes) */
419 u8 source; /* Route source (RTS_...) */
420 u8 scope; /* Route scope (SCOPE_... -- see ip.h) */
421 u8 dest; /* Route destination type (RTD_...) */
422 u8 aflags;
423 struct nexthop nh; /* Next hop */
424 } rta;
425
426 #define RTS_DUMMY 0 /* Dummy route to be removed soon */
427 #define RTS_STATIC 1 /* Normal static route */
428 #define RTS_INHERIT 2 /* Route inherited from kernel */
429 #define RTS_DEVICE 3 /* Device route */
430 #define RTS_STATIC_DEVICE 4 /* Static device route */
431 #define RTS_REDIRECT 5 /* Learned via redirect */
432 #define RTS_RIP 6 /* RIP route */
433 #define RTS_OSPF 7 /* OSPF route */
434 #define RTS_OSPF_IA 8 /* OSPF inter-area route */
435 #define RTS_OSPF_EXT1 9 /* OSPF external route type 1 */
436 #define RTS_OSPF_EXT2 10 /* OSPF external route type 2 */
437 #define RTS_BGP 11 /* BGP route */
438 #define RTS_PIPE 12 /* Inter-table wormhole */
439 #define RTS_BABEL 13 /* Babel route */
440 #define RTS_RPKI 14 /* Route Origin Authorization */
441 #define RTS_PERF 15 /* Perf checker */
442 #define RTS_MAX 16
443
444 #define RTC_UNICAST 0
445 #define RTC_BROADCAST 1
446 #define RTC_MULTICAST 2
447 #define RTC_ANYCAST 3 /* IPv6 Anycast */
448
449 #define RTD_NONE 0 /* Undefined next hop */
450 #define RTD_UNICAST 1 /* Next hop is neighbor router */
451 #define RTD_BLACKHOLE 2 /* Silently drop packets */
452 #define RTD_UNREACHABLE 3 /* Reject as unreachable */
453 #define RTD_PROHIBIT 4 /* Administratively prohibited */
454 #define RTD_MAX 5
455
456 #define RTAF_CACHED 1 /* This is a cached rta */
457
458 #define IGP_METRIC_UNKNOWN 0x80000000 /* Default igp_metric used when no other
459 protocol-specific metric is availabe */
460
461
462 const char * rta_dest_names[RTD_MAX];
463
464 static inline const char *rta_dest_name(uint n)
465 { return (n < RTD_MAX) ? rta_dest_names[n] : "???"; }
466
467 /* Route has regular, reachable nexthop (i.e. not RTD_UNREACHABLE and like) */
468 static inline int rte_is_reachable(rte *r)
469 { return r->attrs->dest == RTD_UNICAST; }
470
471
472 /*
473 * Extended Route Attributes
474 */
475
476 typedef struct eattr {
477 word id; /* EA_CODE(PROTOCOL_..., protocol-dependent ID) */
478 byte flags; /* Protocol-dependent flags */
479 byte type; /* Attribute type and several flags (EAF_...) */
480 union {
481 u32 data;
482 const struct adata *ptr; /* Attribute data elsewhere */
483 } u;
484 } eattr;
485
486
487 #define EA_CODE(proto,id) (((proto) << 8) | (id))
488 #define EA_ID(ea) ((ea) & 0xff)
489 #define EA_PROTO(ea) ((ea) >> 8)
490 #define EA_ID_FLAG(ea) (1 << EA_ID(ea))
491 #define EA_CUSTOM(id) ((id) | EA_CUSTOM_BIT)
492 #define EA_IS_CUSTOM(ea) ((ea) & EA_CUSTOM_BIT)
493 #define EA_CUSTOM_ID(ea) ((ea) & ~EA_CUSTOM_BIT)
494
495 const char *ea_custom_name(uint ea);
496
497 #define EA_GEN_IGP_METRIC EA_CODE(PROTOCOL_NONE, 0)
498
499 #define EA_CODE_MASK 0xffff
500 #define EA_CUSTOM_BIT 0x8000
501 #define EA_ALLOW_UNDEF 0x10000 /* ea_find: allow EAF_TYPE_UNDEF */
502 #define EA_BIT(n) ((n) << 24) /* Used in bitfield accessors */
503 #define EA_BIT_GET(ea) ((ea) >> 24)
504
505 #define EAF_TYPE_MASK 0x1f /* Mask with this to get type */
506 #define EAF_TYPE_INT 0x01 /* 32-bit unsigned integer number */
507 #define EAF_TYPE_OPAQUE 0x02 /* Opaque byte string (not filterable) */
508 #define EAF_TYPE_IP_ADDRESS 0x04 /* IP address */
509 #define EAF_TYPE_ROUTER_ID 0x05 /* Router ID (IPv4 address) */
510 #define EAF_TYPE_AS_PATH 0x06 /* BGP AS path (encoding per RFC 1771:4.3) */
511 #define EAF_TYPE_BITFIELD 0x09 /* 32-bit embedded bitfield */
512 #define EAF_TYPE_INT_SET 0x0a /* Set of u32's (e.g., a community list) */
513 #define EAF_TYPE_EC_SET 0x0e /* Set of pairs of u32's - ext. community list */
514 #define EAF_TYPE_LC_SET 0x12 /* Set of triplets of u32's - large community list */
515 #define EAF_TYPE_UNDEF 0x1f /* `force undefined' entry */
516 #define EAF_EMBEDDED 0x01 /* Data stored in eattr.u.data (part of type spec) */
517 #define EAF_VAR_LENGTH 0x02 /* Attribute length is variable (part of type spec) */
518 #define EAF_ORIGINATED 0x20 /* The attribute has originated locally */
519 #define EAF_FRESH 0x40 /* An uncached attribute (e.g. modified in export filter) */
520
521 typedef struct adata {
522 uint length; /* Length of data */
523 byte data[0];
524 } adata;
525
526 extern const adata null_adata; /* adata of length 0 */
527
528 static inline struct adata *
529 lp_alloc_adata(struct linpool *pool, uint len)
530 {
531 struct adata *ad = lp_alloc(pool, sizeof(struct adata) + len);
532 ad->length = len;
533 return ad;
534 }
535
536 static inline int adata_same(const struct adata *a, const struct adata *b)
537 { return (a->length == b->length && !memcmp(a->data, b->data, a->length)); }
538
539
540 typedef struct ea_list {
541 struct ea_list *next; /* In case we have an override list */
542 byte flags; /* Flags: EALF_... */
543 byte rfu;
544 word count; /* Number of attributes */
545 eattr attrs[0]; /* Attribute definitions themselves */
546 } ea_list;
547
548 #define EALF_SORTED 1 /* Attributes are sorted by code */
549 #define EALF_BISECT 2 /* Use interval bisection for searching */
550 #define EALF_CACHED 4 /* Attributes belonging to cached rta */
551 #define EALF_TEMP 8 /* Temporary ea_list added by make_tmp_attrs hooks */
552
553 struct rte_src *rt_find_source(struct proto *p, u32 id);
554 struct rte_src *rt_get_source(struct proto *p, u32 id);
555 static inline void rt_lock_source(struct rte_src *src) { src->uc++; }
556 static inline void rt_unlock_source(struct rte_src *src) { src->uc--; }
557 void rt_prune_sources(void);
558
559 struct ea_walk_state {
560 ea_list *eattrs; /* Ccurrent ea_list, initially set by caller */
561 eattr *ea; /* Current eattr, initially NULL */
562 u32 visited[4]; /* Bitfield, limiting max to 128 */
563 };
564
565 eattr *ea_find(ea_list *, unsigned ea);
566 eattr *ea_walk(struct ea_walk_state *s, uint id, uint max);
567 int ea_get_int(ea_list *, unsigned ea, int def);
568 void ea_dump(ea_list *);
569 void ea_sort(ea_list *); /* Sort entries in all sub-lists */
570 unsigned ea_scan(ea_list *); /* How many bytes do we need for merged ea_list */
571 void ea_merge(ea_list *from, ea_list *to); /* Merge sub-lists to allocated buffer */
572 int ea_same(ea_list *x, ea_list *y); /* Test whether two ea_lists are identical */
573 uint ea_hash(ea_list *e); /* Calculate 16-bit hash value */
574 ea_list *ea_append(ea_list *to, ea_list *what);
575 void ea_format_bitfield(struct eattr *a, byte *buf, int bufsize, const char **names, int min, int max);
576
577 #define ea_normalize(ea) do { \
578 if (ea->next) { \
579 ea_list *t = alloca(ea_scan(ea)); \
580 ea_merge(ea, t); \
581 ea = t; \
582 } \
583 ea_sort(ea); \
584 if (ea->count == 0) \
585 ea = NULL; \
586 } while(0) \
587
588 static inline eattr *
589 ea_set_attr(ea_list **to, struct linpool *pool, uint id, uint flags, uint type, uintptr_t val)
590 {
591 ea_list *a = lp_alloc(pool, sizeof(ea_list) + sizeof(eattr));
592 eattr *e = &a->attrs[0];
593
594 a->flags = EALF_SORTED;
595 a->count = 1;
596 a->next = *to;
597 *to = a;
598
599 e->id = id;
600 e->type = type;
601 e->flags = flags;
602
603 if (type & EAF_EMBEDDED)
604 e->u.data = (u32) val;
605 else
606 e->u.ptr = (struct adata *) val;
607
608 return e;
609 }
610
611 static inline void
612 ea_set_attr_u32(ea_list **to, struct linpool *pool, uint id, uint flags, uint type, u32 val)
613 { ea_set_attr(to, pool, id, flags, type, (uintptr_t) val); }
614
615 static inline void
616 ea_set_attr_ptr(ea_list **to, struct linpool *pool, uint id, uint flags, uint type, struct adata *val)
617 { ea_set_attr(to, pool, id, flags, type, (uintptr_t) val); }
618
619 static inline void
620 ea_set_attr_data(ea_list **to, struct linpool *pool, uint id, uint flags, uint type, void *data, uint len)
621 {
622 struct adata *a = lp_alloc_adata(pool, len);
623 memcpy(a->data, data, len);
624 ea_set_attr(to, pool, id, flags, type, (uintptr_t) a);
625 }
626
627
628 #define NEXTHOP_MAX_SIZE (sizeof(struct nexthop) + sizeof(u32)*MPLS_MAX_LABEL_STACK)
629
630 static inline size_t nexthop_size(const struct nexthop *nh)
631 { return sizeof(struct nexthop) + sizeof(u32)*nh->labels; }
632 int nexthop__same(struct nexthop *x, struct nexthop *y); /* Compare multipath nexthops */
633 static inline int nexthop_same(struct nexthop *x, struct nexthop *y)
634 { return (x == y) || nexthop__same(x, y); }
635 struct nexthop *nexthop_merge(struct nexthop *x, struct nexthop *y, int rx, int ry, int max, linpool *lp);
636 struct nexthop *nexthop_sort(struct nexthop *x);
637 static inline void nexthop_link(struct rta *a, struct nexthop *from)
638 { memcpy(&a->nh, from, nexthop_size(from)); }
639 void nexthop_insert(struct nexthop **n, struct nexthop *y);
640 int nexthop_is_sorted(struct nexthop *x);
641
642 void rta_init(void);
643 static inline size_t rta_size(const rta *a) { return sizeof(rta) + sizeof(u32)*a->nh.labels; }
644 #define RTA_MAX_SIZE (sizeof(rta) + sizeof(u32)*MPLS_MAX_LABEL_STACK)
645 rta *rta_lookup(rta *); /* Get rta equivalent to this one, uc++ */
646 static inline int rta_is_cached(rta *r) { return r->aflags & RTAF_CACHED; }
647 static inline rta *rta_clone(rta *r) { r->uc++; return r; }
648 void rta__free(rta *r);
649 static inline void rta_free(rta *r) { if (r && !--r->uc) rta__free(r); }
650 rta *rta_do_cow(rta *o, linpool *lp);
651 static inline rta * rta_cow(rta *r, linpool *lp) { return rta_is_cached(r) ? rta_do_cow(r, lp) : r; }
652 void rta_dump(rta *);
653 void rta_dump_all(void);
654 void rta_show(struct cli *, rta *);
655
656 u32 rt_get_igp_metric(rte *rt);
657 struct hostentry * rt_get_hostentry(rtable *tab, ip_addr a, ip_addr ll, rtable *dep);
658 void rta_apply_hostentry(rta *a, struct hostentry *he, mpls_label_stack *mls);
659
660 static inline void
661 rta_set_recursive_next_hop(rtable *dep, rta *a, rtable *tab, ip_addr gw, ip_addr ll, mpls_label_stack *mls)
662 {
663 rta_apply_hostentry(a, rt_get_hostentry(tab, gw, ll, dep), mls);
664 }
665
666 /*
667 * rta_set_recursive_next_hop() acquires hostentry from hostcache and fills
668 * rta->hostentry field. New hostentry has zero use count. Cached rta locks its
669 * hostentry (increases its use count), uncached rta does not lock it. Hostentry
670 * with zero use count is removed asynchronously during host cache update,
671 * therefore it is safe to hold such hostentry temorarily. Hostentry holds a
672 * lock for a 'source' rta, mainly to share multipath nexthops.
673 *
674 * There is no need to hold a lock for hostentry->dep table, because that table
675 * contains routes responsible for that hostentry, and therefore is non-empty if
676 * given hostentry has non-zero use count. If the hostentry has zero use count,
677 * the entry is removed before dep is referenced.
678 *
679 * The protocol responsible for routes with recursive next hops should hold a
680 * lock for a 'source' table governing that routes (argument tab to
681 * rta_set_recursive_next_hop()), because its routes reference hostentries
682 * (through rta) related to the governing table. When all such routes are
683 * removed, rtas are immediately removed achieving zero uc. Then the 'source'
684 * table lock could be immediately released, although hostentries may still
685 * exist - they will be freed together with the 'source' table.
686 */
687
688 static inline void rt_lock_hostentry(struct hostentry *he) { if (he) he->uc++; }
689 static inline void rt_unlock_hostentry(struct hostentry *he) { if (he) he->uc--; }
690
691 /*
692 * Default protocol preferences
693 */
694
695 #define DEF_PREF_DIRECT 240 /* Directly connected */
696 #define DEF_PREF_STATIC 200 /* Static route */
697 #define DEF_PREF_OSPF 150 /* OSPF intra-area, inter-area and type 1 external routes */
698 #define DEF_PREF_BABEL 130 /* Babel */
699 #define DEF_PREF_RIP 120 /* RIP */
700 #define DEF_PREF_BGP 100 /* BGP */
701 #define DEF_PREF_RPKI 100 /* RPKI */
702 #define DEF_PREF_INHERITED 10 /* Routes inherited from other routing daemons */
703
704 /*
705 * Route Origin Authorization
706 */
707
708 #define ROA_UNKNOWN 0
709 #define ROA_VALID 1
710 #define ROA_INVALID 2
711
712 #endif