/*-
 * SPDX-License-Identifier: BSD-3-Clause
 *
 * Copyright (c) 1980, 1986, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	@(#)route.h	8.4 (Berkeley) 1/9/95
 */

#ifndef _NET_ROUTE_H_
#define _NET_ROUTE_H_

#include <net/vnet.h>

/*
 * Kernel resident routing tables.
 *
 * The routing tables are initialized when interface addresses
 * are set by making entries for all directly connected interfaces.
 */

/*
 * Struct route consists of a destination address (ro_dst),
 * a nexthop object pointer (ro_nh), a link-layer entry pointer (ro_lle),
 * and a link-layer prepend data pointer along with its length.
 */
struct route {
	struct	nhop_object *ro_nh;	/* nexthop; released by RO_NHFREE() */
	struct	llentry *ro_lle;	/* link-layer entry */
	/*
	 * ro_prepend and ro_plen are only used for bpf to pass in a
	 * preformed header.  They are not cacheable.
	 */
	char		*ro_prepend;
	uint16_t	ro_plen;
	uint16_t	ro_flags;	/* RT_* flag bits */
	uint16_t	ro_mtu;		/* saved route mtu */
	uint16_t	spare;
	struct	sockaddr ro_dst;	/* destination address */
};

/*
 * Flag bits tested against the ro_flags field of struct route
 * (e.g. RT_HAS_GW in RO_GET_FAMILY()).
 */

/* Bit positions of the three lowest defined flags. */
#define	RT_L2_ME_BIT		2	/* dst L2 addr is our address */
#define	RT_MAY_LOOP_BIT		3	/* dst may require loop copy */
#define	RT_HAS_HEADER_BIT	4	/* mbuf already have its header prepended */

/* Mask values derived from the bit positions above. */
#define	RT_L2_ME		(1 << RT_L2_ME_BIT)		/* 0x0004 */
#define	RT_MAY_LOOP		(1 << RT_MAY_LOOP_BIT)		/* 0x0008 */
#define	RT_HAS_HEADER		(1 << RT_HAS_HEADER_BIT)	/* 0x0010 */

#define	RT_REJECT		0x0020	/* Destination is reject */
#define	RT_BLACKHOLE		0x0040	/* Destination is blackhole */
#define	RT_HAS_GW		0x0080	/* Destination has GW */
#define	RT_LLE_CACHE		0x0100	/* Cache link layer */

/*
 * Per-route metrics.  Embedded in struct rt_msghdr as rtm_rmx; the
 * RTV_* bits select individual fields for rtm_inits and rmx_locks.
 */
struct rt_metrics {
	u_long	rmx_locks;	/* Kernel must leave these values alone */
	u_long	rmx_mtu;	/* MTU for this path */
	u_long	rmx_hopcount;	/* max hops expected */
	u_long	rmx_expire;	/* lifetime for route, e.g. redirect */
	u_long	rmx_recvpipe;	/* inbound delay-bandwidth product */
	u_long	rmx_sendpipe;	/* outbound delay-bandwidth product */
	u_long	rmx_ssthresh;	/* outbound gateway buffer limit */
	u_long	rmx_rtt;	/* estimated round trip time */
	u_long	rmx_rttvar;	/* estimated rtt variance */
	u_long	rmx_pksent;	/* packets sent using this route */
	u_long	rmx_weight;	/* route weight */
	u_long	rmx_nhidx;	/* route nexthop index */
	u_long	rmx_filler[2];	/* will be used for T/TCP later */
};

/*
 * rmx_rtt and rmx_rttvar are stored as microseconds;
 */
#define	RTM_RTTUNIT	1000000	/* units for rtt, rttvar, as units per sec */

/*
 * lle state is exported in rmx_state rt_metrics field; the name is an
 * alias that expands to rmx_weight.
 */
#define	rmx_state	rmx_weight

/* default route weight */
#define	RT_DEFAULT_WEIGHT	1
#define	RT_MAX_WEIGHT		16777215	/* 3 bytes */

/*
 * Keep a generation count of routing table, incremented on route addition,
 * so we can invalidate caches.  This is accessed without a lock, as precision
 * is not required.
 */
typedef volatile u_int rt_gen_t;	/* tree generation (for adds) */
/* Current generation of the table for (fibnum, af). */
#define	RT_GEN(fibnum, af)	rt_tables_get_gen(fibnum, af)

#define	RT_DEFAULT_FIB	0	/* Explicitly mark fib=0 restricted cases */
/* Parenthesized so the negative constant is safe in any expression. */
#define	RT_ALL_FIBS	(-1)	/* Announce event for every fib */
#ifdef _KERNEL
/*
 * Per-vnet routing variables.  Each VNET_DECLARE() is followed by the
 * V_-prefixed accessor macro that resolves it through VNET().
 */
VNET_DECLARE(uint32_t, _rt_numfibs);	/* number of existing route tables */
#define	V_rt_numfibs		VNET(_rt_numfibs)
/* temporary compat arg */
#define	rt_numfibs		V_rt_numfibs
VNET_DECLARE(u_int, rt_add_addr_allfibs); /* Announce interfaces to all fibs */
#define	V_rt_add_addr_allfibs	VNET(rt_add_addr_allfibs)

/* Calculate flowid for locally-originated packets */
VNET_DECLARE(u_int, fib_hash_outbound);
#define	V_fib_hash_outbound	VNET(fib_hash_outbound)

/*
 * Outbound flowid generation rules.
 *
 * fib[46]_calc_packet_hash select the hash routine, and the two
 * CALC_FLOWID_OUTBOUND* macros expand either to a constant or to the
 * V_fib_hash_outbound setting, depending on RSS and ROUTE_MPATH.
 */
#ifdef RSS

#define	fib4_calc_packet_hash		xps_proto_software_hash_v4
#define	fib6_calc_packet_hash		xps_proto_software_hash_v6
#define	CALC_FLOWID_OUTBOUND_SENDTO	true

#ifdef ROUTE_MPATH
#define	CALC_FLOWID_OUTBOUND		V_fib_hash_outbound
#else /* !ROUTE_MPATH */
#define	CALC_FLOWID_OUTBOUND		false
#endif /* ROUTE_MPATH */

#else /* !RSS */

#define	fib4_calc_packet_hash		fib4_calc_software_hash
#define	fib6_calc_packet_hash		fib6_calc_software_hash

#ifdef ROUTE_MPATH
#define	CALC_FLOWID_OUTBOUND_SENDTO	V_fib_hash_outbound
#define	CALC_FLOWID_OUTBOUND		V_fib_hash_outbound
#else /* !ROUTE_MPATH */
#define	CALC_FLOWID_OUTBOUND_SENDTO	false
#define	CALC_FLOWID_OUTBOUND		false
#endif /* ROUTE_MPATH */

#endif /* RSS */

#endif /* _KERNEL */

/*
 * We distinguish between routes to hosts and routes to networks,
 * preferring the former if available.  For each route we infer
 * the interface to use from the gateway address supplied when
 * the route was entered.  Routes that forward packets through
 * gateways are marked so that the output routines know to address the
 * gateway rather than the ultimate destination.
 */
#define	RTF_UP		0x1		/* route usable */
#define	RTF_GATEWAY	0x2		/* destination is a gateway */
#define	RTF_HOST	0x4		/* host entry (net otherwise) */
#define	RTF_REJECT	0x8		/* host or net unreachable */
#define	RTF_DYNAMIC	0x10		/* created dynamically (by redirect) */
#define	RTF_MODIFIED	0x20		/* modified dynamically (by redirect) */
#define	RTF_DONE	0x40		/* message confirmed */
/*			0x80		   unused, was RTF_DELCLONE */
/*			0x100		   unused, was RTF_CLONING */
#define	RTF_XRESOLVE	0x200		/* external daemon resolves name */
/* RTF_LLINFO shares its value with RTF_LLDATA. */
#define	RTF_LLINFO	0x400		/* DEPRECATED - exists ONLY for backward
					   compatibility */
#define	RTF_LLDATA	0x400		/* used by apps to add/del L2 entries */
#define	RTF_STATIC	0x800		/* manually added */
#define	RTF_BLACKHOLE	0x1000		/* just discard pkts (during updates) */
#define	RTF_PROTO2	0x4000		/* protocol specific routing flag */
#define	RTF_PROTO1	0x8000		/* protocol specific routing flag */
/*			0x10000		   unused, was RTF_PRCLONING */
/*			0x20000		   unused, was RTF_WASCLONED */
#define	RTF_PROTO3	0x40000		/* protocol specific routing flag */
#define	RTF_FIXEDMTU	0x80000		/* MTU was explicitly specified */
#define	RTF_PINNED	0x100000	/* route is immutable */
#define	RTF_LOCAL	0x200000	/* route represents a local address */
#define	RTF_BROADCAST	0x400000	/* route represents a bcast address */
#define	RTF_MULTICAST	0x800000	/* route represents a mcast address */
					/* 0x1000000 through 0x8000000 unassigned */
#define	RTF_STICKY	0x10000000	/* always route dst->src */

/*			0x40000000	   unused, was RTF_RNH_LOCKED */

#define	RTF_GWFLAG_COMPAT 0x80000000	/* a compatibility bit for interacting
					   with existing routing apps */

/* Mask of RTF flags that are allowed to be modified by RTM_CHANGE. */
#define	RTF_FMASK	\
	(RTF_PROTO1 | RTF_PROTO2 | RTF_PROTO3 | RTF_BLACKHOLE | \
	 RTF_REJECT | RTF_STATIC | RTF_STICKY)

/*
 * fib_ nexthop API flags.
 */

/* Consumer-visible nexthop info flags */
#define	NHF_MULTIPATH		0x0008	/* Nexthop is a nexthop group */
#define	NHF_REJECT		0x0010	/* RTF_REJECT */
#define	NHF_BLACKHOLE		0x0020	/* RTF_BLACKHOLE */
#define	NHF_REDIRECT		0x0040	/* RTF_DYNAMIC|RTF_MODIFIED */
#define	NHF_DEFAULT		0x0080	/* Default route */
#define	NHF_BROADCAST		0x0100	/* RTF_BROADCAST */
#define	NHF_GATEWAY		0x0200	/* RTF_GATEWAY */
#define	NHF_HOST		0x0400	/* RTF_HOST */

/* Nexthop request flags */
#define	NHR_NONE		0x00	/* empty flags field */
#define	NHR_REF			0x01	/* reference nexthop */
#define	NHR_NODEFAULT		0x02	/* uRPF: do not consider default route */

/* Control plane route request flags */
#define	NHR_COPY		0x100	/* Copy rte data */
#define	NHR_UNLOCKED		0x200	/* Do not lock table */

/*
 * Routing statistics.
 */
struct rtstat {
	uint64_t rts_badredirect;	/* bogus redirect calls */
	uint64_t rts_dynamic;		/* routes created by redirects */
	uint64_t rts_newgateway;	/* routes modified by redirects */
	uint64_t rts_unreach;		/* lookups which failed */
	uint64_t rts_wildcard;		/* lookups satisfied by a wildcard */
	uint64_t rts_nh_idx_alloc_failure;	/* nexthop index alloc failure */
	uint64_t rts_nh_alloc_failure;	/* nexthop allocation failure */
	uint64_t rts_add_failure;	/* # of route addition failures */
	uint64_t rts_add_retry;		/* # of route addition retries */
	uint64_t rts_del_failure;	/* # of route deletion failure */
	uint64_t rts_del_retry;		/* # of route deletion retries */
};

246/*
247 * Structures for routing messages.
248 */
249struct rt_msghdr {
250 u_short rtm_msglen; /* to skip over non-understood messages */
251 u_char rtm_version; /* future binary compatibility */
252 u_char rtm_type; /* message type */
253 u_short rtm_index; /* index for associated ifp */
254 u_short _rtm_spare1;
255 int rtm_flags; /* flags, incl. kern & message, e.g. DONE */
256 int rtm_addrs; /* bitmask identifying sockaddrs in msg */
257 pid_t rtm_pid; /* identify sender */
258 int rtm_seq; /* for sender to identify action */
259 int rtm_errno; /* why failed */
260 int rtm_fmask; /* bitmask used in RTM_CHANGE message */
261 u_long rtm_inits; /* which metrics we are initializing */
262 struct rt_metrics rtm_rmx; /* metrics themselves */
263};
264
#define	RTM_VERSION	5	/* Up the ante and ignore older versions */

#ifndef NETLINK_COMPAT
/*
 * Message types.
 *
 * The format for each message is annotated below using the following
 * identifiers:
 *
 * (1) struct rt_msghdr
 * (2) struct ifa_msghdr
 * (3) struct if_msghdr
 * (4) struct ifma_msghdr
 * (5) struct if_announcemsghdr
 *
 */
#define	RTM_ADD		0x1	/* (1) Add Route */
#define	RTM_DELETE	0x2	/* (1) Delete Route */
#define	RTM_CHANGE	0x3	/* (1) Change Metrics or flags */
#define	RTM_GET		0x4	/* (1) Report Metrics */
#define	RTM_LOSING	0x5	/* (1) Kernel Suspects Partitioning */
#define	RTM_REDIRECT	0x6	/* (1) Told to use different route */
#define	RTM_MISS	0x7	/* (1) Lookup failed on this address */
#define	RTM_LOCK	0x8	/* (1) fix specified metrics */
		    /*	0x9  */
		    /*	0xa  */
#define	RTM_RESOLVE	0xb	/* (1) req to resolve dst to LL addr */
#define	RTM_NEWADDR	0xc	/* (2) address being added to iface */
#define	RTM_DELADDR	0xd	/* (2) address being removed from iface */
#define	RTM_IFINFO	0xe	/* (3) iface going up/down etc. */
#define	RTM_NEWMADDR	0xf	/* (4) mcast group membership being added to if */
#define	RTM_DELMADDR	0x10	/* (4) mcast group membership being deleted */
#define	RTM_IFANNOUNCE	0x11	/* (5) iface arrival/departure */
#define	RTM_IEEE80211	0x12	/* (5) IEEE80211 wireless event */

#endif /* NETLINK_COMPAT */

/*
 * Bitmask values for rtm_inits and rmx_locks.
 */
#define	RTV_MTU		0x1	/* init or lock _mtu */
#define	RTV_HOPCOUNT	0x2	/* init or lock _hopcount */
#define	RTV_EXPIRE	0x4	/* init or lock _expire */
#define	RTV_RPIPE	0x8	/* init or lock _recvpipe */
#define	RTV_SPIPE	0x10	/* init or lock _sendpipe */
#define	RTV_SSTHRESH	0x20	/* init or lock _ssthresh */
#define	RTV_RTT		0x40	/* init or lock _rtt */
#define	RTV_RTTVAR	0x80	/* init or lock _rttvar */
#define	RTV_WEIGHT	0x100	/* init or lock _weight */

#ifndef NETLINK_COMPAT

/*
 * Bitmask values for rtm_addrs.
 */
#define	RTA_DST		0x1	/* destination sockaddr present */
#define	RTA_GATEWAY	0x2	/* gateway sockaddr present */
#define	RTA_NETMASK	0x4	/* netmask sockaddr present */
#define	RTA_GENMASK	0x8	/* cloning mask sockaddr present */
#define	RTA_IFP		0x10	/* interface name sockaddr present */
#define	RTA_IFA		0x20	/* interface addr sockaddr present */
#define	RTA_AUTHOR	0x40	/* sockaddr for author of redirect */
#define	RTA_BRD		0x80	/* for NEWADDR, broadcast or p-p dest addr */

#endif /* NETLINK_COMPAT */

/*
 * Index offsets for sockaddr array for alternate internal encoding.
 * Each RTAX_ value names one slot of an RTAX_MAX-sized sockaddr
 * pointer array (such as rti_info[] in struct rt_addrinfo).
 */
#define	RTAX_DST	0	/* destination sockaddr slot */
#define	RTAX_GATEWAY	1	/* gateway sockaddr slot */
#define	RTAX_NETMASK	2	/* netmask sockaddr slot */
#define	RTAX_GENMASK	3	/* cloning mask sockaddr slot */
#define	RTAX_IFP	4	/* interface name sockaddr slot */
#define	RTAX_IFA	5	/* interface addr sockaddr slot */
#define	RTAX_AUTHOR	6	/* sockaddr for author of redirect */
#define	RTAX_BRD	7	/* for NEWADDR, broadcast or p-p dest addr */
#define	RTAX_MAX	8	/* size of array to allocate */

struct rtentry;
struct nhop_object;
/*
 * Filter callback type: receives a route entry, a nexthop object and an
 * opaque argument, and returns an int.  Stored in rt_addrinfo.rti_filter,
 * with the opaque argument presumably taken from rti_filterdata.
 */
typedef int rib_filter_f_t(const struct rtentry *, const struct nhop_object *,
	    void *);

349struct rt_addrinfo {
350 int rti_addrs; /* Route RTF_ flags */
351 int rti_flags; /* Route RTF_ flags */
352 struct sockaddr *rti_info[RTAX_MAX]; /* Sockaddr data */
353 struct ifaddr *rti_ifa; /* value of rt_ifa addr */
354 struct ifnet *rti_ifp; /* route interface */
355 rib_filter_f_t *rti_filter; /* filter function */
356 void *rti_filterdata; /* filter parameters */
357 u_long rti_mflags; /* metrics RTV_ flags */
358 u_long rti_spare; /* Will be used for fib */
359 struct rt_metrics *rti_rmx; /* Pointer to route metrics */
360};
361
/*
 * This macro returns the size of a struct sockaddr when passed
 * through a routing socket.  Basically we round up sa_len to
 * a multiple of sizeof(long), with a minimum of sizeof(long).
 * The case sa_len == 0 should only apply to empty structures.
 *
 * The argument is only read, so it is accessed through a const-qualified
 * pointer; note that it is evaluated twice.
 */
#define	SA_SIZE(sa)							\
    (  (((const struct sockaddr *)(sa))->sa_len == 0) ?		\
	sizeof(long)		:					\
	1 + ( (((const struct sockaddr *)(sa))->sa_len - 1) | (sizeof(long) - 1) ) )

/*
 * True when two sockaddrs have the same sa_len and their first sa_len
 * bytes compare equal.  Both arguments are evaluated more than once.
 */
#define	sa_equal(a, b) (	\
    (((const struct sockaddr *)(a))->sa_len == ((const struct sockaddr *)(b))->sa_len) && \
    (bcmp((a), (b), ((const struct sockaddr *)(b))->sa_len) == 0))

#ifdef _KERNEL

/*
 * True when the interface either does not advertise IFCAP_LINKSTATE in
 * if_capabilities or has if_link_state equal to LINK_STATE_UP.
 */
#define	RT_LINK_IS_UP(ifp)	(!((ifp)->if_capabilities & IFCAP_LINKSTATE) \
				 || (ifp)->if_link_state == LINK_STATE_UP)

/*
 * Release the nexthop referenced by ro_nh via NH_FREE(), if one is set,
 * and clear the pointer.
 */
#define	RO_NHFREE(_ro) do {					\
	if ((_ro)->ro_nh != NULL) {				\
		NH_FREE((_ro)->ro_nh);				\
		(_ro)->ro_nh = NULL;				\
	}							\
} while (0)

/*
 * Drop everything cached in a struct route: the link-layer entry via
 * LLE_FREE() and the nexthop via NH_FREE(), clearing each pointer after
 * it is released.  Pointers that are already NULL are left alone.
 */
#define	RO_INVALIDATE_CACHE(ro) do {					\
		if ((ro)->ro_lle != NULL) {				\
			LLE_FREE((ro)->ro_lle);				\
			(ro)->ro_lle = NULL;				\
		}							\
		if ((ro)->ro_nh != NULL) {				\
			NH_FREE((ro)->ro_nh);				\
			(ro)->ro_nh = NULL;				\
		}							\
	} while (0)

/*
 * Address family to use: the one stored in ro_dst when a route is
 * supplied and it has RT_HAS_GW set, otherwise the family of dst.
 * ro may be NULL.
 */
#define	RO_GET_FAMILY(ro, dst)	(((ro) != NULL &&		\
	((ro)->ro_flags & RT_HAS_GW) != 0)			\
	? (ro)->ro_dst.sa_family : (dst)->sa_family)

/*
 * Validate a cached route based on a supplied cookie.  If there is an
 * out-of-date cache, simply free it.  Update the generation number
 * for the new allocation.
 *
 * The temporary carries a macro-private name so that it cannot capture
 * a caller variable used in the ro, cookiep or fibnum arguments
 * (e.g. NH_VALIDATE(ro, &cookie, fib)).
 */
#define	NH_VALIDATE(ro, cookiep, fibnum) do {				\
	rt_gen_t _nh_gen = RT_GEN(fibnum, (ro)->ro_dst.sa_family);	\
	if (*(cookiep) != _nh_gen) {					\
		RO_INVALIDATE_CACHE(ro);				\
		*(cookiep) = _nh_gen;					\
	}								\
} while (0)

417struct ifmultiaddr;
418struct rib_head;
419
420void rt_ieee80211msg(struct ifnet *, int, void *, size_t);
421void rt_ifmsg(struct ifnet *, int);
422void rt_missmsg(int, struct rt_addrinfo *, int, int);
423void rt_missmsg_fib(int, struct rt_addrinfo *, int, int, int);
424int rt_addrmsg(int, struct ifaddr *, int);
425int rt_routemsg(int, struct rtentry *, struct nhop_object *, int);
426int rt_routemsg_info(int, struct rt_addrinfo *, int);
427void rt_newmaddrmsg(int, struct ifmultiaddr *);
428void rt_maskedcopy(const struct sockaddr *, struct sockaddr *,
429 const struct sockaddr *);
430struct rib_head *rt_table_init(int, int, u_int);
431void rt_table_destroy(struct rib_head *);
432u_int rt_tables_get_gen(uint32_t table, sa_family_t family);
433
434struct sockaddr *rtsock_fix_netmask(const struct sockaddr *dst,
435 const struct sockaddr *smask, struct sockaddr_storage *dmask);
436
437void rt_updatemtu(struct ifnet *);
438
439void rt_flushifroutes(struct ifnet *ifp);
440
441/* XXX MRT NEW VERSIONS THAT USE FIBs
442 * For now the protocol indepedent versions are the same as the AF_INET ones
443 * but this will change..
444 */
445int rtioctl_fib(u_long, caddr_t, u_int);
446
447/* New API */
448void rib_flush_routes_family(int family);
449struct nhop_object *rib_lookup(uint32_t fibnum, const struct sockaddr *dst,
450 uint32_t flags, uint32_t flowid);
451const char *rib_print_family(int family);
#endif /* _KERNEL */

#endif /* !_NET_ROUTE_H_ */