2 * Copyright (c) 2011 Nicira Networks.
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at:
8 * http://www.apache.org/licenses/LICENSE-2.0
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
19 #include "route-table.h"
22 #include <arpa/inet.h>
23 #include <sys/socket.h>
24 #include <linux/rtnetlink.h>
30 #include "netlink-socket.h"
32 #include "rtnetlink.h"
/* Declares this file's logging module under the name "route_table"; the
 * VLOG_*_RL() calls further down presumably log under that name. */
35 VLOG_DEFINE_THIS_MODULE(route_table);
/* Members of struct route_data, the identity of a single route.
 *
 * Instances are hashed and compared over their raw bytes (hash_route_data()
 * and route_node_lookup()), and are zero-filled before being populated
 * (memset() in route_table_parse(), xzalloc() in route_table_change()). */
38 /* Copied from struct rtmsg. */
/* Destination prefix length in bits; route_node_lookup_by_ip() derives the
 * netmask from it. */
39 unsigned char rtm_dst_len;
41 /* Extracted from Netlink attributes. */
42 uint32_t rta_dst; /* Destination in host byte order. 0 if missing. */
/* Read from the RTA_OIF attribute as a 32-bit unsigned value by
 * route_table_parse(). */
43 int rta_oif; /* Output interface index. */
46 /* A digested version of a route message sent down by the kernel to indicate
47 * that a route has changed. */
/* Filled in by route_table_parse() and consumed by route_table_change(). */
48 struct route_table_msg {
49 int nlmsg_type; /* e.g. RTM_NEWROUTE, RTM_DELROUTE. */
50 struct route_data rd; /* Data parsed from this message. */
/* Members of struct route_node, one entry of 'route_map'.  Entries are
 * allocated with xzalloc() in route_table_change() and inserted under
 * hash_route_data(&rd). */
54 struct hmap_node node; /* Node in route_map. */
55 struct route_data rd; /* Data associated with this node. */
/* Rate limiter shared by every VLOG_*_RL() call in this file. */
58 static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(5, 20);
/* Module state.  'register_count' gates the one-time setup in
 * route_table_register() and the teardown in route_table_unregister(), both
 * of which act only while it is zero. */
60 static unsigned int register_count = 0;
/* Handle returned by rtnetlink_create(); destroyed in
 * route_table_unregister(). */
61 static struct rtnetlink *rtn = NULL;
/* Passed to rtnetlink_create() together with the parse callback; presumably
 * the message storage that callback fills in -- confirm against rtnetlink. */
62 static struct route_table_msg rtmsg;
/* Notifier object handed to rtnetlink_notifier_register(). */
63 static struct rtnetlink_notifier notifier;
/* All known routes, as struct route_node entries keyed by
 * hash_route_data(). */
64 static struct hmap route_map;
/* Forward declarations of the file-local helpers defined further down. */
66 static int route_table_reset(void);
67 static bool route_table_parse(struct ofpbuf *, struct route_table_msg *);
68 static void route_table_change(const struct route_table_msg *, void *);
69 static struct route_node *route_node_lookup(const struct route_data *);
70 static struct route_node *route_node_lookup_by_ip(uint32_t ip);
71 static void route_map_clear(void);
72 static uint32_t hash_route_data(const struct route_data *);
74 /* Populates 'ifindex' with the interface index traffic destined for 'ip' is
75 * likely to egress. There is no hard guarantee that traffic destined for 'ip'
76 * will egress out the specified interface. 'ifindex' may refer to an
77 * interface which is not physical (such as a bridge port).
79 * Returns true if successful, otherwise false. */
81 route_table_get_ifindex(ovs_be32 ip_, int *ifindex)
83 struct route_node *rn;
/* 'ip_' is converted with ntohl() because route data keeps destinations in
 * host byte order. */
84 uint32_t ip = ntohl(ip_);
/* Most specific non-default route first; route_node_lookup_by_ip() never
 * returns a default route. */
88 rn = route_node_lookup_by_ip(ip);
91 *ifindex = rn->rd.rta_oif;
95 /* Choose a default route. */
/* A default route is an entry whose destination and prefix length are both
 * zero.  NOTE(review): presumably this scan is reached only when the lookup
 * above found nothing -- confirm the control flow around it. */
96 HMAP_FOR_EACH(rn, node, &route_map) {
97 if (rn->rd.rta_dst == 0 && rn->rd.rtm_dst_len == 0) {
98 *ifindex = rn->rd.rta_oif;
106 /* Users of the route_table module should register themselves with this
107 * function before making any other route_table function calls. */
109 route_table_register(void)
111 if (!register_count) {
112 rtnetlink_parse_func *pf;
113 rtnetlink_notify_func *nf;
117 pf = (rtnetlink_parse_func *) route_table_parse;
118 nf = (rtnetlink_notify_func *) route_table_change;
120 rtn = rtnetlink_create(RTNLGRP_IPV4_ROUTE, pf, &rtmsg);
121 rtnetlink_notifier_register(rtn, ¬ifier, nf, NULL);
123 hmap_init(&route_map);
130 /* Users of the route_table module should unregister themselves with this
131 * function when they will no longer be making any more route_table function
132 * calls. */
/* Drops one registration.  The teardown below runs only while
 * 'register_count' is zero.  NOTE(review): presumably the count is
 * decremented just before this test -- confirm. */
134 route_table_unregister(void)
138 if (!register_count) {
/* Last user gone: release the rtnetlink handle created in
 * route_table_register(). */
139 rtnetlink_destroy(rtn);
/* NOTE(review): hmap_destroy() is assumed not to free the route_node
 * entries themselves; confirm the map is emptied with route_map_clear()
 * first. */
143 hmap_destroy(&route_map);
147 /* Run periodically to update the locally maintained routing table. */
/* Delegates to rtnetlink_notifier_run() on the module's rtnetlink handle
 * 'rtn', which is NULL until route_table_register() has created it. */
149 route_table_run(void)
152 rtnetlink_notifier_run(rtn);
156 /* Causes poll_block() to wake up when route_table updates are required. */
/* Delegates to rtnetlink_notifier_wait() on the module's rtnetlink handle
 * 'rtn'. */
158 route_table_wait(void)
161 rtnetlink_notifier_wait(rtn);
/* Loads routes from a full kernel dump: opens a temporary NETLINK_ROUTE
 * socket, sends an RTM_GETROUTE request for AF_INET and feeds every reply
 * that route_table_parse() accepts through route_table_change().
 *
 * Declared as returning int; presumably 0 on success or the error from socket
 * creation or nl_dump_done() -- confirm. */
166 route_table_reset(void)
/* NOTE(review): this local 'rtmsg' shadows the file-scope
 * 'struct route_table_msg rtmsg'. */
170 struct rtgenmsg *rtmsg;
171 struct ofpbuf request, reply;
/* NOTE(review): the socket is created and destroyed within this call, so
 * 'static' storage looks unnecessary. */
172 static struct nl_sock *rtnl_sock;
176 error = nl_sock_create(NETLINK_ROUTE, 0, 0, 0, &rtnl_sock);
178 VLOG_WARN_RL(&rl, "failed to reset routing table, "
179 "cannot create RTNETLINK_ROUTE socket");
/* Build the dump request: a netlink header followed by a zeroed
 * struct rtgenmsg whose family selects IPv4. */
183 ofpbuf_init(&request, 0);
185 nl_msg_put_nlmsghdr(&request, sizeof *rtmsg, RTM_GETROUTE, NLM_F_REQUEST);
187 rtmsg = ofpbuf_put_zeros(&request, sizeof *rtmsg);
188 rtmsg->rtgen_family = AF_INET;
/* NOTE(review): no release of 'request' is visible after this point; confirm
 * whether nl_dump_start() takes ownership or an ofpbuf_uninit() is needed. */
190 nl_dump_start(&dump, rtnl_sock, &request);
/* Each reply goes through the same parse/apply path as an asynchronous
 * notification; 'msg' is only used when parsing succeeds. */
192 while (nl_dump_next(&dump, &reply)) {
193 struct route_table_msg msg;
195 if (route_table_parse(&reply, &msg)) {
196 route_table_change(&msg, NULL);
200 error = nl_dump_done(&dump);
201 nl_sock_destroy(rtnl_sock);
/* Parses the rtnetlink route message in 'buf' into 'change'.
 *
 * Declared as returning bool; presumably true only when the attributes parse
 * and the message is for AF_INET -- confirm.  'change' is written only on
 * the path that reaches the memset() below. */
208 route_table_parse(struct ofpbuf *buf, struct route_table_msg *change)
/* RTA_OIF is mandatory; RTA_DST may be absent. */
212 static const struct nl_policy policy[] = {
213 [RTA_DST] = { .type = NL_A_U32, .optional = true },
214 [RTA_OIF] = { .type = NL_A_U32, .optional = false },
/* NOTE(review): 'attrs' has static storage, so concurrent or nested calls
 * would share it. */
217 static struct nlattr *attrs[ARRAY_SIZE(policy)];
/* Attributes start after the netlink header and the fixed struct rtmsg. */
219 parsed = nl_policy_parse(buf, NLMSG_HDRLEN + sizeof(struct rtmsg),
220 policy, attrs, ARRAY_SIZE(policy));
223 const struct rtmsg *rtm;
224 const struct nlmsghdr *nlmsg;
/* The struct rtmsg sits immediately after the netlink header in 'buf'. */
227 rtm = (const struct rtmsg *) ((const char *) buf->data + NLMSG_HDRLEN);
229 if (rtm->rtm_family != AF_INET) {
230 VLOG_DBG_RL(&rl, "received non AF_INET rtnetlink route message");
/* Zero the whole struct, any padding included, because route data is later
 * hashed and compared bytewise.  This also leaves rta_dst at 0 when RTA_DST
 * is missing. */
234 memset(change, 0, sizeof *change);
236 change->nlmsg_type = nlmsg->nlmsg_type;
237 change->rd.rtm_dst_len = rtm->rtm_dst_len;
238 change->rd.rta_oif = nl_attr_get_u32(attrs[RTA_OIF]);
/* The destination is stored in host byte order. */
240 if (attrs[RTA_DST]) {
241 change->rd.rta_dst = ntohl(nl_attr_get_be32(attrs[RTA_DST]));
245 VLOG_DBG_RL(&rl, "received unparseable rtnetlink route message");
/* Applies one digested route message to 'route_map'.  'aux' is unused.
 *
 * RTM_NEWROUTE inserts the route unless an identical entry already exists;
 * RTM_DELROUTE removes the matching entry if there is one. */
252 route_table_change(const struct route_table_msg *change, void *aux OVS_UNUSED)
/* NOTE(review): presumably reached when 'change' is NULL; whatever recovery
 * follows this log line is not shown here -- confirm. */
255 VLOG_DBG_RL(&rl, "received NULL change message");
257 } else if (change->nlmsg_type == RTM_NEWROUTE) {
258 if (!route_node_lookup(&change->rd)) {
259 struct route_node *rn;
/* xzalloc() zero-fills the node, so the bytes hashed and compared later are
 * exactly those copied from 'change'. */
261 rn = xzalloc(sizeof *rn);
262 memcpy(&rn->rd, &change->rd, sizeof change->rd);
264 hmap_insert(&route_map, &rn->node, hash_route_data(&rn->rd));
266 VLOG_DBG_RL(&rl, "skipping insertion of duplicate route entry");
268 } else if (change->nlmsg_type == RTM_DELROUTE) {
269 struct route_node *rn;
271 rn = route_node_lookup(&change->rd);
/* NOTE(review): the node was allocated with xzalloc(); confirm it is freed
 * after being unlinked. */
274 hmap_remove(&route_map, &rn->node);
277 VLOG_DBG_RL(&rl, "skipping deletion of non-existent route entry");
/* Looks for the node in 'route_map' whose route data is byte-for-byte equal
 * to 'rd'.  Only the bucket for hash_route_data(rd) is scanned. */
282 static struct route_node *
283 route_node_lookup(const struct route_data *rd)
285 struct route_node *rn;
287 HMAP_FOR_EACH_WITH_HASH(rn, node, hash_route_data(rd), &route_map) {
/* Bytewise comparison over the whole struct, any padding included. */
288 if (!memcmp(&rn->rd, rd, sizeof *rd)) {
296 static struct route_node *
297 route_node_lookup_by_ip(uint32_t ip)
300 struct route_node *rn, *rn_ret;
305 HMAP_FOR_EACH(rn, node, &route_map) {
306 uint32_t mask = 0xffffffff << (32 - rn->rd.rtm_dst_len);
308 if (rn->rd.rta_dst == 0 && rn->rd.rtm_dst_len == 0) {
313 if (rn->rd.rtm_dst_len > dst_len &&
314 (ip & mask) == (rn->rd.rta_dst & mask)) {
316 dst_len = rn->rd.rtm_dst_len;
/* Unlinks every node from 'route_map'. */
324 route_map_clear(void)
326 struct route_node *rn, *rn_next;
/* The _SAFE iterator is used because nodes are removed while iterating. */
328 HMAP_FOR_EACH_SAFE(rn, rn_next, node, &route_map) {
/* NOTE(review): nodes come from xzalloc() in route_table_change(); confirm
 * each one is freed after being removed. */
329 hmap_remove(&route_map, &rn->node);
/* Hashes the raw bytes of '*rd' with basis 0.  Any padding inside the struct
 * is included, so callers must pass zero-initialized route data. */
335 hash_route_data(const struct route_data *rd)
337 return hash_bytes(rd, sizeof *rd, 0);