/*
- * Copyright (c) 2011 Nicira Networks.
+ * Copyright (c) 2011, 2012, 2013, 2014 Nicira, Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
#include "route-table.h"
-#include <assert.h>
+#include <errno.h>
#include <arpa/inet.h>
#include <sys/socket.h>
#include <linux/rtnetlink.h>
#include <net/if.h>
#include "hash.h"
-#include "hmap.h"
#include "netlink.h"
+#include "netlink-notifier.h"
#include "netlink-socket.h"
#include "ofpbuf.h"
-#include "rtnetlink.h"
-#include "vlog.h"
+#include "ovs-router.h"
+#include "rtnetlink-link.h"
+#include "openvswitch/vlog.h"
VLOG_DEFINE_THIS_MODULE(route_table);
unsigned char rtm_dst_len;
/* Extracted from Netlink attributes. */
- uint32_t rta_dst; /* Destination in host byte order. 0 if missing. */
- int rta_oif; /* Output interface index. */
+ ovs_be32 rta_dst; /* 0 if missing. */
+ ovs_be32 rta_gw;
+ char ifname[IFNAMSIZ]; /* Interface name. */
};
/* A digested version of a route message sent down by the kernel to indicate
struct route_data rd; /* Data parsed from this message. */
};
-struct route_node {
- struct hmap_node node; /* Node in route_map. */
- struct route_data rd; /* Data associated with this node. */
-};
-
+static struct ovs_mutex route_table_mutex = OVS_MUTEX_INITIALIZER;
static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(5, 20);
-static unsigned int register_count = 0;
-static struct rtnetlink *rtn = NULL;
+/* Global change number for route-table, which should be incremented
+ * every time route_table_reset() is called. */
+static uint64_t rt_change_seq;
+
+static struct nln *nln = NULL;
static struct route_table_msg rtmsg;
-static struct rtnetlink_notifier notifier;
+static struct nln_notifier *route_notifier = NULL;
+static struct nln_notifier *name_notifier = NULL;
static bool route_table_valid = false;
-static struct hmap route_map;
static int route_table_reset(void);
static void route_table_handle_msg(const struct route_table_msg *);
static bool route_table_parse(struct ofpbuf *, struct route_table_msg *);
static void route_table_change(const struct route_table_msg *, void *);
-static struct route_node *route_node_lookup(const struct route_data *);
-static struct route_node *route_node_lookup_by_ip(uint32_t ip);
static void route_map_clear(void);
-static uint32_t hash_route_data(const struct route_data *);
-
-/* Populates 'ifindex' with the interface index traffic destined for 'ip' is
- * likely to egress. There is no hard guarantee that traffic destined for 'ip'
- * will egress out the specified interface. 'ifindex' may refer to an
- * interface which is not physical (such as a bridge port).
- *
- * Returns true if successful, otherwise false. */
-bool
-route_table_get_ifindex(ovs_be32 ip_, int *ifindex)
-{
- struct route_node *rn;
- uint32_t ip = ntohl(ip_);
-
- *ifindex = 0;
- if (!route_table_valid) {
- route_table_reset();
- }
-
- rn = route_node_lookup_by_ip(ip);
-
- if (rn) {
- *ifindex = rn->rd.rta_oif;
- return true;
- }
+static void name_table_init(void);
+static void name_table_change(const struct rtnetlink_link_change *, void *);
- /* Choose a default route. */
- HMAP_FOR_EACH(rn, node, &route_map) {
- if (rn->rd.rta_dst == 0 && rn->rd.rtm_dst_len == 0) {
- *ifindex = rn->rd.rta_oif;
- return true;
- }
- }
-
- return false;
+uint64_t
+route_table_get_change_seq(void)
+{
+ return rt_change_seq;
}
/* Users of the route_table module should register themselves with this
* function before making any other route_table function calls. */
void
-route_table_register(void)
+route_table_init(void)
+ OVS_EXCLUDED(route_table_mutex)
{
- if (!register_count) {
- rtnetlink_parse_func *pf;
- rtnetlink_notify_func *nf;
-
- assert(!rtn);
+ ovs_mutex_lock(&route_table_mutex);
+ ovs_assert(!nln);
+ ovs_assert(!route_notifier);
- pf = (rtnetlink_parse_func *) route_table_parse;
- nf = (rtnetlink_notify_func *) route_table_change;
+ ovs_router_init();
+ nln = nln_create(NETLINK_ROUTE, RTNLGRP_IPV4_ROUTE,
+ (nln_parse_func *) route_table_parse, &rtmsg);
- rtn = rtnetlink_create(RTNLGRP_IPV4_ROUTE, pf, &rtmsg);
- rtnetlink_notifier_register(rtn, ¬ifier, nf, NULL);
+ route_notifier =
+ nln_notifier_create(nln, (nln_notify_func *) route_table_change,
+ NULL);
- hmap_init(&route_map);
- route_table_reset();
- }
+ route_table_reset();
+ name_table_init();
- register_count++;
-}
-
-/* Users of the route_table module should unregister themselves with this
- * function when they will no longer be making any more route_table fuction
- * calls. */
-void
-route_table_unregister(void)
-{
- register_count--;
-
- if (!register_count) {
- rtnetlink_destroy(rtn);
- rtn = NULL;
-
- route_map_clear();
- hmap_destroy(&route_map);
- }
+ ovs_mutex_unlock(&route_table_mutex);
}
/* Run periodically to update the locally maintained routing table. */
void
route_table_run(void)
+ OVS_EXCLUDED(route_table_mutex)
{
- if (rtn) {
- rtnetlink_notifier_run(rtn);
+ ovs_mutex_lock(&route_table_mutex);
+ if (nln) {
+ rtnetlink_link_run();
+ nln_run(nln);
+
+ if (!route_table_valid) {
+ route_table_reset();
+ }
}
+ ovs_mutex_unlock(&route_table_mutex);
}
/* Causes poll_block() to wake up when route_table updates are required. */
void
route_table_wait(void)
+ OVS_EXCLUDED(route_table_mutex)
{
- if (rtn) {
- rtnetlink_notifier_wait(rtn);
+ ovs_mutex_lock(&route_table_mutex);
+ if (nln) {
+ rtnetlink_link_wait();
+ nln_wait(nln);
}
+ ovs_mutex_unlock(&route_table_mutex);
}
static int
route_table_reset(void)
{
- int error;
struct nl_dump dump;
struct rtgenmsg *rtmsg;
- struct ofpbuf request, reply;
- static struct nl_sock *rtnl_sock;
+ uint64_t reply_stub[NL_DUMP_BUFSIZE / 8];
+ struct ofpbuf request, reply, buf;
route_map_clear();
route_table_valid = true;
-
- error = nl_sock_create(NETLINK_ROUTE, &rtnl_sock);
- if (error) {
- VLOG_WARN_RL(&rl, "failed to reset routing table, "
- "cannot create RTNETLINK_ROUTE socket");
- return error;
- }
+ rt_change_seq++;
ofpbuf_init(&request, 0);
rtmsg = ofpbuf_put_zeros(&request, sizeof *rtmsg);
rtmsg->rtgen_family = AF_INET;
- nl_dump_start(&dump, rtnl_sock, &request);
+ nl_dump_start(&dump, NETLINK_ROUTE, &request);
+ ofpbuf_uninit(&request);
- while (nl_dump_next(&dump, &reply)) {
+ ofpbuf_use_stub(&buf, reply_stub, sizeof reply_stub);
+ while (nl_dump_next(&dump, &reply, &buf)) {
struct route_table_msg msg;
if (route_table_parse(&reply, &msg)) {
route_table_handle_msg(&msg);
}
}
+ ofpbuf_uninit(&buf);
- error = nl_dump_done(&dump);
- nl_sock_destroy(rtnl_sock);
-
- return error;
+ return nl_dump_done(&dump);
}
static const struct nl_policy policy[] = {
[RTA_DST] = { .type = NL_A_U32, .optional = true },
[RTA_OIF] = { .type = NL_A_U32, .optional = false },
+ [RTA_GATEWAY] = { .type = NL_A_U32, .optional = true },
};
- static struct nlattr *attrs[ARRAY_SIZE(policy)];
+ struct nlattr *attrs[ARRAY_SIZE(policy)];
parsed = nl_policy_parse(buf, NLMSG_HDRLEN + sizeof(struct rtmsg),
policy, attrs, ARRAY_SIZE(policy));
if (parsed) {
const struct rtmsg *rtm;
const struct nlmsghdr *nlmsg;
+ int rta_oif; /* Output interface index. */
nlmsg = buf->data;
- rtm = (const struct rtmsg *) ((const char *) buf->data + NLMSG_HDRLEN);
+ rtm = ofpbuf_at(buf, NLMSG_HDRLEN, sizeof *rtm);
if (rtm->rtm_family != AF_INET) {
VLOG_DBG_RL(&rl, "received non AF_INET rtnetlink route message");
rtm->rtm_type != RTN_LOCAL) {
change->relevant = false;
}
-
change->nlmsg_type = nlmsg->nlmsg_type;
change->rd.rtm_dst_len = rtm->rtm_dst_len;
- change->rd.rta_oif = nl_attr_get_u32(attrs[RTA_OIF]);
+ rta_oif = nl_attr_get_u32(attrs[RTA_OIF]);
+
+ if (!if_indextoname(rta_oif, change->rd.ifname)) {
+ int error = errno;
+
+ VLOG_DBG_RL(&rl, "Could not find interface name[%u]: %s",
+ rta_oif, ovs_strerror(error));
+ return false;
+ }
if (attrs[RTA_DST]) {
- change->rd.rta_dst = ntohl(nl_attr_get_be32(attrs[RTA_DST]));
+ change->rd.rta_dst = nl_attr_get_be32(attrs[RTA_DST]);
+ }
+ if (attrs[RTA_GATEWAY]) {
+ change->rd.rta_gw = nl_attr_get_be32(attrs[RTA_GATEWAY]);
}
+
} else {
VLOG_DBG_RL(&rl, "received unparseable rtnetlink route message");
}
static void
route_table_handle_msg(const struct route_table_msg *change)
{
- if (change->relevant && change->nlmsg_type == RTM_NEWROUTE &&
- !route_node_lookup(&change->rd)) {
- struct route_node *rn;
-
- rn = xzalloc(sizeof *rn);
- memcpy(&rn->rd, &change->rd, sizeof change->rd);
+ if (change->relevant && change->nlmsg_type == RTM_NEWROUTE) {
+ const struct route_data *rd = &change->rd;
- hmap_insert(&route_map, &rn->node, hash_route_data(&rn->rd));
+ ovs_router_insert(rd->rta_dst, rd->rtm_dst_len,
+ rd->ifname, rd->rta_gw);
}
}
-static struct route_node *
-route_node_lookup(const struct route_data *rd)
+static void
+route_map_clear(void)
{
- struct route_node *rn;
-
- HMAP_FOR_EACH_WITH_HASH(rn, node, hash_route_data(rd), &route_map) {
- if (!memcmp(&rn->rd, rd, sizeof *rd)) {
- return rn;
- }
- }
-
- return NULL;
+ ovs_router_flush();
}
-static struct route_node *
-route_node_lookup_by_ip(uint32_t ip)
+bool
+route_table_fallback_lookup(ovs_be32 ip_dst OVS_UNUSED,
+ char output_bridge[] OVS_UNUSED,
+ ovs_be32 *gw)
{
- int dst_len;
- struct route_node *rn, *rn_ret;
-
- dst_len = -1;
- rn_ret = NULL;
-
- HMAP_FOR_EACH(rn, node, &route_map) {
- uint32_t mask = 0xffffffff << (32 - rn->rd.rtm_dst_len);
-
- if (rn->rd.rta_dst == 0 && rn->rd.rtm_dst_len == 0) {
- /* Default route. */
- continue;
- }
-
- if (rn->rd.rtm_dst_len > dst_len &&
- (ip & mask) == (rn->rd.rta_dst & mask)) {
- rn_ret = rn;
- dst_len = rn->rd.rtm_dst_len;
- }
- }
-
- return rn_ret;
+ *gw = 0;
+ return false;
}
+\f
+/* name_table. */
+
static void
-route_map_clear(void)
+name_table_init(void)
{
- struct route_node *rn, *rn_next;
-
- HMAP_FOR_EACH_SAFE(rn, rn_next, node, &route_map) {
- hmap_remove(&route_map, &rn->node);
- free(rn);
- }
+ name_notifier = rtnetlink_link_notifier_create(name_table_change, NULL);
}
-static uint32_t
-hash_route_data(const struct route_data *rd)
+
+static void
+name_table_change(const struct rtnetlink_link_change *change OVS_UNUSED,
+ void *aux OVS_UNUSED)
{
- return hash_bytes(rd, sizeof *rd, 0);
+ /* Changes to interface status can cause routing table changes that some
+ * versions of the Linux kernel do not advertise for some reason. Mark the
+ * table invalid so that the next route_table_run() rebuilds it. */
+ route_table_valid = false;
}