/*
- * Copyright (c) 2011, 2012, 2013, 2014 Nicira, Inc.
+ * Copyright (c) 2011, 2012, 2013, 2014, 2017 Nicira, Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
#include "route-table.h"
#include <errno.h>
+#include <sys/types.h>
+#include <netinet/in.h>
#include <arpa/inet.h>
#include <sys/socket.h>
#include <linux/rtnetlink.h>
#include <net/if.h>
#include "hash.h"
+#include "netdev.h"
#include "netlink.h"
#include "netlink-notifier.h"
#include "netlink-socket.h"
-#include "ofpbuf.h"
+#include "openvswitch/ofpbuf.h"
#include "ovs-router.h"
-#include "ovs-router-linux.h"
-#include "rtnetlink-link.h"
-#include "vlog.h"
+#include "packets.h"
+#include "rtnetlink.h"
+#include "tnl-ports.h"
+#include "openvswitch/vlog.h"
+
+/* Linux 2.6.36 added RTA_MARK, so define it just in case we're building with
+ * old headers. (We can't test for it with #ifdef because it's an enum.) */
+#define RTA_MARK 16
VLOG_DEFINE_THIS_MODULE(route_table);
struct route_data {
/* Copied from struct rtmsg. */
unsigned char rtm_dst_len;
+ bool local; /* True if the message's rtm_type is RTN_LOCAL. */
/* Extracted from Netlink attributes. */
- ovs_be32 rta_dst; /* 0 if missing. */
- ovs_be32 rta_gw;
+ struct in6_addr rta_dst; /* IPv4 destinations are stored via
+ * in6_addr_set_mapped_ipv4(). If RTA_DST is
+ * missing: mapped 0 for IPv4, all-zeros for
+ * IPv6. */
+ struct in6_addr rta_gw; /* All-zeros if RTA_GATEWAY is missing; IPv4
+ * gateways are stored via
+ * in6_addr_set_mapped_ipv4(). */
char ifname[IFNAMSIZ]; /* Interface name. */
+ uint32_t mark; /* Value of RTA_MARK; 0 if missing. */
};
/* A digested version of a route message sent down by the kernel to indicate
* every time route_table_reset() is called. */
static uint64_t rt_change_seq;
-static unsigned int register_count = 0;
static struct nln *nln = NULL;
static struct route_table_msg rtmsg;
static struct nln_notifier *route_notifier = NULL;
+static struct nln_notifier *route6_notifier = NULL;
static struct nln_notifier *name_notifier = NULL;
static bool route_table_valid = false;
static int route_table_reset(void);
static void route_table_handle_msg(const struct route_table_msg *);
-static bool route_table_parse(struct ofpbuf *, struct route_table_msg *);
+static int route_table_parse(struct ofpbuf *, struct route_table_msg *);
static void route_table_change(const struct route_table_msg *, void *);
static void route_map_clear(void);
static void name_table_init(void);
-static void name_table_uninit(void);
-static void name_table_change(const struct rtnetlink_link_change *, void *);
+static void name_table_change(const struct rtnetlink_change *, void *);
uint64_t
route_table_get_change_seq(void)
/* Users of the route_table module should register themselves with this
* function before making any other route_table function calls. */
void
-route_table_register(void)
+route_table_init(void)
OVS_EXCLUDED(route_table_mutex)
{
ovs_mutex_lock(&route_table_mutex);
- if (!register_count) {
- ovs_assert(!nln);
- ovs_assert(!route_notifier);
-
- ovs_router_init();
- nln = nln_create(NETLINK_ROUTE, RTNLGRP_IPV4_ROUTE,
- (nln_parse_func *) route_table_parse, &rtmsg);
+ ovs_assert(!nln); /* The three asserts require that no nln or route
+ * notifier exists yet, i.e. this runs only once. */
+ ovs_assert(!route_notifier);
+ ovs_assert(!route6_notifier);
- route_notifier =
- nln_notifier_create(nln, (nln_notify_func *) route_table_change,
- NULL);
+ ovs_router_init();
+ nln = nln_create(NETLINK_ROUTE, (nln_parse_func *) route_table_parse,
+ &rtmsg);
- route_table_reset();
- name_table_init();
- }
-
- register_count++;
- ovs_mutex_unlock(&route_table_mutex);
-}
-
-/* Users of the route_table module should unregister themselves with this
- * function when they will no longer be making any more route_table fuction
- * calls. */
-void
-route_table_unregister(void)
- OVS_EXCLUDED(route_table_mutex)
-{
- ovs_mutex_lock(&route_table_mutex);
- register_count--;
+ route_notifier =
+ nln_notifier_create(nln, RTNLGRP_IPV4_ROUTE,
+ (nln_notify_func *) route_table_change, NULL); /* IPv4 group. */
+ route6_notifier =
+ nln_notifier_create(nln, RTNLGRP_IPV6_ROUTE,
+ (nln_notify_func *) route_table_change, NULL); /* IPv6 group. */
- if (!register_count) {
- nln_notifier_destroy(route_notifier);
- route_notifier = NULL;
- nln_destroy(nln);
- nln = NULL;
+ route_table_reset(); /* Return value is not checked here. */
+ name_table_init(); /* Registers name_table_change() with rtnetlink. */
- route_map_clear();
- name_table_uninit();
- }
ovs_mutex_unlock(&route_table_mutex);
}
{
ovs_mutex_lock(&route_table_mutex);
if (nln) {
- rtnetlink_link_run();
+ rtnetlink_run();
nln_run(nln);
if (!route_table_valid) {
{
ovs_mutex_lock(&route_table_mutex);
if (nln) {
- rtnetlink_link_wait();
+ rtnetlink_wait();
nln_wait(nln);
}
ovs_mutex_unlock(&route_table_mutex);
route_table_reset(void)
{
struct nl_dump dump;
- struct rtgenmsg *rtmsg;
+ struct rtgenmsg *rtgenmsg;
uint64_t reply_stub[NL_DUMP_BUFSIZE / 8];
struct ofpbuf request, reply, buf;
route_map_clear();
+ netdev_get_addrs_list_flush();
route_table_valid = true;
rt_change_seq++;
ofpbuf_init(&request, 0);
- nl_msg_put_nlmsghdr(&request, sizeof *rtmsg, RTM_GETROUTE, NLM_F_REQUEST);
+ nl_msg_put_nlmsghdr(&request, sizeof *rtgenmsg, RTM_GETROUTE,
+ NLM_F_REQUEST);
- rtmsg = ofpbuf_put_zeros(&request, sizeof *rtmsg);
- rtmsg->rtgen_family = AF_INET;
+ rtgenmsg = ofpbuf_put_zeros(&request, sizeof *rtgenmsg);
+ rtgenmsg->rtgen_family = AF_UNSPEC;
nl_dump_start(&dump, NETLINK_ROUTE, &request);
ofpbuf_uninit(&request);
return nl_dump_done(&dump);
}
-
-static bool
+/* Parses the rtnetlink route message in 'buf' into 'change'.
+ *
+ * Returns RTNLGRP_IPV4_ROUTE or RTNLGRP_IPV6_ROUTE on success. Returns 0 on
+ * parse error: 'buf' is too short to hold a struct rtmsg, the address family
+ * is neither AF_INET nor AF_INET6, the attributes do not satisfy the policy,
+ * or looking up the output interface name fails with an error other than
+ * ENXIO. */
+static int
route_table_parse(struct ofpbuf *buf, struct route_table_msg *change)
{
- bool parsed;
+ bool parsed, ipv4 = false;
static const struct nl_policy policy[] = {
[RTA_DST] = { .type = NL_A_U32, .optional = true },
- [RTA_OIF] = { .type = NL_A_U32, .optional = false },
+ [RTA_OIF] = { .type = NL_A_U32, .optional = true },
[RTA_GATEWAY] = { .type = NL_A_U32, .optional = true },
+ [RTA_MARK] = { .type = NL_A_U32, .optional = true },
+ };
+
+ static const struct nl_policy policy6[] = {
+ [RTA_DST] = { .type = NL_A_IPV6, .optional = true },
+ [RTA_OIF] = { .type = NL_A_U32, .optional = true },
+ [RTA_MARK] = { .type = NL_A_U32, .optional = true },
+ [RTA_GATEWAY] = { .type = NL_A_IPV6, .optional = true },
};
struct nlattr *attrs[ARRAY_SIZE(policy)];
+ /* 'attrs' is sized from 'policy' but is also filled using 'policy6'. Both
+ * arrays have RTA_MARK as their highest index, so their sizes match. */
+ const struct rtmsg *rtm;
- parsed = nl_policy_parse(buf, NLMSG_HDRLEN + sizeof(struct rtmsg),
- policy, attrs, ARRAY_SIZE(policy));
+ rtm = ofpbuf_at(buf, NLMSG_HDRLEN, sizeof *rtm);
+ if (!rtm) {
+ /* ofpbuf_at() yields NULL when 'buf' does not contain a complete
+ * struct rtmsg after the Netlink header; do not dereference it. */
+ VLOG_DBG_RL(&rl, "received unparseable rtnetlink route message");
+ return 0;
+ }
+
+ if (rtm->rtm_family == AF_INET) {
+ parsed = nl_policy_parse(buf, NLMSG_HDRLEN + sizeof(struct rtmsg),
+ policy, attrs, ARRAY_SIZE(policy));
+ ipv4 = true;
+ } else if (rtm->rtm_family == AF_INET6) {
+ parsed = nl_policy_parse(buf, NLMSG_HDRLEN + sizeof(struct rtmsg),
+ policy6, attrs, ARRAY_SIZE(policy6));
+ } else {
+ VLOG_DBG_RL(&rl, "received non AF_INET/AF_INET6 rtnetlink route "
+ "message");
+ return 0;
+ }
if (parsed) {
- const struct rtmsg *rtm;
const struct nlmsghdr *nlmsg;
int rta_oif; /* Output interface index. */
- nlmsg = ofpbuf_data(buf);
- rtm = ofpbuf_at(buf, NLMSG_HDRLEN, sizeof *rtm);
-
- if (rtm->rtm_family != AF_INET) {
- VLOG_DBG_RL(&rl, "received non AF_INET rtnetlink route message");
- return false;
- }
+ nlmsg = buf->data;
memset(change, 0, sizeof *change);
change->relevant = true;
change->relevant = false;
}
change->nlmsg_type = nlmsg->nlmsg_type;
- change->rd.rtm_dst_len = rtm->rtm_dst_len;
- rta_oif = nl_attr_get_u32(attrs[RTA_OIF]);
-
- if (!if_indextoname(rta_oif, change->rd.ifname)) {
- int error = errno;
-
- VLOG_DBG_RL(&rl, "Could not find interface name[%u]: %s",
- rta_oif, ovs_strerror(error));
- return false;
+ /* IPv4 addresses are stored in a struct in6_addr through
+ * in6_addr_set_mapped_ipv4(), so an IPv4 prefix length is shifted by
+ * the 96 leading bits of that representation. */
+ change->rd.rtm_dst_len = rtm->rtm_dst_len + (ipv4 ? 96 : 0);
+ change->rd.local = rtm->rtm_type == RTN_LOCAL;
+ if (attrs[RTA_OIF]) {
+ rta_oif = nl_attr_get_u32(attrs[RTA_OIF]);
+
+ if (!if_indextoname(rta_oif, change->rd.ifname)) {
+ /* Save errno before logging can overwrite it. */
+ int error = errno;
+
+ VLOG_DBG_RL(&rl, "Could not find interface name[%u]: %s",
+ rta_oif, ovs_strerror(error));
+ if (error == ENXIO) {
+ /* No interface has this index: keep parsing but mark the
+ * message as irrelevant instead of failing the parse. */
+ change->relevant = false;
+ } else {
+ return 0;
+ }
+ }
}
if (attrs[RTA_DST]) {
- change->rd.rta_dst = nl_attr_get_be32(attrs[RTA_DST]);
+ if (ipv4) {
+ ovs_be32 dst;
+ dst = nl_attr_get_be32(attrs[RTA_DST]);
+ in6_addr_set_mapped_ipv4(&change->rd.rta_dst, dst);
+ } else {
+ change->rd.rta_dst = nl_attr_get_in6_addr(attrs[RTA_DST]);
+ }
+ } else if (ipv4) {
+ /* Missing IPv4 destination: store the mapped form of address 0. */
+ in6_addr_set_mapped_ipv4(&change->rd.rta_dst, 0);
}
if (attrs[RTA_GATEWAY]) {
- change->rd.rta_gw = nl_attr_get_be32(attrs[RTA_GATEWAY]);
+ if (ipv4) {
+ ovs_be32 gw;
+ gw = nl_attr_get_be32(attrs[RTA_GATEWAY]);
+ in6_addr_set_mapped_ipv4(&change->rd.rta_gw, gw);
+ } else {
+ change->rd.rta_gw = nl_attr_get_in6_addr(attrs[RTA_GATEWAY]);
+ }
+ }
+ if (attrs[RTA_MARK]) {
+ change->rd.mark = nl_attr_get_u32(attrs[RTA_MARK]);
}
-
-
} else {
VLOG_DBG_RL(&rl, "received unparseable rtnetlink route message");
+ return 0;
}
- return parsed;
+ /* Success. */
+ return ipv4 ? RTNLGRP_IPV4_ROUTE : RTNLGRP_IPV6_ROUTE;
}
static void
if (change->relevant && change->nlmsg_type == RTM_NEWROUTE) {
const struct route_data *rd = &change->rd;
- ovs_router_insert(rd->rta_dst, rd->rtm_dst_len,
- rd->ifname, rd->rta_gw);
+ ovs_router_insert(rd->mark, &rd->rta_dst, rd->rtm_dst_len,
+ rd->local, rd->ifname, &rd->rta_gw);
}
}
ovs_router_flush();
}
+/* Fallback route lookup. This implementation never reports a route: it
+ * ignores 'ip6_dst' and 'name', stores the IPv6 unspecified address in
+ * '*gw6', and returns false. */
+bool
+route_table_fallback_lookup(const struct in6_addr *ip6_dst OVS_UNUSED,
+ char name[] OVS_UNUSED,
+ struct in6_addr *gw6)
+{
+ /* Same value as in6addr_any. */
+ static const struct in6_addr no_gateway = IN6ADDR_ANY_INIT;
+
+ *gw6 = no_gateway;
+ return false;
+}
+
\f
/* name_table . */
static void
name_table_init(void)
{
- name_notifier = rtnetlink_link_notifier_create(name_table_change, NULL);
+ name_notifier = rtnetlink_notifier_create(name_table_change, NULL); /*
+ * Registers name_table_change() as the callback, with a NULL aux pointer,
+ * and keeps the returned notifier in 'name_notifier'. */
}
-static void
-name_table_uninit(void)
-{
- rtnetlink_link_notifier_destroy(name_notifier);
- name_notifier = NULL;
-}
static void
-name_table_change(const struct rtnetlink_link_change *change OVS_UNUSED,
+name_table_change(const struct rtnetlink_change *change,
void *aux OVS_UNUSED)
{
/* Changes to interface status can cause routing table changes that some
* versions of the linux kernel do not advertise for some reason. */
route_table_valid = false;
+ /* For an RTM_DELLINK change that carries an interface name, also pass
+ * that name to tnl_port_map_delete_ipdev(). 'change' is NULL-checked
+ * before use. */
+ if (change && change->nlmsg_type == RTM_DELLINK) {
+ if (change->ifname) {
+ tnl_port_map_delete_ipdev(change->ifname);
+ }
+ }
}