From: Anders K. Pedersen <a...@cohaesio.com>

Add nftables inet family support for an rt nexthop expression allowing
usage of the routing nexthop (i.e. the directly connected IP address that
an outgoing packet is sent to) for matching or accounting, e.g.

 # nft add rule inet filter postrouting \
        ether type ip6 \
        ip6 daddr fd01::/16 rt ip6 nexthop != fd00::1 drop

This will drop any traffic to fd01::/16 that is not routed via fd00::1.
Note that "ether type" must be specified explicitly when rt nexthop is
used from inet family tables.

 # nft add rule inet filter postrouting \
        ether type ip \
        flow table acct { rt ip nexthop timeout 600s counter }
 # nft add rule inet filter postrouting \
        ether type ip6 \
        flow table acct { rt ip6 nexthop timeout 600s counter }

These rules count outgoing traffic per nexthop. Note that the timeout
releases an entry if no traffic is seen for this nexthop within 10 minutes.

Signed-off-by: Anders K. Pedersen <a...@cohaesio.com>
---
 net/netfilter/Kconfig                    |   5 ++
 net/netfilter/Makefile                   |   1 +
 net/netfilter/nft_rt_inet.c              | 150 +++++++++++++++++++++++++++++++
 3 files changed, 156 insertions(+)

diff --git a/net/netfilter/Kconfig b/net/netfilter/Kconfig
--- a/net/netfilter/Kconfig
+++ b/net/netfilter/Kconfig
@@ -480,6 +480,11 @@ config NFT_META
          This option adds the "rt" expression that you can use to match
          packet routing information such as the packet nexthop.

+config NFT_RT_INET
+       depends on NF_TABLES_INET
+       default NFT_RT
+       tristate
+
 config NFT_NUMGEN
        tristate "Netfilter nf_tables number generator module"
        help
diff --git a/net/netfilter/Makefile b/net/netfilter/Makefile
--- a/net/netfilter/Makefile
+++ b/net/netfilter/Makefile
@@ -82,6 +82,7 @@ obj-$(CONFIG_NF_TABLES_NETDEV)        += nf_tables_netdev.o
 obj-$(CONFIG_NFT_EXTHDR)       += nft_exthdr.o
 obj-$(CONFIG_NFT_META)         += nft_meta.o
 obj-$(CONFIG_NFT_RT)           += nft_rt.o
+obj-$(CONFIG_NFT_RT_INET)      += nft_rt_inet.o
 obj-$(CONFIG_NFT_NUMGEN)       += nft_numgen.o
 obj-$(CONFIG_NFT_CT)           += nft_ct.o
 obj-$(CONFIG_NFT_LIMIT)                += nft_limit.o
diff --git a/net/netfilter/nft_rt_inet.c b/net/netfilter/nft_rt_inet.c
--- /dev/null
+++ b/net/netfilter/nft_rt_inet.c
@@ -0,0 +1,150 @@
+/*
+ * Copyright (c) 2016 Anders K. Pedersen <a...@cohaesio.com>
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License version 2 as
+ * published by the Free Software Foundation.
+ *
+ */
+
+#include <linux/kernel.h>
+#include <linux/init.h>
+#include <linux/module.h>
+#include <linux/netlink.h>
+#include <linux/netfilter.h>
+#include <linux/netfilter/nf_tables.h>
+#include <net/ip6_route.h>
+#include <net/route.h>
+#include <net/netfilter/nf_tables.h>
+#include <net/netfilter/nft_rt.h>
+
+/*
+ * Evaluate an "rt" expression for a packet seen in an inet table.
+ *
+ * NFT_RT_NEXTHOP is resolved here for IPv4 and IPv6 packets by copying the
+ * nexthop address of the route attached to the skb into the destination
+ * register. Any other key on an IPv4/IPv6 packet is handed to
+ * nft_rt_get_eval(). If the packet family differs from the family stored
+ * in the expression, or no route is attached to the skb, the verdict is
+ * set to NFT_BREAK.
+ */
+static void nft_rt_inet_get_eval(const struct nft_expr *expr,
+                                struct nft_regs *regs,
+                                const struct nft_pktinfo *pkt)
+{
+       const struct nft_rt *priv = nft_expr_priv(expr);
+       const struct sk_buff *skb = pkt->skb;
+       u32 *dest = &regs->data[priv->dreg];
+
+       if (unlikely(pkt->pf != priv->family)) {
+               WARN_ONCE(1, "Address families do not match\n");
+               goto err;
+       }
+
+       /* Neither IPv4 nor IPv6: nothing is written and no verdict is set */
+       if (pkt->pf != NFPROTO_IPV4 && pkt->pf != NFPROTO_IPV6)
+               return;
+
+       /* Every key except the nexthop is delegated to nft_rt_get_eval() */
+       if (priv->key != NFT_RT_NEXTHOP) {
+               nft_rt_get_eval(expr, regs, pkt);
+               return;
+       }
+
+       if (pkt->pf == NFPROTO_IPV4) {
+               const struct rtable *rt4 = skb_rtable(skb);
+
+               if (!rt4)
+                       goto err;
+               *dest = rt_nexthop(rt4, ip_hdr(skb)->daddr);
+       } else {
+               struct rt6_info *rt6 = (struct rt6_info *)skb_dst(skb);
+
+               if (!rt6)
+                       goto err;
+               /* An IPv6 nexthop fills sizeof(struct in6_addr) bytes of register space */
+               memcpy(dest, rt6_nexthop(rt6, &ipv6_hdr(skb)->daddr),
+                      sizeof(struct in6_addr));
+       }
+       return;
+
+err:
+       regs->verdict.code = NFT_BREAK;
+}
+
+/*
+ * Set up an inet-family "rt" expression from its netlink attributes.
+ *
+ * NFTA_RT_FAMILY must be present. For NFT_RT_NEXTHOP the destination
+ * register is validated for sizeof(u32) bytes (NFPROTO_IPV4) or
+ * sizeof(struct in6_addr) bytes (NFPROTO_IPV6); any other family is
+ * rejected with -EINVAL. Every other key is handed to nft_rt_get_init().
+ *
+ * Returns -EINVAL as described above, otherwise whatever
+ * nft_validate_register_store() or nft_rt_get_init() returns.
+ */
+static int nft_rt_inet_get_init(const struct nft_ctx *ctx,
+                               const struct nft_expr *expr,
+                               const struct nlattr * const tb[])
+{
+       struct nft_rt *priv = nft_expr_priv(expr);
+       unsigned int len;
+
+       /* nft_rt_inet_select_ops() checks only NFTA_RT_KEY and NFTA_RT_DREG */
+       if (!tb[NFTA_RT_FAMILY])
+               return -EINVAL;
+
+       priv->key = ntohl(nla_get_be32(tb[NFTA_RT_KEY]));
+       priv->family = ntohl(nla_get_be32(tb[NFTA_RT_FAMILY]));
+       switch (priv->key) {
+       case NFT_RT_NEXTHOP:
+               /*
+                * The validated length must match what the eval function
+                * stores: one u32 for IPv4, a full in6_addr for IPv6.
+                */
+               switch (priv->family) {
+               case NFPROTO_IPV4:
+                       len = sizeof(u32);
+                       break;
+               case NFPROTO_IPV6:
+                       len = sizeof(struct in6_addr);
+                       break;
+               default:
+                       return -EINVAL;
+               }
+               break;
+       default:
+               return nft_rt_get_init(ctx, expr, tb);
+       }
+
+       priv->dreg = nft_parse_register(tb[NFTA_RT_DREG]);
+       return nft_validate_register_store(ctx, priv->dreg, NULL,
+                                          NFT_DATA_VALUE, len);
+}
+
+static struct nft_expr_type nft_rt_inet_type; /* defined further down */
+static const struct nft_expr_ops nft_rt_inet_get_ops = { /* ops for "rt" loads */
+       .type           = &nft_rt_inet_type,
+       .size           = NFT_EXPR_SIZE(sizeof(struct nft_rt)),
+       .eval           = nft_rt_inet_get_eval, /* inet-specific evaluation */
+       .init           = nft_rt_inet_get_init, /* inet-specific setup */
+       .dump           = nft_rt_get_dump, /* not defined in this file */
+};
+
+/*
+ * Pick the ops for an inet "rt" expression.
+ *
+ * Both NFTA_RT_KEY and NFTA_RT_DREG have to be supplied; if either one is
+ * missing, ERR_PTR(-EINVAL) is returned instead of an ops pointer.
+ */
+static const struct nft_expr_ops *
+nft_rt_inet_select_ops(const struct nft_ctx *ctx,
+                      const struct nlattr * const tb[])
+{
+       if (!tb[NFTA_RT_KEY] || !tb[NFTA_RT_DREG])
+               return ERR_PTR(-EINVAL);
+
+       return &nft_rt_inet_get_ops;
+}
+
+static struct nft_expr_type nft_rt_inet_type __read_mostly = { /* inet "rt" type */
+       .family         = NFPROTO_INET,
+       .name           = "rt",
+       .select_ops     = &nft_rt_inet_select_ops, /* requires KEY and DREG */
+       .policy         = nft_rt_policy, /* not defined in this file */
+       .maxattr        = NFTA_RT_MAX,
+       .owner          = THIS_MODULE,
+};
+
+static int __init nft_rt_inet_module_init(void) /* passed to module_init() */
+{
+       return nft_register_expr(&nft_rt_inet_type); /* add inet "rt" type */
+}
+
+static void __exit nft_rt_inet_module_exit(void) /* passed to module_exit() */
+{
+       nft_unregister_expr(&nft_rt_inet_type); /* drop inet "rt" type */
+}
+
+module_init(nft_rt_inet_module_init); /* registers the expression type */
+module_exit(nft_rt_inet_module_exit); /* unregisters the expression type */
+
+MODULE_LICENSE("GPL");
+MODULE_AUTHOR("Anders K. Pedersen <a...@cohaesio.com>");
+MODULE_ALIAS_NFT_AF_EXPR(1, "rt"); /* family 1: presumably NFPROTO_INET - verify */

Reply via email to