2 * Copyright (c) 2008-2009 Patrick McHardy <kaber@trash.net>
3 * Copyright (c) 2014 Intel Corporation
4 * Author: Tomasz Bursztyka <tomasz.bursztyka@linux.intel.com>
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 as
8 * published by the Free Software Foundation.
10 * Development of this code funded by Astaro AG (http://www.astaro.com/)
13 #include <linux/kernel.h>
14 #include <linux/netlink.h>
15 #include <linux/netfilter.h>
16 #include <linux/netfilter/nf_tables.h>
19 #include <linux/ipv6.h>
20 #include <linux/smp.h>
21 #include <linux/static_key.h>
24 #include <net/tcp_states.h> /* for TCP_TIME_WAIT */
25 #include <net/netfilter/nf_tables.h>
26 #include <net/netfilter/nf_tables_core.h>
28 #include <uapi/linux/netfilter_bridge.h> /* NF_BR_PRE_ROUTING */
/*
 * Private data of a meta expression: the meta key and a register index,
 * each stored as an 8-bit bit-field.
 * NOTE(review): the enclosing struct header is not part of this listing;
 * dreg (destination, used by the get path) and sreg (source, used by the
 * set path) presumably share storage -- confirm against the full
 * declaration.
 */
31 enum nft_meta_keys key:8;
33 enum nft_registers dreg:8;
34 enum nft_registers sreg:8;
/*
 * Per-CPU pseudo-random generator state. It is read through this_cpu_ptr()
 * by the NFT_META_PRANDOM case of nft_meta_get_eval() and initialised via
 * prandom_init_once() in nft_meta_get_init().
 */
38 static DEFINE_PER_CPU(struct rnd_state, nft_prandom_state);
40 #ifdef CONFIG_NF_TABLES_BRIDGE
41 #include "../bridge/br_private.h"
/*
 * nft_meta_get_eval - load one piece of packet metadata into a register.
 *
 * @expr: expression whose private data (struct nft_meta) supplies the
 *        destination register index (priv->dreg)
 * @regs: register file; results are written starting at
 *        regs->data[priv->dreg]
 * @pkt:  packet information; pkt->skb and the devices returned by
 *        nft_in()/nft_out() are the data sources
 *
 * Each case handles one NFT_META_* key. 8- and 16-bit values are written
 * with nft_reg_store8()/nft_reg_store16(), 32-bit values are assigned to
 * *dest directly, and names are copied with strncpy() bounded by IFNAMSIZ.
 * The last visible statement sets regs->verdict.code to NFT_BREAK.
 *
 * NOTE(review): this listing has lines missing (braces, the switch header,
 * several case labels, break statements and whatever jumps to the
 * NFT_BREAK assignment) -- check the complete file before relying on the
 * exact control flow.
 */
44 void nft_meta_get_eval(const struct nft_expr *expr,
45 struct nft_regs *regs,
46 const struct nft_pktinfo *pkt)
48 const struct nft_meta *priv = nft_expr_priv(expr);
49 const struct sk_buff *skb = pkt->skb;
50 const struct net_device *in = nft_in(pkt), *out = nft_out(pkt);
/*
 * NOTE(review): "®s" looks like a mis-encoded "&regs" (HTML-entity
 * damage); the intended expression is presumably
 * &regs->data[priv->dreg] -- confirm and repair.
 */
52 u32 *dest = ®s->data[priv->dreg];
53 #ifdef CONFIG_NF_TABLES_BRIDGE
/* Bridge port used by the NFT_META_BRI_* cases below. */
54 const struct net_bridge_port *p;
61 case NFT_META_PROTOCOL:
/* skb->protocol is stored without any byte-order conversion. */
62 nft_reg_store16(dest, (__force u16)skb->protocol);
64 case NFT_META_NFPROTO:
65 nft_reg_store8(dest, nft_pf(pkt));
67 case NFT_META_L4PROTO:
/* NOTE(review): two lines are missing before this store -- content unknown. */
70 nft_reg_store8(dest, pkt->tprot);
72 case NFT_META_PRIORITY:
73 *dest = skb->priority;
88 case NFT_META_IIFNAME:
/*
 * Copy at most IFNAMSIZ bytes of the input device name into the register
 * area starting at dest. Any NULL check on "in" is not shown here.
 */
91 strncpy((char *)dest, in->name, IFNAMSIZ);
93 case NFT_META_OIFNAME:
/* Same as above for the output device. */
96 strncpy((char *)dest, out->name, IFNAMSIZ);
98 case NFT_META_IIFTYPE:
/* Device type of the input device, stored as a 16-bit value. */
101 nft_reg_store16(dest, in->type);
103 case NFT_META_OIFTYPE:
106 nft_reg_store16(dest, out->type);
/*
 * Socket owner uid (the case label is not shown; presumably
 * NFT_META_SKUID). Requires a full socket that lives in the same network
 * namespace as nft_net(pkt). sk_callback_lock is read-held while
 * sk->sk_socket->file is inspected, and is dropped again on both the
 * "no socket/file" path and the success path.
 */
109 sk = skb_to_full_sk(skb);
110 if (!sk || !sk_fullsock(sk) ||
111 !net_eq(nft_net(pkt), sock_net(sk)))
114 read_lock_bh(&sk->sk_callback_lock);
115 if (sk->sk_socket == NULL ||
116 sk->sk_socket->file == NULL) {
117 read_unlock_bh(&sk->sk_callback_lock);
/* fsuid of the file's credentials, mapped through init_user_ns. */
121 *dest = from_kuid_munged(&init_user_ns,
122 sk->sk_socket->file->f_cred->fsuid);
123 read_unlock_bh(&sk->sk_callback_lock);
/*
 * Socket owner gid (case label not shown; presumably NFT_META_SKGID).
 * Same socket checks and locking as the uid lookup above.
 */
126 sk = skb_to_full_sk(skb);
127 if (!sk || !sk_fullsock(sk) ||
128 !net_eq(nft_net(pkt), sock_net(sk)))
131 read_lock_bh(&sk->sk_callback_lock);
132 if (sk->sk_socket == NULL ||
133 sk->sk_socket->file == NULL) {
134 read_unlock_bh(&sk->sk_callback_lock);
/* fsgid of the file's credentials, mapped through init_user_ns. */
137 *dest = from_kgid_munged(&init_user_ns,
138 sk->sk_socket->file->f_cred->fsgid);
139 read_unlock_bh(&sk->sk_callback_lock);
141 #ifdef CONFIG_IP_ROUTE_CLASSID
142 case NFT_META_RTCLASSID: {
/*
 * Routing class id taken from the skb's dst entry. Any NULL check on dst
 * is on lines not shown.
 */
143 const struct dst_entry *dst = skb_dst(skb);
147 *dest = dst->tclassid;
151 #ifdef CONFIG_NETWORK_SECMARK
152 case NFT_META_SECMARK:
153 *dest = skb->secmark;
156 case NFT_META_PKTTYPE:
/* Any packet type other than PACKET_LOOPBACK is stored unchanged. */
157 if (skb->pkt_type != PACKET_LOOPBACK) {
158 nft_reg_store8(dest, skb->pkt_type);
/*
 * The code below picks PACKET_MULTICAST or PACKET_BROADCAST, switching
 * first on nft_pf(pkt) and then on skb->protocol. Presumably this is the
 * PACKET_LOOPBACK path; the connecting lines and the case labels of the
 * outer switch are not shown.
 */
162 switch (nft_pf(pkt)) {
/* IPv4 destination multicast -> MULTICAST, otherwise presumably BROADCAST. */
164 if (ipv4_is_multicast(ip_hdr(skb)->daddr))
165 nft_reg_store8(dest, PACKET_MULTICAST);
167 nft_reg_store8(dest, PACKET_BROADCAST);
170 nft_reg_store8(dest, PACKET_MULTICAST);
173 switch (skb->protocol) {
174 case htons(ETH_P_IP): {
175 int noff = skb_network_offset(skb);
176 struct iphdr *iph, _iph;
/*
 * Fetch the IPv4 header at the network offset through
 * skb_header_pointer(), with _iph as the caller-supplied buffer. The
 * check of the returned pointer is not shown.
 */
178 iph = skb_header_pointer(skb, noff,
179 sizeof(_iph), &_iph);
183 if (ipv4_is_multicast(iph->daddr))
184 nft_reg_store8(dest, PACKET_MULTICAST);
186 nft_reg_store8(dest, PACKET_BROADCAST);
190 case htons(ETH_P_IPV6):
191 nft_reg_store8(dest, PACKET_MULTICAST);
/* Id of the CPU running this evaluation (case label not shown). */
204 *dest = raw_smp_processor_id();
/* NOTE(review): the bodies of the two group cases are missing from this listing. */
206 case NFT_META_IIFGROUP:
211 case NFT_META_OIFGROUP:
216 #ifdef CONFIG_CGROUP_NET_CLASSID
217 case NFT_META_CGROUP:
/* Same full-socket / same-netns requirement as the uid and gid lookups. */
218 sk = skb_to_full_sk(skb);
219 if (!sk || !sk_fullsock(sk) ||
220 !net_eq(nft_net(pkt), sock_net(sk)))
222 *dest = sock_cgroup_classid(&sk->sk_cgrp_data);
225 case NFT_META_PRANDOM: {
/* Draw a 32-bit value from this CPU's nft_prandom_state. */
226 struct rnd_state *state = this_cpu_ptr(&nft_prandom_state);
227 *dest = prandom_u32_state(state);
231 case NFT_META_SECPATH:
/* Result of secpath_exists(skb), stored as an 8-bit value. */
232 nft_reg_store8(dest, secpath_exists(skb));
235 #ifdef CONFIG_NF_TABLES_BRIDGE
236 case NFT_META_BRI_IIFNAME:
/*
 * Resolve the bridge port of the input device; when there is no device or
 * no port the (not shown) failure path is taken. Otherwise the name of
 * the bridge device owning the port is copied.
 */
237 if (in == NULL || (p = br_port_get_rcu(in)) == NULL)
239 strncpy((char *)dest, p->br->dev->name, IFNAMSIZ);
241 case NFT_META_BRI_OIFNAME:
/* Same as above for the output device. */
242 if (out == NULL || (p = br_port_get_rcu(out)) == NULL)
244 strncpy((char *)dest, p->br->dev->name, IFNAMSIZ);
247 case NFT_META_IIFKIND:
/* Link kind string of the input device; needs in->rtnl_link_ops to be set. */
248 if (in == NULL || in->rtnl_link_ops == NULL)
250 strncpy((char *)dest, in->rtnl_link_ops->kind, IFNAMSIZ);
252 case NFT_META_OIFKIND:
253 if (out == NULL || out->rtnl_link_ops == NULL)
255 strncpy((char *)dest, out->rtnl_link_ops->kind, IFNAMSIZ);
/*
 * Verdict set to NFT_BREAK. Presumably this is the shared failure exit
 * reached when a value is unavailable; the label and the jumps to it are
 * not shown.
 */
264 regs->verdict.code = NFT_BREAK;
/*
 * nft_meta_set_eval - write a register value into packet metadata.
 *
 * @expr: expression whose private data (struct nft_meta) supplies the
 *        source register index (meta->sreg)
 * @regs: register file the value is read from
 * @pkt:  packet information; pkt->skb is the object being modified
 *
 * Visible cases: priority, packet type, nftrace flag and (when
 * CONFIG_NETWORK_SECMARK is set) secmark.
 *
 * NOTE(review): the declarations of "value" and "value8", the switch
 * header, the break statements and possibly further cases are missing from
 * this listing.
 */
267 static void nft_meta_set_eval(const struct nft_expr *expr,
268 struct nft_regs *regs,
269 const struct nft_pktinfo *pkt)
271 const struct nft_meta *meta = nft_expr_priv(expr);
272 struct sk_buff *skb = pkt->skb;
/*
 * NOTE(review): "®s" looks like a mis-encoded "&regs" (HTML-entity
 * damage); the intended expression is presumably
 * &regs->data[meta->sreg] -- confirm and repair.
 */
273 u32 *sreg = ®s->data[meta->sreg];
281 case NFT_META_PRIORITY:
282 skb->priority = value;
284 case NFT_META_PKTTYPE:
285 value8 = nft_reg_load8(sreg);
/*
 * Only rewrite pkt_type when it actually changes and both the new and the
 * current value pass skb_pkt_type_ok().
 */
287 if (skb->pkt_type != value8 &&
288 skb_pkt_type_ok(value8) &&
289 skb_pkt_type_ok(skb->pkt_type))
290 skb->pkt_type = value8;
292 case NFT_META_NFTRACE:
293 value8 = nft_reg_load8(sreg);
/* Any non-zero register value turns tracing on ("!!" normalises to 0/1). */
295 skb->nf_trace = !!value8;
297 #ifdef CONFIG_NETWORK_SECMARK
298 case NFT_META_SECMARK:
299 skb->secmark = value;
/*
 * Netlink attribute policy for the meta expression: destination register,
 * key and source register are all declared as NLA_U32.
 */
307 static const struct nla_policy nft_meta_policy[NFTA_META_MAX + 1] = {
308 [NFTA_META_DREG] = { .type = NLA_U32 },
309 [NFTA_META_KEY] = { .type = NLA_U32 },
310 [NFTA_META_SREG] = { .type = NLA_U32 },
/*
 * nft_meta_get_init - set up a "get" meta expression from netlink
 * attributes.
 *
 * @ctx:  rule context; ctx->family is checked for the bridge-only keys
 * @expr: expression whose private struct nft_meta is filled in
 * @tb:   parsed attributes; NFTA_META_KEY and NFTA_META_DREG are read
 *
 * Returns the result of nft_validate_register_store() for the destination
 * register on the visible success path.
 *
 * NOTE(review): the switch header, the per-group "len" assignments, the
 * break statements and the error returns are missing from this listing;
 * "len" is presumably the number of bytes the key stores.
 */
313 static int nft_meta_get_init(const struct nft_ctx *ctx,
314 const struct nft_expr *expr,
315 const struct nlattr * const tb[])
317 struct nft_meta *priv = nft_expr_priv(expr);
/* The key arrives as a big-endian 32-bit attribute. */
320 priv->key = ntohl(nla_get_be32(tb[NFTA_META_KEY]));
/* Keys are grouped below; each group presumably shares one "len" value. */
322 case NFT_META_PROTOCOL:
323 case NFT_META_IIFTYPE:
324 case NFT_META_OIFTYPE:
327 case NFT_META_NFPROTO:
328 case NFT_META_L4PROTO:
330 case NFT_META_PRIORITY:
336 #ifdef CONFIG_IP_ROUTE_CLASSID
337 case NFT_META_RTCLASSID:
339 #ifdef CONFIG_NETWORK_SECMARK
340 case NFT_META_SECMARK:
342 case NFT_META_PKTTYPE:
344 case NFT_META_IIFGROUP:
345 case NFT_META_OIFGROUP:
346 #ifdef CONFIG_CGROUP_NET_CLASSID
347 case NFT_META_CGROUP:
351 case NFT_META_IIFNAME:
352 case NFT_META_OIFNAME:
353 case NFT_META_IIFKIND:
354 case NFT_META_OIFKIND:
357 case NFT_META_PRANDOM:
/* One-time initialisation of the per-CPU state used at evaluation time. */
358 prandom_init_once(&nft_prandom_state);
362 case NFT_META_SECPATH:
366 #ifdef CONFIG_NF_TABLES_BRIDGE
367 case NFT_META_BRI_IIFNAME:
368 case NFT_META_BRI_OIFNAME:
/*
 * The bridge keys are checked against the rule's family; the statement
 * executed for a non-bridge family is not shown (presumably an error
 * return).
 */
369 if (ctx->family != NFPROTO_BRIDGE)
/* Resolve the destination register and validate a store of "len" bytes. */
378 priv->dreg = nft_parse_register(tb[NFTA_META_DREG]);
379 return nft_validate_register_store(ctx, priv->dreg, NULL,
380 NFT_DATA_VALUE, len);
/*
 * nft_meta_get_validate - restrict where a "get" meta expression may be
 * used.
 *
 * @ctx:  rule context; ctx->family selects the hook mask and ctx->chain is
 *        the chain being validated
 * @expr: expression whose key is inspected
 * @data: not referenced in the visible lines
 *
 * Only NFT_META_SECPATH is subject to the hook check; the statement taken
 * for every other key is not shown (presumably an early "return 0").
 * Returns the result of nft_chain_validate_hooks() on the visible path.
 *
 * NOTE(review): the case labels of the family switch and the declaration
 * of "hooks" are missing from this listing.
 */
383 static int nft_meta_get_validate(const struct nft_ctx *ctx,
384 const struct nft_expr *expr,
385 const struct nft_data **data)
388 const struct nft_meta *priv = nft_expr_priv(expr);
391 if (priv->key != NFT_META_SECPATH)
394 switch (ctx->family) {
/* One family (label not shown) is limited to the netdev ingress hook. */
396 hooks = 1 << NF_NETDEV_INGRESS;
/* Other families (labels not shown): prerouting, local-in and forward. */
401 hooks = (1 << NF_INET_PRE_ROUTING) |
402 (1 << NF_INET_LOCAL_IN) |
403 (1 << NF_INET_FORWARD);
409 return nft_chain_validate_hooks(ctx->chain, hooks);
/*
 * nft_meta_set_validate - restrict where a "set" meta expression may be
 * used.
 *
 * @ctx:  rule context; ctx->family selects the hook mask and ctx->chain is
 *        the chain being validated
 * @expr: expression whose key is inspected
 * @data: not referenced in the visible lines
 *
 * Only NFT_META_PKTTYPE is subject to the hook check; the statement taken
 * for every other key is not shown (presumably an early "return 0").
 * Returns the result of nft_chain_validate_hooks() on the visible path.
 *
 * NOTE(review): the case labels of the family switch and the declaration
 * of "hooks" are missing from this listing.
 */
415 static int nft_meta_set_validate(const struct nft_ctx *ctx,
416 const struct nft_expr *expr,
417 const struct nft_data **data)
419 struct nft_meta *priv = nft_expr_priv(expr);
422 if (priv->key != NFT_META_PKTTYPE)
425 switch (ctx->family) {
/* Three alternatives follow; each permits exactly one hook. */
427 hooks = 1 << NF_BR_PRE_ROUTING;
430 hooks = 1 << NF_NETDEV_INGRESS;
435 hooks = 1 << NF_INET_PRE_ROUTING;
441 return nft_chain_validate_hooks(ctx->chain, hooks);
/*
 * nft_meta_set_init - set up a "set" meta expression from netlink
 * attributes.
 *
 * @ctx:  rule context (not referenced in the visible lines)
 * @expr: expression whose private struct nft_meta is filled in
 * @tb:   parsed attributes; NFTA_META_KEY and NFTA_META_SREG are read
 *
 * NOTE(review): the switch header, the per-key "len" assignments, the
 * check of "err" and the return statements are missing from this listing.
 */
444 static int nft_meta_set_init(const struct nft_ctx *ctx,
445 const struct nft_expr *expr,
446 const struct nlattr * const tb[])
448 struct nft_meta *priv = nft_expr_priv(expr);
/* The key arrives as a big-endian 32-bit attribute. */
452 priv->key = ntohl(nla_get_be32(tb[NFTA_META_KEY]));
455 case NFT_META_PRIORITY:
456 #ifdef CONFIG_NETWORK_SECMARK
457 case NFT_META_SECMARK:
461 case NFT_META_NFTRACE:
464 case NFT_META_PKTTYPE:
/* Resolve the source register and validate a load of "len" bytes. */
471 priv->sreg = nft_parse_register(tb[NFTA_META_SREG]);
472 err = nft_validate_register_load(priv->sreg, len);
/*
 * An nftrace setter bumps the nft_trace_enabled static key;
 * nft_meta_set_destroy() performs the matching decrement.
 */
476 if (priv->key == NFT_META_NFTRACE)
477 static_branch_inc(&nft_trace_enabled);
/*
 * nft_meta_get_dump - emit the attributes of a "get" meta expression.
 *
 * @skb:  netlink message being built
 * @expr: expression to dump
 *
 * Writes the key (converted to big-endian) and the destination register.
 * A failing put jumps to the nla_put_failure label.
 *
 * NOTE(review): the label itself and both return statements are missing
 * from this listing.
 */
482 static int nft_meta_get_dump(struct sk_buff *skb,
483 const struct nft_expr *expr)
485 const struct nft_meta *priv = nft_expr_priv(expr);
487 if (nla_put_be32(skb, NFTA_META_KEY, htonl(priv->key)))
488 goto nla_put_failure;
489 if (nft_dump_register(skb, NFTA_META_DREG, priv->dreg))
490 goto nla_put_failure;
/*
 * nft_meta_set_dump - emit the attributes of a "set" meta expression.
 *
 * @skb:  netlink message being built
 * @expr: expression to dump
 *
 * Writes the key (converted to big-endian) and the source register.
 * A failing put jumps to the nla_put_failure label.
 *
 * NOTE(review): the label itself and both return statements are missing
 * from this listing.
 */
497 static int nft_meta_set_dump(struct sk_buff *skb, const struct nft_expr *expr)
499 const struct nft_meta *priv = nft_expr_priv(expr);
501 if (nla_put_be32(skb, NFTA_META_KEY, htonl(priv->key)))
502 goto nla_put_failure;
503 if (nft_dump_register(skb, NFTA_META_SREG, priv->sreg))
504 goto nla_put_failure;
/*
 * nft_meta_set_destroy - release what nft_meta_set_init() acquired.
 *
 * @ctx:  rule context (not referenced)
 * @expr: expression being destroyed
 *
 * For an nftrace setter this drops the nft_trace_enabled static-key
 * reference taken in nft_meta_set_init(). Other keys need no cleanup in
 * the visible code.
 */
512 static void nft_meta_set_destroy(const struct nft_ctx *ctx,
513 const struct nft_expr *expr)
515 const struct nft_meta *priv = nft_expr_priv(expr);
517 if (priv->key == NFT_META_NFTRACE)
518 static_branch_dec(&nft_trace_enabled);
/*
 * Operations of the "get" flavour of the meta expression (chosen by
 * nft_meta_select_ops() when NFTA_META_DREG is present). The private area
 * is sized for one struct nft_meta. No .destroy callback is set here.
 */
521 static const struct nft_expr_ops nft_meta_get_ops = {
522 .type = &nft_meta_type,
523 .size = NFT_EXPR_SIZE(sizeof(struct nft_meta)),
524 .eval = nft_meta_get_eval,
525 .init = nft_meta_get_init,
526 .dump = nft_meta_get_dump,
527 .validate = nft_meta_get_validate,
/*
 * Operations of the "set" flavour of the meta expression (chosen by
 * nft_meta_select_ops() when NFTA_META_SREG is present). Unlike the "get"
 * flavour it has a .destroy callback, which undoes the static-key
 * increment done by nft_meta_set_init().
 */
530 static const struct nft_expr_ops nft_meta_set_ops = {
531 .type = &nft_meta_type,
532 .size = NFT_EXPR_SIZE(sizeof(struct nft_meta)),
533 .eval = nft_meta_set_eval,
534 .init = nft_meta_set_init,
535 .destroy = nft_meta_set_destroy,
536 .dump = nft_meta_set_dump,
537 .validate = nft_meta_set_validate,
/*
 * nft_meta_select_ops - choose between the "get" and "set" operations.
 *
 * @ctx: rule context (not referenced)
 * @tb:  parsed netlink attributes
 *
 * Returns &nft_meta_get_ops when NFTA_META_DREG is present and
 * &nft_meta_set_ops when NFTA_META_SREG is present. Returns
 * ERR_PTR(-EINVAL) when the key is missing, when both registers are given,
 * or when neither is given.
 */
540 static const struct nft_expr_ops *
541 nft_meta_select_ops(const struct nft_ctx *ctx,
542 const struct nlattr * const tb[])
/* A key is mandatory for both flavours. */
544 if (tb[NFTA_META_KEY] == NULL)
545 return ERR_PTR(-EINVAL);
/* Destination and source register are mutually exclusive. */
547 if (tb[NFTA_META_DREG] && tb[NFTA_META_SREG])
548 return ERR_PTR(-EINVAL);
550 if (tb[NFTA_META_DREG])
551 return &nft_meta_get_ops;
553 if (tb[NFTA_META_SREG])
554 return &nft_meta_set_ops;
/* Neither register attribute was supplied. */
556 return ERR_PTR(-EINVAL);
/*
 * Expression type descriptor for meta. The concrete ops are picked per
 * rule by nft_meta_select_ops(), and attributes are parsed against
 * nft_meta_policy.
 * NOTE(review): one initialiser line is missing from this listing between
 * the opening line and .select_ops -- content unknown.
 */
559 struct nft_expr_type nft_meta_type __read_mostly = {
561 .select_ops = nft_meta_select_ops,
562 .policy = nft_meta_policy,
563 .maxattr = NFTA_META_MAX,
564 .owner = THIS_MODULE,
567 #ifdef CONFIG_NETWORK_SECMARK
/*
 * Netlink attribute policy for the secmark object: the security context is
 * a string attribute whose length is bounded by NFT_SECMARK_CTX_MAXLEN.
 */
573 static const struct nla_policy nft_secmark_policy[NFTA_SECMARK_MAX + 1] = {
574 [NFTA_SECMARK_CTX] = { .type = NLA_STRING, .len = NFT_SECMARK_CTX_MAXLEN },
/*
 * nft_secmark_compute_secid - translate priv->ctx into a security id.
 *
 * @priv: secmark object data; priv->ctx is the input string and
 *        priv->secid receives the result
 *
 * The context string is converted with security_secctx_to_secid(), the
 * resulting id is passed to security_secmark_relabel_packet(), and the id
 * is then stored in priv->secid.
 *
 * NOTE(review): the local declarations, the checks of "err" after each
 * call and the return statements are missing from this listing; the store
 * to priv->secid presumably happens only when both calls succeed.
 */
577 static int nft_secmark_compute_secid(struct nft_secmark *priv)
582 err = security_secctx_to_secid(priv->ctx, strlen(priv->ctx), &tmp_secid);
589 err = security_secmark_relabel_packet(tmp_secid);
593 priv->secid = tmp_secid;
/*
 * nft_secmark_obj_eval - stamp the packet with the object's security id.
 *
 * @obj:  secmark object; its private data holds the precomputed secid
 * @regs: register file (not referenced)
 * @pkt:  packet information; pkt->skb->secmark is overwritten
 */
597 static void nft_secmark_obj_eval(struct nft_object *obj, struct nft_regs *regs,
598 const struct nft_pktinfo *pkt)
600 const struct nft_secmark *priv = nft_obj_data(obj);
601 struct sk_buff *skb = pkt->skb;
603 skb->secmark = priv->secid;
/*
 * nft_secmark_obj_init - create a secmark object from netlink attributes.
 *
 * @ctx: rule context (not referenced in the visible lines)
 * @tb:  parsed attributes; NFTA_SECMARK_CTX is required
 * @obj: object whose private struct nft_secmark is filled in
 *
 * Duplicates the context string into priv->ctx, resolves it with
 * nft_secmark_compute_secid() and calls security_secmark_refcount_inc().
 *
 * NOTE(review): the error handling (missing attribute, failed allocation,
 * failed secid lookup) and the return statements are missing from this
 * listing.
 */
606 static int nft_secmark_obj_init(const struct nft_ctx *ctx,
607 const struct nlattr * const tb[],
608 struct nft_object *obj)
610 struct nft_secmark *priv = nft_obj_data(obj);
613 if (tb[NFTA_SECMARK_CTX] == NULL)
/* priv->ctx owns a copy of the attribute string from here on. */
616 priv->ctx = nla_strdup(tb[NFTA_SECMARK_CTX], GFP_KERNEL);
620 err = nft_secmark_compute_secid(priv);
/* Balanced by security_secmark_refcount_dec() in nft_secmark_obj_destroy(). */
626 security_secmark_refcount_inc();
/*
 * nft_secmark_obj_dump - emit the attributes of a secmark object.
 *
 * @skb: netlink message being built
 * @obj: object to dump
 *
 * Writes the stored context string as NFTA_SECMARK_CTX. The visible code
 * also calls nft_secmark_compute_secid() again, which refreshes
 * priv->secid.
 *
 * NOTE(review): the end of the parameter list, any condition guarding the
 * recomputation, the error checks and the return statements are missing
 * from this listing.
 */
631 static int nft_secmark_obj_dump(struct sk_buff *skb, struct nft_object *obj,
634 struct nft_secmark *priv = nft_obj_data(obj);
637 if (nla_put_string(skb, NFTA_SECMARK_CTX, priv->ctx))
641 err = nft_secmark_compute_secid(priv);
/*
 * nft_secmark_obj_destroy - tear down a secmark object.
 *
 * @ctx: rule context (not referenced)
 * @obj: object being destroyed
 *
 * Drops the reference taken by security_secmark_refcount_inc() in
 * nft_secmark_obj_init().
 *
 * NOTE(review): priv->ctx is allocated with nla_strdup() in
 * nft_secmark_obj_init(); no matching free is visible in this listing, and
 * the tail of the function is missing -- confirm the string is released in
 * the full file.
 */
649 static void nft_secmark_obj_destroy(const struct nft_ctx *ctx, struct nft_object *obj)
651 struct nft_secmark *priv = nft_obj_data(obj);
653 security_secmark_refcount_dec();
/*
 * Operations of the secmark object; the private area is sized for one
 * struct nft_secmark.
 */
658 static const struct nft_object_ops nft_secmark_obj_ops = {
659 .type = &nft_secmark_obj_type,
660 .size = sizeof(struct nft_secmark),
661 .init = nft_secmark_obj_init,
662 .eval = nft_secmark_obj_eval,
663 .dump = nft_secmark_obj_dump,
664 .destroy = nft_secmark_obj_destroy,
/*
 * Object type descriptor for NFT_OBJECT_SECMARK. It ties the object type
 * to nft_secmark_obj_ops and to the nft_secmark_policy attribute policy.
 */
666 struct nft_object_type nft_secmark_obj_type __read_mostly = {
667 .type = NFT_OBJECT_SECMARK,
668 .ops = &nft_secmark_obj_ops,
669 .maxattr = NFTA_SECMARK_MAX,
670 .policy = nft_secmark_policy,
671 .owner = THIS_MODULE,
673 #endif /* CONFIG_NETWORK_SECMARK */