Commit 7adaf56e authored by David S. Miller's avatar David S. Miller

Merge git://git.kernel.org/pub/scm/linux/kernel/git/pablo/nf-next

Pablo Neira Ayuso says:

====================
Netfilter/IPVS updates for net-next

The following patchset contains Netfilter/IPVS for net-next:

1) Add new run_estimation toggle to IPVS to stop the estimation_timer
   logic, from Dust Li.

2) Relax superfluous dynset check on NFT_SET_TIMEOUT.

3) Add egress hook, from Lukas Wunner.

4) Nowadays, almost all hook functions in x_table land just call the hook
   evaluation loop. Remove remaining hook wrappers from iptables and IPVS.
   From Florian Westphal.
====================
Signed-off-by: default avatarDavid S. Miller <davem@davemloft.net>
parents c87350ce ffdd33dd
...@@ -300,3 +300,14 @@ sync_version - INTEGER ...@@ -300,3 +300,14 @@ sync_version - INTEGER
Kernels with this sync_version entry are able to receive messages Kernels with this sync_version entry are able to receive messages
of both version 1 and version 2 of the synchronisation protocol. of both version 1 and version 2 of the synchronisation protocol.
run_estimation - BOOLEAN
0 - disabled
not 0 - enabled (default)
If disabled, the estimation will be stop, and you can't see
any update on speed estimation data.
You can always re-enable estimation by setting this value to 1.
But be careful, the first estimation after re-enable is not
accurate.
...@@ -31,6 +31,7 @@ ...@@ -31,6 +31,7 @@
#include <linux/init.h> #include <linux/init.h>
#include <linux/interrupt.h> #include <linux/interrupt.h>
#include <linux/moduleparam.h> #include <linux/moduleparam.h>
#include <linux/netfilter_netdev.h>
#include <net/pkt_sched.h> #include <net/pkt_sched.h>
#include <net/net_namespace.h> #include <net/net_namespace.h>
...@@ -75,8 +76,10 @@ static void ifb_ri_tasklet(struct tasklet_struct *t) ...@@ -75,8 +76,10 @@ static void ifb_ri_tasklet(struct tasklet_struct *t)
} }
while ((skb = __skb_dequeue(&txp->tq)) != NULL) { while ((skb = __skb_dequeue(&txp->tq)) != NULL) {
/* Skip tc and netfilter to prevent redirection loop. */
skb->redirected = 0; skb->redirected = 0;
skb->tc_skip_classify = 1; skb->tc_skip_classify = 1;
nf_skip_egress(skb, true);
u64_stats_update_begin(&txp->tsync); u64_stats_update_begin(&txp->tsync);
txp->tx_packets++; txp->tx_packets++;
......
...@@ -1861,6 +1861,7 @@ enum netdev_ml_priv_type { ...@@ -1861,6 +1861,7 @@ enum netdev_ml_priv_type {
* @xps_maps: XXX: need comments on this one * @xps_maps: XXX: need comments on this one
* @miniq_egress: clsact qdisc specific data for * @miniq_egress: clsact qdisc specific data for
* egress processing * egress processing
* @nf_hooks_egress: netfilter hooks executed for egress packets
* @qdisc_hash: qdisc hash table * @qdisc_hash: qdisc hash table
* @watchdog_timeo: Represents the timeout that is used by * @watchdog_timeo: Represents the timeout that is used by
* the watchdog (see dev_watchdog()) * the watchdog (see dev_watchdog())
...@@ -2160,6 +2161,9 @@ struct net_device { ...@@ -2160,6 +2161,9 @@ struct net_device {
#ifdef CONFIG_NET_CLS_ACT #ifdef CONFIG_NET_CLS_ACT
struct mini_Qdisc __rcu *miniq_egress; struct mini_Qdisc __rcu *miniq_egress;
#endif #endif
#ifdef CONFIG_NETFILTER_EGRESS
struct nf_hook_entries __rcu *nf_hooks_egress;
#endif
#ifdef CONFIG_NET_SCHED #ifdef CONFIG_NET_SCHED
DECLARE_HASHTABLE (qdisc_hash, 4); DECLARE_HASHTABLE (qdisc_hash, 4);
......
...@@ -54,9 +54,8 @@ int arpt_register_table(struct net *net, const struct xt_table *table, ...@@ -54,9 +54,8 @@ int arpt_register_table(struct net *net, const struct xt_table *table,
const struct nf_hook_ops *ops); const struct nf_hook_ops *ops);
void arpt_unregister_table(struct net *net, const char *name); void arpt_unregister_table(struct net *net, const char *name);
void arpt_unregister_table_pre_exit(struct net *net, const char *name); void arpt_unregister_table_pre_exit(struct net *net, const char *name);
extern unsigned int arpt_do_table(struct sk_buff *skb, extern unsigned int arpt_do_table(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state, const struct nf_hook_state *state);
struct xt_table *table);
#ifdef CONFIG_NETFILTER_XTABLES_COMPAT #ifdef CONFIG_NETFILTER_XTABLES_COMPAT
#include <net/compat.h> #include <net/compat.h>
......
...@@ -112,9 +112,8 @@ extern int ebt_register_table(struct net *net, ...@@ -112,9 +112,8 @@ extern int ebt_register_table(struct net *net,
const struct nf_hook_ops *ops); const struct nf_hook_ops *ops);
extern void ebt_unregister_table(struct net *net, const char *tablename); extern void ebt_unregister_table(struct net *net, const char *tablename);
void ebt_unregister_table_pre_exit(struct net *net, const char *tablename); void ebt_unregister_table_pre_exit(struct net *net, const char *tablename);
extern unsigned int ebt_do_table(struct sk_buff *skb, extern unsigned int ebt_do_table(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state, const struct nf_hook_state *state);
struct ebt_table *table);
/* True if the hook mask denotes that the rule is in a base chain, /* True if the hook mask denotes that the rule is in a base chain,
* used in the check() functions */ * used in the check() functions */
......
...@@ -63,9 +63,9 @@ struct ipt_error { ...@@ -63,9 +63,9 @@ struct ipt_error {
} }
extern void *ipt_alloc_initial_table(const struct xt_table *); extern void *ipt_alloc_initial_table(const struct xt_table *);
extern unsigned int ipt_do_table(struct sk_buff *skb, extern unsigned int ipt_do_table(void *priv,
const struct nf_hook_state *state, struct sk_buff *skb,
struct xt_table *table); const struct nf_hook_state *state);
#ifdef CONFIG_NETFILTER_XTABLES_COMPAT #ifdef CONFIG_NETFILTER_XTABLES_COMPAT
#include <net/compat.h> #include <net/compat.h>
......
...@@ -29,9 +29,8 @@ int ip6t_register_table(struct net *net, const struct xt_table *table, ...@@ -29,9 +29,8 @@ int ip6t_register_table(struct net *net, const struct xt_table *table,
const struct nf_hook_ops *ops); const struct nf_hook_ops *ops);
void ip6t_unregister_table_pre_exit(struct net *net, const char *name); void ip6t_unregister_table_pre_exit(struct net *net, const char *name);
void ip6t_unregister_table_exit(struct net *net, const char *name); void ip6t_unregister_table_exit(struct net *net, const char *name);
extern unsigned int ip6t_do_table(struct sk_buff *skb, extern unsigned int ip6t_do_table(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state, const struct nf_hook_state *state);
struct xt_table *table);
#ifdef CONFIG_NETFILTER_XTABLES_COMPAT #ifdef CONFIG_NETFILTER_XTABLES_COMPAT
#include <net/compat.h> #include <net/compat.h>
......
/* SPDX-License-Identifier: GPL-2.0 */ /* SPDX-License-Identifier: GPL-2.0 */
#ifndef _NETFILTER_INGRESS_H_ #ifndef _NETFILTER_NETDEV_H_
#define _NETFILTER_INGRESS_H_ #define _NETFILTER_NETDEV_H_
#include <linux/netfilter.h> #include <linux/netfilter.h>
#include <linux/netdevice.h> #include <linux/netdevice.h>
...@@ -38,10 +38,6 @@ static inline int nf_hook_ingress(struct sk_buff *skb) ...@@ -38,10 +38,6 @@ static inline int nf_hook_ingress(struct sk_buff *skb)
return ret; return ret;
} }
static inline void nf_hook_ingress_init(struct net_device *dev)
{
RCU_INIT_POINTER(dev->nf_hooks_ingress, NULL);
}
#else /* CONFIG_NETFILTER_INGRESS */ #else /* CONFIG_NETFILTER_INGRESS */
static inline int nf_hook_ingress_active(struct sk_buff *skb) static inline int nf_hook_ingress_active(struct sk_buff *skb)
{ {
...@@ -52,7 +48,99 @@ static inline int nf_hook_ingress(struct sk_buff *skb) ...@@ -52,7 +48,99 @@ static inline int nf_hook_ingress(struct sk_buff *skb)
{ {
return 0; return 0;
} }
static inline void nf_hook_ingress_init(struct net_device *dev) {}
#endif /* CONFIG_NETFILTER_INGRESS */ #endif /* CONFIG_NETFILTER_INGRESS */
#endif /* _NETFILTER_INGRESS_H_ */
#ifdef CONFIG_NETFILTER_EGRESS
static inline bool nf_hook_egress_active(void)
{
#ifdef CONFIG_JUMP_LABEL
if (!static_key_false(&nf_hooks_needed[NFPROTO_NETDEV][NF_NETDEV_EGRESS]))
return false;
#endif
return true;
}
/**
* nf_hook_egress - classify packets before transmission
* @skb: packet to be classified
* @rc: result code which shall be returned by __dev_queue_xmit() on failure
* @dev: netdev whose egress hooks shall be applied to @skb
*
* Returns @skb on success or %NULL if the packet was consumed or filtered.
* Caller must hold rcu_read_lock.
*
* On ingress, packets are classified first by tc, then by netfilter.
* On egress, the order is reversed for symmetry. Conceptually, tc and
* netfilter can be thought of as layers, with netfilter layered above tc:
* When tc redirects a packet to another interface, netfilter is not applied
* because the packet is on the tc layer.
*
* The nf_skip_egress flag controls whether netfilter is applied on egress.
* It is updated by __netif_receive_skb_core() and __dev_queue_xmit() when the
* packet passes through tc and netfilter. Because __dev_queue_xmit() may be
* called recursively by tunnel drivers such as vxlan, the flag is reverted to
* false after sch_handle_egress(). This ensures that netfilter is applied
* both on the overlay and underlying network.
*/
static inline struct sk_buff *nf_hook_egress(struct sk_buff *skb, int *rc,
struct net_device *dev)
{
struct nf_hook_entries *e;
struct nf_hook_state state;
int ret;
#ifdef CONFIG_NETFILTER_SKIP_EGRESS
if (skb->nf_skip_egress)
return skb;
#endif
e = rcu_dereference(dev->nf_hooks_egress);
if (!e)
return skb;
nf_hook_state_init(&state, NF_NETDEV_EGRESS,
NFPROTO_NETDEV, dev, NULL, NULL,
dev_net(dev), NULL);
ret = nf_hook_slow(skb, &state, e, 0);
if (ret == 1) {
return skb;
} else if (ret < 0) {
*rc = NET_XMIT_DROP;
return NULL;
} else { /* ret == 0 */
*rc = NET_XMIT_SUCCESS;
return NULL;
}
}
#else /* CONFIG_NETFILTER_EGRESS */
static inline bool nf_hook_egress_active(void)
{
return false;
}
static inline struct sk_buff *nf_hook_egress(struct sk_buff *skb, int *rc,
struct net_device *dev)
{
return skb;
}
#endif /* CONFIG_NETFILTER_EGRESS */
static inline void nf_skip_egress(struct sk_buff *skb, bool skip)
{
#ifdef CONFIG_NETFILTER_SKIP_EGRESS
skb->nf_skip_egress = skip;
#endif
}
static inline void nf_hook_netdev_init(struct net_device *dev)
{
#ifdef CONFIG_NETFILTER_INGRESS
RCU_INIT_POINTER(dev->nf_hooks_ingress, NULL);
#endif
#ifdef CONFIG_NETFILTER_EGRESS
RCU_INIT_POINTER(dev->nf_hooks_egress, NULL);
#endif
}
#endif /* _NETFILTER_NETDEV_H_ */
...@@ -652,6 +652,7 @@ typedef unsigned char *sk_buff_data_t; ...@@ -652,6 +652,7 @@ typedef unsigned char *sk_buff_data_t;
* @tc_at_ingress: used within tc_classify to distinguish in/egress * @tc_at_ingress: used within tc_classify to distinguish in/egress
* @redirected: packet was redirected by packet classifier * @redirected: packet was redirected by packet classifier
* @from_ingress: packet was redirected from the ingress path * @from_ingress: packet was redirected from the ingress path
* @nf_skip_egress: packet shall skip nf egress - see netfilter_netdev.h
* @peeked: this packet has been seen already, so stats have been * @peeked: this packet has been seen already, so stats have been
* done for it, don't do them again * done for it, don't do them again
* @nf_trace: netfilter packet trace flag * @nf_trace: netfilter packet trace flag
...@@ -868,6 +869,9 @@ struct sk_buff { ...@@ -868,6 +869,9 @@ struct sk_buff {
#ifdef CONFIG_NET_REDIRECT #ifdef CONFIG_NET_REDIRECT
__u8 from_ingress:1; __u8 from_ingress:1;
#endif #endif
#ifdef CONFIG_NETFILTER_SKIP_EGRESS
__u8 nf_skip_egress:1;
#endif
#ifdef CONFIG_TLS_DEVICE #ifdef CONFIG_TLS_DEVICE
__u8 decrypted:1; __u8 decrypted:1;
#endif #endif
......
...@@ -931,6 +931,7 @@ struct netns_ipvs { ...@@ -931,6 +931,7 @@ struct netns_ipvs {
int sysctl_conn_reuse_mode; int sysctl_conn_reuse_mode;
int sysctl_schedule_icmp; int sysctl_schedule_icmp;
int sysctl_ignore_tunneled; int sysctl_ignore_tunneled;
int sysctl_run_estimation;
/* ip_vs_lblc */ /* ip_vs_lblc */
int sysctl_lblc_expiration; int sysctl_lblc_expiration;
...@@ -1071,6 +1072,11 @@ static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs) ...@@ -1071,6 +1072,11 @@ static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs)
return ipvs->sysctl_cache_bypass; return ipvs->sysctl_cache_bypass;
} }
static inline int sysctl_run_estimation(struct netns_ipvs *ipvs)
{
return ipvs->sysctl_run_estimation;
}
#else #else
static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs) static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs)
...@@ -1163,6 +1169,11 @@ static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs) ...@@ -1163,6 +1169,11 @@ static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs)
return 0; return 0;
} }
static inline int sysctl_run_estimation(struct netns_ipvs *ipvs)
{
return 1;
}
#endif #endif
/* IPVS core functions /* IPVS core functions
......
...@@ -51,6 +51,7 @@ enum nf_inet_hooks { ...@@ -51,6 +51,7 @@ enum nf_inet_hooks {
enum nf_dev_hooks { enum nf_dev_hooks {
NF_NETDEV_INGRESS, NF_NETDEV_INGRESS,
NF_NETDEV_EGRESS,
NF_NETDEV_NUMHOOKS NF_NETDEV_NUMHOOKS
}; };
......
...@@ -66,7 +66,7 @@ static unsigned int ebt_broute(void *priv, struct sk_buff *skb, ...@@ -66,7 +66,7 @@ static unsigned int ebt_broute(void *priv, struct sk_buff *skb,
NFPROTO_BRIDGE, s->in, NULL, NULL, NFPROTO_BRIDGE, s->in, NULL, NULL,
s->net, NULL); s->net, NULL);
ret = ebt_do_table(skb, &state, priv); ret = ebt_do_table(priv, skb, &state);
if (ret != NF_DROP) if (ret != NF_DROP)
return ret; return ret;
......
...@@ -58,28 +58,21 @@ static const struct ebt_table frame_filter = { ...@@ -58,28 +58,21 @@ static const struct ebt_table frame_filter = {
.me = THIS_MODULE, .me = THIS_MODULE,
}; };
static unsigned int
ebt_filter_hook(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ebt_do_table(skb, state, priv);
}
static const struct nf_hook_ops ebt_ops_filter[] = { static const struct nf_hook_ops ebt_ops_filter[] = {
{ {
.hook = ebt_filter_hook, .hook = ebt_do_table,
.pf = NFPROTO_BRIDGE, .pf = NFPROTO_BRIDGE,
.hooknum = NF_BR_LOCAL_IN, .hooknum = NF_BR_LOCAL_IN,
.priority = NF_BR_PRI_FILTER_BRIDGED, .priority = NF_BR_PRI_FILTER_BRIDGED,
}, },
{ {
.hook = ebt_filter_hook, .hook = ebt_do_table,
.pf = NFPROTO_BRIDGE, .pf = NFPROTO_BRIDGE,
.hooknum = NF_BR_FORWARD, .hooknum = NF_BR_FORWARD,
.priority = NF_BR_PRI_FILTER_BRIDGED, .priority = NF_BR_PRI_FILTER_BRIDGED,
}, },
{ {
.hook = ebt_filter_hook, .hook = ebt_do_table,
.pf = NFPROTO_BRIDGE, .pf = NFPROTO_BRIDGE,
.hooknum = NF_BR_LOCAL_OUT, .hooknum = NF_BR_LOCAL_OUT,
.priority = NF_BR_PRI_FILTER_OTHER, .priority = NF_BR_PRI_FILTER_OTHER,
......
...@@ -58,27 +58,21 @@ static const struct ebt_table frame_nat = { ...@@ -58,27 +58,21 @@ static const struct ebt_table frame_nat = {
.me = THIS_MODULE, .me = THIS_MODULE,
}; };
static unsigned int ebt_nat_hook(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ebt_do_table(skb, state, priv);
}
static const struct nf_hook_ops ebt_ops_nat[] = { static const struct nf_hook_ops ebt_ops_nat[] = {
{ {
.hook = ebt_nat_hook, .hook = ebt_do_table,
.pf = NFPROTO_BRIDGE, .pf = NFPROTO_BRIDGE,
.hooknum = NF_BR_LOCAL_OUT, .hooknum = NF_BR_LOCAL_OUT,
.priority = NF_BR_PRI_NAT_DST_OTHER, .priority = NF_BR_PRI_NAT_DST_OTHER,
}, },
{ {
.hook = ebt_nat_hook, .hook = ebt_do_table,
.pf = NFPROTO_BRIDGE, .pf = NFPROTO_BRIDGE,
.hooknum = NF_BR_POST_ROUTING, .hooknum = NF_BR_POST_ROUTING,
.priority = NF_BR_PRI_NAT_SRC, .priority = NF_BR_PRI_NAT_SRC,
}, },
{ {
.hook = ebt_nat_hook, .hook = ebt_do_table,
.pf = NFPROTO_BRIDGE, .pf = NFPROTO_BRIDGE,
.hooknum = NF_BR_PRE_ROUTING, .hooknum = NF_BR_PRE_ROUTING,
.priority = NF_BR_PRI_NAT_DST_BRIDGED, .priority = NF_BR_PRI_NAT_DST_BRIDGED,
......
...@@ -189,10 +189,10 @@ ebt_get_target_c(const struct ebt_entry *e) ...@@ -189,10 +189,10 @@ ebt_get_target_c(const struct ebt_entry *e)
} }
/* Do some firewalling */ /* Do some firewalling */
unsigned int ebt_do_table(struct sk_buff *skb, unsigned int ebt_do_table(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state, const struct nf_hook_state *state)
struct ebt_table *table)
{ {
struct ebt_table *table = priv;
unsigned int hook = state->hook; unsigned int hook = state->hook;
int i, nentries; int i, nentries;
struct ebt_entry *point; struct ebt_entry *point;
......
...@@ -140,7 +140,7 @@ ...@@ -140,7 +140,7 @@
#include <linux/if_macvlan.h> #include <linux/if_macvlan.h>
#include <linux/errqueue.h> #include <linux/errqueue.h>
#include <linux/hrtimer.h> #include <linux/hrtimer.h>
#include <linux/netfilter_ingress.h> #include <linux/netfilter_netdev.h>
#include <linux/crash_dump.h> #include <linux/crash_dump.h>
#include <linux/sctp.h> #include <linux/sctp.h>
#include <net/udp_tunnel.h> #include <net/udp_tunnel.h>
...@@ -3926,6 +3926,7 @@ EXPORT_SYMBOL(dev_loopback_xmit); ...@@ -3926,6 +3926,7 @@ EXPORT_SYMBOL(dev_loopback_xmit);
static struct sk_buff * static struct sk_buff *
sch_handle_egress(struct sk_buff *skb, int *ret, struct net_device *dev) sch_handle_egress(struct sk_buff *skb, int *ret, struct net_device *dev)
{ {
#ifdef CONFIG_NET_CLS_ACT
struct mini_Qdisc *miniq = rcu_dereference_bh(dev->miniq_egress); struct mini_Qdisc *miniq = rcu_dereference_bh(dev->miniq_egress);
struct tcf_result cl_res; struct tcf_result cl_res;
...@@ -3961,6 +3962,7 @@ sch_handle_egress(struct sk_buff *skb, int *ret, struct net_device *dev) ...@@ -3961,6 +3962,7 @@ sch_handle_egress(struct sk_buff *skb, int *ret, struct net_device *dev)
default: default:
break; break;
} }
#endif /* CONFIG_NET_CLS_ACT */
return skb; return skb;
} }
...@@ -4154,13 +4156,20 @@ static int __dev_queue_xmit(struct sk_buff *skb, struct net_device *sb_dev) ...@@ -4154,13 +4156,20 @@ static int __dev_queue_xmit(struct sk_buff *skb, struct net_device *sb_dev)
qdisc_pkt_len_init(skb); qdisc_pkt_len_init(skb);
#ifdef CONFIG_NET_CLS_ACT #ifdef CONFIG_NET_CLS_ACT
skb->tc_at_ingress = 0; skb->tc_at_ingress = 0;
# ifdef CONFIG_NET_EGRESS #endif
#ifdef CONFIG_NET_EGRESS
if (static_branch_unlikely(&egress_needed_key)) { if (static_branch_unlikely(&egress_needed_key)) {
if (nf_hook_egress_active()) {
skb = nf_hook_egress(skb, &rc, dev);
if (!skb)
goto out;
}
nf_skip_egress(skb, true);
skb = sch_handle_egress(skb, &rc, dev); skb = sch_handle_egress(skb, &rc, dev);
if (!skb) if (!skb)
goto out; goto out;
nf_skip_egress(skb, false);
} }
# endif
#endif #endif
/* If device/qdisc don't need skb->dst, release it right now while /* If device/qdisc don't need skb->dst, release it right now while
* its hot in this cpu cache. * its hot in this cpu cache.
...@@ -5302,6 +5311,7 @@ static int __netif_receive_skb_core(struct sk_buff **pskb, bool pfmemalloc, ...@@ -5302,6 +5311,7 @@ static int __netif_receive_skb_core(struct sk_buff **pskb, bool pfmemalloc,
if (static_branch_unlikely(&ingress_needed_key)) { if (static_branch_unlikely(&ingress_needed_key)) {
bool another = false; bool another = false;
nf_skip_egress(skb, true);
skb = sch_handle_ingress(skb, &pt_prev, &ret, orig_dev, skb = sch_handle_ingress(skb, &pt_prev, &ret, orig_dev,
&another); &another);
if (another) if (another)
...@@ -5309,6 +5319,7 @@ static int __netif_receive_skb_core(struct sk_buff **pskb, bool pfmemalloc, ...@@ -5309,6 +5319,7 @@ static int __netif_receive_skb_core(struct sk_buff **pskb, bool pfmemalloc,
if (!skb) if (!skb)
goto out; goto out;
nf_skip_egress(skb, false);
if (nf_ingress(skb, &pt_prev, &ret, orig_dev) < 0) if (nf_ingress(skb, &pt_prev, &ret, orig_dev) < 0)
goto out; goto out;
} }
...@@ -10870,7 +10881,7 @@ struct net_device *alloc_netdev_mqs(int sizeof_priv, const char *name, ...@@ -10870,7 +10881,7 @@ struct net_device *alloc_netdev_mqs(int sizeof_priv, const char *name,
if (!dev->ethtool_ops) if (!dev->ethtool_ops)
dev->ethtool_ops = &default_ethtool_ops; dev->ethtool_ops = &default_ethtool_ops;
nf_hook_ingress_init(dev); nf_hook_netdev_init(dev);
return dev; return dev;
......
...@@ -179,10 +179,11 @@ struct arpt_entry *arpt_next_entry(const struct arpt_entry *entry) ...@@ -179,10 +179,11 @@ struct arpt_entry *arpt_next_entry(const struct arpt_entry *entry)
return (void *)entry + entry->next_offset; return (void *)entry + entry->next_offset;
} }
unsigned int arpt_do_table(struct sk_buff *skb, unsigned int arpt_do_table(void *priv,
const struct nf_hook_state *state, struct sk_buff *skb,
struct xt_table *table) const struct nf_hook_state *state)
{ {
const struct xt_table *table = priv;
unsigned int hook = state->hook; unsigned int hook = state->hook;
static const char nulldevname[IFNAMSIZ] __attribute__((aligned(sizeof(long)))); static const char nulldevname[IFNAMSIZ] __attribute__((aligned(sizeof(long))));
unsigned int verdict = NF_DROP; unsigned int verdict = NF_DROP;
......
...@@ -26,14 +26,6 @@ static const struct xt_table packet_filter = { ...@@ -26,14 +26,6 @@ static const struct xt_table packet_filter = {
.priority = NF_IP_PRI_FILTER, .priority = NF_IP_PRI_FILTER,
}; };
/* The work comes in here from netfilter.c */
static unsigned int
arptable_filter_hook(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return arpt_do_table(skb, state, priv);
}
static struct nf_hook_ops *arpfilter_ops __read_mostly; static struct nf_hook_ops *arpfilter_ops __read_mostly;
static int arptable_filter_table_init(struct net *net) static int arptable_filter_table_init(struct net *net)
...@@ -72,7 +64,7 @@ static int __init arptable_filter_init(void) ...@@ -72,7 +64,7 @@ static int __init arptable_filter_init(void)
if (ret < 0) if (ret < 0)
return ret; return ret;
arpfilter_ops = xt_hook_ops_alloc(&packet_filter, arptable_filter_hook); arpfilter_ops = xt_hook_ops_alloc(&packet_filter, arpt_do_table);
if (IS_ERR(arpfilter_ops)) { if (IS_ERR(arpfilter_ops)) {
xt_unregister_template(&packet_filter); xt_unregister_template(&packet_filter);
return PTR_ERR(arpfilter_ops); return PTR_ERR(arpfilter_ops);
......
...@@ -222,10 +222,11 @@ struct ipt_entry *ipt_next_entry(const struct ipt_entry *entry) ...@@ -222,10 +222,11 @@ struct ipt_entry *ipt_next_entry(const struct ipt_entry *entry)
/* Returns one of the generic firewall policies, like NF_ACCEPT. */ /* Returns one of the generic firewall policies, like NF_ACCEPT. */
unsigned int unsigned int
ipt_do_table(struct sk_buff *skb, ipt_do_table(void *priv,
const struct nf_hook_state *state, struct sk_buff *skb,
struct xt_table *table) const struct nf_hook_state *state)
{ {
const struct xt_table *table = priv;
unsigned int hook = state->hook; unsigned int hook = state->hook;
static const char nulldevname[IFNAMSIZ] __attribute__((aligned(sizeof(long)))); static const char nulldevname[IFNAMSIZ] __attribute__((aligned(sizeof(long))));
const struct iphdr *ip; const struct iphdr *ip;
......
...@@ -28,13 +28,6 @@ static const struct xt_table packet_filter = { ...@@ -28,13 +28,6 @@ static const struct xt_table packet_filter = {
.priority = NF_IP_PRI_FILTER, .priority = NF_IP_PRI_FILTER,
}; };
static unsigned int
iptable_filter_hook(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ipt_do_table(skb, state, priv);
}
static struct nf_hook_ops *filter_ops __read_mostly; static struct nf_hook_ops *filter_ops __read_mostly;
/* Default to forward because I got too much mail already. */ /* Default to forward because I got too much mail already. */
...@@ -90,7 +83,7 @@ static int __init iptable_filter_init(void) ...@@ -90,7 +83,7 @@ static int __init iptable_filter_init(void)
if (ret < 0) if (ret < 0)
return ret; return ret;
filter_ops = xt_hook_ops_alloc(&packet_filter, iptable_filter_hook); filter_ops = xt_hook_ops_alloc(&packet_filter, ipt_do_table);
if (IS_ERR(filter_ops)) { if (IS_ERR(filter_ops)) {
xt_unregister_template(&packet_filter); xt_unregister_template(&packet_filter);
return PTR_ERR(filter_ops); return PTR_ERR(filter_ops);
......
...@@ -34,7 +34,7 @@ static const struct xt_table packet_mangler = { ...@@ -34,7 +34,7 @@ static const struct xt_table packet_mangler = {
}; };
static unsigned int static unsigned int
ipt_mangle_out(struct sk_buff *skb, const struct nf_hook_state *state, void *priv) ipt_mangle_out(void *priv, struct sk_buff *skb, const struct nf_hook_state *state)
{ {
unsigned int ret; unsigned int ret;
const struct iphdr *iph; const struct iphdr *iph;
...@@ -50,7 +50,7 @@ ipt_mangle_out(struct sk_buff *skb, const struct nf_hook_state *state, void *pri ...@@ -50,7 +50,7 @@ ipt_mangle_out(struct sk_buff *skb, const struct nf_hook_state *state, void *pri
daddr = iph->daddr; daddr = iph->daddr;
tos = iph->tos; tos = iph->tos;
ret = ipt_do_table(skb, state, priv); ret = ipt_do_table(priv, skb, state);
/* Reroute for ANY change. */ /* Reroute for ANY change. */
if (ret != NF_DROP && ret != NF_STOLEN) { if (ret != NF_DROP && ret != NF_STOLEN) {
iph = ip_hdr(skb); iph = ip_hdr(skb);
...@@ -75,8 +75,8 @@ iptable_mangle_hook(void *priv, ...@@ -75,8 +75,8 @@ iptable_mangle_hook(void *priv,
const struct nf_hook_state *state) const struct nf_hook_state *state)
{ {
if (state->hook == NF_INET_LOCAL_OUT) if (state->hook == NF_INET_LOCAL_OUT)
return ipt_mangle_out(skb, state, priv); return ipt_mangle_out(priv, skb, state);
return ipt_do_table(skb, state, priv); return ipt_do_table(priv, skb, state);
} }
static struct nf_hook_ops *mangle_ops __read_mostly; static struct nf_hook_ops *mangle_ops __read_mostly;
......
...@@ -29,34 +29,27 @@ static const struct xt_table nf_nat_ipv4_table = { ...@@ -29,34 +29,27 @@ static const struct xt_table nf_nat_ipv4_table = {
.af = NFPROTO_IPV4, .af = NFPROTO_IPV4,
}; };
static unsigned int iptable_nat_do_chain(void *priv,
struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ipt_do_table(skb, state, priv);
}
static const struct nf_hook_ops nf_nat_ipv4_ops[] = { static const struct nf_hook_ops nf_nat_ipv4_ops[] = {
{ {
.hook = iptable_nat_do_chain, .hook = ipt_do_table,
.pf = NFPROTO_IPV4, .pf = NFPROTO_IPV4,
.hooknum = NF_INET_PRE_ROUTING, .hooknum = NF_INET_PRE_ROUTING,
.priority = NF_IP_PRI_NAT_DST, .priority = NF_IP_PRI_NAT_DST,
}, },
{ {
.hook = iptable_nat_do_chain, .hook = ipt_do_table,
.pf = NFPROTO_IPV4, .pf = NFPROTO_IPV4,
.hooknum = NF_INET_POST_ROUTING, .hooknum = NF_INET_POST_ROUTING,
.priority = NF_IP_PRI_NAT_SRC, .priority = NF_IP_PRI_NAT_SRC,
}, },
{ {
.hook = iptable_nat_do_chain, .hook = ipt_do_table,
.pf = NFPROTO_IPV4, .pf = NFPROTO_IPV4,
.hooknum = NF_INET_LOCAL_OUT, .hooknum = NF_INET_LOCAL_OUT,
.priority = NF_IP_PRI_NAT_DST, .priority = NF_IP_PRI_NAT_DST,
}, },
{ {
.hook = iptable_nat_do_chain, .hook = ipt_do_table,
.pf = NFPROTO_IPV4, .pf = NFPROTO_IPV4,
.hooknum = NF_INET_LOCAL_IN, .hooknum = NF_INET_LOCAL_IN,
.priority = NF_IP_PRI_NAT_SRC, .priority = NF_IP_PRI_NAT_SRC,
......
...@@ -32,14 +32,6 @@ static const struct xt_table packet_raw_before_defrag = { ...@@ -32,14 +32,6 @@ static const struct xt_table packet_raw_before_defrag = {
.priority = NF_IP_PRI_RAW_BEFORE_DEFRAG, .priority = NF_IP_PRI_RAW_BEFORE_DEFRAG,
}; };
/* The work comes in here from netfilter.c. */
static unsigned int
iptable_raw_hook(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ipt_do_table(skb, state, priv);
}
static struct nf_hook_ops *rawtable_ops __read_mostly; static struct nf_hook_ops *rawtable_ops __read_mostly;
static int iptable_raw_table_init(struct net *net) static int iptable_raw_table_init(struct net *net)
...@@ -90,7 +82,7 @@ static int __init iptable_raw_init(void) ...@@ -90,7 +82,7 @@ static int __init iptable_raw_init(void)
if (ret < 0) if (ret < 0)
return ret; return ret;
rawtable_ops = xt_hook_ops_alloc(table, iptable_raw_hook); rawtable_ops = xt_hook_ops_alloc(table, ipt_do_table);
if (IS_ERR(rawtable_ops)) { if (IS_ERR(rawtable_ops)) {
xt_unregister_template(table); xt_unregister_template(table);
return PTR_ERR(rawtable_ops); return PTR_ERR(rawtable_ops);
......
...@@ -33,13 +33,6 @@ static const struct xt_table security_table = { ...@@ -33,13 +33,6 @@ static const struct xt_table security_table = {
.priority = NF_IP_PRI_SECURITY, .priority = NF_IP_PRI_SECURITY,
}; };
static unsigned int
iptable_security_hook(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ipt_do_table(skb, state, priv);
}
static struct nf_hook_ops *sectbl_ops __read_mostly; static struct nf_hook_ops *sectbl_ops __read_mostly;
static int iptable_security_table_init(struct net *net) static int iptable_security_table_init(struct net *net)
...@@ -78,7 +71,7 @@ static int __init iptable_security_init(void) ...@@ -78,7 +71,7 @@ static int __init iptable_security_init(void)
if (ret < 0) if (ret < 0)
return ret; return ret;
sectbl_ops = xt_hook_ops_alloc(&security_table, iptable_security_hook); sectbl_ops = xt_hook_ops_alloc(&security_table, ipt_do_table);
if (IS_ERR(sectbl_ops)) { if (IS_ERR(sectbl_ops)) {
xt_unregister_template(&security_table); xt_unregister_template(&security_table);
return PTR_ERR(sectbl_ops); return PTR_ERR(sectbl_ops);
......
...@@ -247,10 +247,10 @@ ip6t_next_entry(const struct ip6t_entry *entry) ...@@ -247,10 +247,10 @@ ip6t_next_entry(const struct ip6t_entry *entry)
/* Returns one of the generic firewall policies, like NF_ACCEPT. */ /* Returns one of the generic firewall policies, like NF_ACCEPT. */
unsigned int unsigned int
ip6t_do_table(struct sk_buff *skb, ip6t_do_table(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state, const struct nf_hook_state *state)
struct xt_table *table)
{ {
const struct xt_table *table = priv;
unsigned int hook = state->hook; unsigned int hook = state->hook;
static const char nulldevname[IFNAMSIZ] __attribute__((aligned(sizeof(long)))); static const char nulldevname[IFNAMSIZ] __attribute__((aligned(sizeof(long))));
/* Initializing verdict to NF_DROP keeps gcc happy. */ /* Initializing verdict to NF_DROP keeps gcc happy. */
......
...@@ -27,14 +27,6 @@ static const struct xt_table packet_filter = { ...@@ -27,14 +27,6 @@ static const struct xt_table packet_filter = {
.priority = NF_IP6_PRI_FILTER, .priority = NF_IP6_PRI_FILTER,
}; };
/* The work comes in here from netfilter.c. */
static unsigned int
ip6table_filter_hook(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip6t_do_table(skb, state, priv);
}
static struct nf_hook_ops *filter_ops __read_mostly; static struct nf_hook_ops *filter_ops __read_mostly;
/* Default to forward because I got too much mail already. */ /* Default to forward because I got too much mail already. */
...@@ -90,7 +82,7 @@ static int __init ip6table_filter_init(void) ...@@ -90,7 +82,7 @@ static int __init ip6table_filter_init(void)
if (ret < 0) if (ret < 0)
return ret; return ret;
filter_ops = xt_hook_ops_alloc(&packet_filter, ip6table_filter_hook); filter_ops = xt_hook_ops_alloc(&packet_filter, ip6t_do_table);
if (IS_ERR(filter_ops)) { if (IS_ERR(filter_ops)) {
xt_unregister_template(&packet_filter); xt_unregister_template(&packet_filter);
return PTR_ERR(filter_ops); return PTR_ERR(filter_ops);
......
...@@ -29,7 +29,7 @@ static const struct xt_table packet_mangler = { ...@@ -29,7 +29,7 @@ static const struct xt_table packet_mangler = {
}; };
static unsigned int static unsigned int
ip6t_mangle_out(struct sk_buff *skb, const struct nf_hook_state *state, void *priv) ip6t_mangle_out(void *priv, struct sk_buff *skb, const struct nf_hook_state *state)
{ {
unsigned int ret; unsigned int ret;
struct in6_addr saddr, daddr; struct in6_addr saddr, daddr;
...@@ -46,7 +46,7 @@ ip6t_mangle_out(struct sk_buff *skb, const struct nf_hook_state *state, void *pr ...@@ -46,7 +46,7 @@ ip6t_mangle_out(struct sk_buff *skb, const struct nf_hook_state *state, void *pr
/* flowlabel and prio (includes version, which shouldn't change either */ /* flowlabel and prio (includes version, which shouldn't change either */
flowlabel = *((u_int32_t *)ipv6_hdr(skb)); flowlabel = *((u_int32_t *)ipv6_hdr(skb));
ret = ip6t_do_table(skb, state, priv); ret = ip6t_do_table(priv, skb, state);
if (ret != NF_DROP && ret != NF_STOLEN && if (ret != NF_DROP && ret != NF_STOLEN &&
(!ipv6_addr_equal(&ipv6_hdr(skb)->saddr, &saddr) || (!ipv6_addr_equal(&ipv6_hdr(skb)->saddr, &saddr) ||
...@@ -68,8 +68,8 @@ ip6table_mangle_hook(void *priv, struct sk_buff *skb, ...@@ -68,8 +68,8 @@ ip6table_mangle_hook(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state) const struct nf_hook_state *state)
{ {
if (state->hook == NF_INET_LOCAL_OUT) if (state->hook == NF_INET_LOCAL_OUT)
return ip6t_mangle_out(skb, state, priv); return ip6t_mangle_out(priv, skb, state);
return ip6t_do_table(skb, state, priv); return ip6t_do_table(priv, skb, state);
} }
static struct nf_hook_ops *mangle_ops __read_mostly; static struct nf_hook_ops *mangle_ops __read_mostly;
......
...@@ -31,34 +31,27 @@ static const struct xt_table nf_nat_ipv6_table = { ...@@ -31,34 +31,27 @@ static const struct xt_table nf_nat_ipv6_table = {
.af = NFPROTO_IPV6, .af = NFPROTO_IPV6,
}; };
static unsigned int ip6table_nat_do_chain(void *priv,
struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip6t_do_table(skb, state, priv);
}
static const struct nf_hook_ops nf_nat_ipv6_ops[] = { static const struct nf_hook_ops nf_nat_ipv6_ops[] = {
{ {
.hook = ip6table_nat_do_chain, .hook = ip6t_do_table,
.pf = NFPROTO_IPV6, .pf = NFPROTO_IPV6,
.hooknum = NF_INET_PRE_ROUTING, .hooknum = NF_INET_PRE_ROUTING,
.priority = NF_IP6_PRI_NAT_DST, .priority = NF_IP6_PRI_NAT_DST,
}, },
{ {
.hook = ip6table_nat_do_chain, .hook = ip6t_do_table,
.pf = NFPROTO_IPV6, .pf = NFPROTO_IPV6,
.hooknum = NF_INET_POST_ROUTING, .hooknum = NF_INET_POST_ROUTING,
.priority = NF_IP6_PRI_NAT_SRC, .priority = NF_IP6_PRI_NAT_SRC,
}, },
{ {
.hook = ip6table_nat_do_chain, .hook = ip6t_do_table,
.pf = NFPROTO_IPV6, .pf = NFPROTO_IPV6,
.hooknum = NF_INET_LOCAL_OUT, .hooknum = NF_INET_LOCAL_OUT,
.priority = NF_IP6_PRI_NAT_DST, .priority = NF_IP6_PRI_NAT_DST,
}, },
{ {
.hook = ip6table_nat_do_chain, .hook = ip6t_do_table,
.pf = NFPROTO_IPV6, .pf = NFPROTO_IPV6,
.hooknum = NF_INET_LOCAL_IN, .hooknum = NF_INET_LOCAL_IN,
.priority = NF_IP6_PRI_NAT_SRC, .priority = NF_IP6_PRI_NAT_SRC,
......
...@@ -31,14 +31,6 @@ static const struct xt_table packet_raw_before_defrag = { ...@@ -31,14 +31,6 @@ static const struct xt_table packet_raw_before_defrag = {
.priority = NF_IP6_PRI_RAW_BEFORE_DEFRAG, .priority = NF_IP6_PRI_RAW_BEFORE_DEFRAG,
}; };
/* The work comes in here from netfilter.c. */
static unsigned int
ip6table_raw_hook(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip6t_do_table(skb, state, priv);
}
static struct nf_hook_ops *rawtable_ops __read_mostly; static struct nf_hook_ops *rawtable_ops __read_mostly;
static int ip6table_raw_table_init(struct net *net) static int ip6table_raw_table_init(struct net *net)
...@@ -88,7 +80,7 @@ static int __init ip6table_raw_init(void) ...@@ -88,7 +80,7 @@ static int __init ip6table_raw_init(void)
return ret; return ret;
/* Register hooks */ /* Register hooks */
rawtable_ops = xt_hook_ops_alloc(table, ip6table_raw_hook); rawtable_ops = xt_hook_ops_alloc(table, ip6t_do_table);
if (IS_ERR(rawtable_ops)) { if (IS_ERR(rawtable_ops)) {
xt_unregister_template(table); xt_unregister_template(table);
return PTR_ERR(rawtable_ops); return PTR_ERR(rawtable_ops);
......
...@@ -32,13 +32,6 @@ static const struct xt_table security_table = { ...@@ -32,13 +32,6 @@ static const struct xt_table security_table = {
.priority = NF_IP6_PRI_SECURITY, .priority = NF_IP6_PRI_SECURITY,
}; };
static unsigned int
ip6table_security_hook(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip6t_do_table(skb, state, priv);
}
static struct nf_hook_ops *sectbl_ops __read_mostly; static struct nf_hook_ops *sectbl_ops __read_mostly;
static int ip6table_security_table_init(struct net *net) static int ip6table_security_table_init(struct net *net)
...@@ -77,7 +70,7 @@ static int __init ip6table_security_init(void) ...@@ -77,7 +70,7 @@ static int __init ip6table_security_init(void)
if (ret < 0) if (ret < 0)
return ret; return ret;
sectbl_ops = xt_hook_ops_alloc(&security_table, ip6table_security_hook); sectbl_ops = xt_hook_ops_alloc(&security_table, ip6t_do_table);
if (IS_ERR(sectbl_ops)) { if (IS_ERR(sectbl_ops)) {
xt_unregister_template(&security_table); xt_unregister_template(&security_table);
return PTR_ERR(sectbl_ops); return PTR_ERR(sectbl_ops);
......
...@@ -10,6 +10,17 @@ config NETFILTER_INGRESS ...@@ -10,6 +10,17 @@ config NETFILTER_INGRESS
This allows you to classify packets from ingress using the Netfilter This allows you to classify packets from ingress using the Netfilter
infrastructure. infrastructure.
config NETFILTER_EGRESS
bool "Netfilter egress support"
default y
select NET_EGRESS
help
This allows you to classify packets before transmission using the
Netfilter infrastructure.
config NETFILTER_SKIP_EGRESS
def_bool NETFILTER_EGRESS && (NET_CLS_ACT || IFB)
config NETFILTER_NETLINK config NETFILTER_NETLINK
tristate tristate
......
...@@ -316,6 +316,12 @@ nf_hook_entry_head(struct net *net, int pf, unsigned int hooknum, ...@@ -316,6 +316,12 @@ nf_hook_entry_head(struct net *net, int pf, unsigned int hooknum,
if (dev && dev_net(dev) == net) if (dev && dev_net(dev) == net)
return &dev->nf_hooks_ingress; return &dev->nf_hooks_ingress;
} }
#endif
#ifdef CONFIG_NETFILTER_EGRESS
if (hooknum == NF_NETDEV_EGRESS) {
if (dev && dev_net(dev) == net)
return &dev->nf_hooks_egress;
}
#endif #endif
WARN_ON_ONCE(1); WARN_ON_ONCE(1);
return NULL; return NULL;
...@@ -335,7 +341,8 @@ static int nf_ingress_check(struct net *net, const struct nf_hook_ops *reg, ...@@ -335,7 +341,8 @@ static int nf_ingress_check(struct net *net, const struct nf_hook_ops *reg,
return 0; return 0;
} }
static inline bool nf_ingress_hook(const struct nf_hook_ops *reg, int pf) static inline bool __maybe_unused nf_ingress_hook(const struct nf_hook_ops *reg,
int pf)
{ {
if ((pf == NFPROTO_NETDEV && reg->hooknum == NF_NETDEV_INGRESS) || if ((pf == NFPROTO_NETDEV && reg->hooknum == NF_NETDEV_INGRESS) ||
(pf == NFPROTO_INET && reg->hooknum == NF_INET_INGRESS)) (pf == NFPROTO_INET && reg->hooknum == NF_INET_INGRESS))
...@@ -344,6 +351,12 @@ static inline bool nf_ingress_hook(const struct nf_hook_ops *reg, int pf) ...@@ -344,6 +351,12 @@ static inline bool nf_ingress_hook(const struct nf_hook_ops *reg, int pf)
return false; return false;
} }
static inline bool __maybe_unused nf_egress_hook(const struct nf_hook_ops *reg,
int pf)
{
return pf == NFPROTO_NETDEV && reg->hooknum == NF_NETDEV_EGRESS;
}
static void nf_static_key_inc(const struct nf_hook_ops *reg, int pf) static void nf_static_key_inc(const struct nf_hook_ops *reg, int pf)
{ {
#ifdef CONFIG_JUMP_LABEL #ifdef CONFIG_JUMP_LABEL
...@@ -383,9 +396,18 @@ static int __nf_register_net_hook(struct net *net, int pf, ...@@ -383,9 +396,18 @@ static int __nf_register_net_hook(struct net *net, int pf,
switch (pf) { switch (pf) {
case NFPROTO_NETDEV: case NFPROTO_NETDEV:
err = nf_ingress_check(net, reg, NF_NETDEV_INGRESS); #ifndef CONFIG_NETFILTER_INGRESS
if (err < 0) if (reg->hooknum == NF_NETDEV_INGRESS)
return err; return -EOPNOTSUPP;
#endif
#ifndef CONFIG_NETFILTER_EGRESS
if (reg->hooknum == NF_NETDEV_EGRESS)
return -EOPNOTSUPP;
#endif
if ((reg->hooknum != NF_NETDEV_INGRESS &&
reg->hooknum != NF_NETDEV_EGRESS) ||
!reg->dev || dev_net(reg->dev) != net)
return -EINVAL;
break; break;
case NFPROTO_INET: case NFPROTO_INET:
if (reg->hooknum != NF_INET_INGRESS) if (reg->hooknum != NF_INET_INGRESS)
...@@ -417,6 +439,10 @@ static int __nf_register_net_hook(struct net *net, int pf, ...@@ -417,6 +439,10 @@ static int __nf_register_net_hook(struct net *net, int pf,
#ifdef CONFIG_NETFILTER_INGRESS #ifdef CONFIG_NETFILTER_INGRESS
if (nf_ingress_hook(reg, pf)) if (nf_ingress_hook(reg, pf))
net_inc_ingress_queue(); net_inc_ingress_queue();
#endif
#ifdef CONFIG_NETFILTER_EGRESS
if (nf_egress_hook(reg, pf))
net_inc_egress_queue();
#endif #endif
nf_static_key_inc(reg, pf); nf_static_key_inc(reg, pf);
...@@ -474,6 +500,10 @@ static void __nf_unregister_net_hook(struct net *net, int pf, ...@@ -474,6 +500,10 @@ static void __nf_unregister_net_hook(struct net *net, int pf,
#ifdef CONFIG_NETFILTER_INGRESS #ifdef CONFIG_NETFILTER_INGRESS
if (nf_ingress_hook(reg, pf)) if (nf_ingress_hook(reg, pf))
net_dec_ingress_queue(); net_dec_ingress_queue();
#endif
#ifdef CONFIG_NETFILTER_EGRESS
if (nf_egress_hook(reg, pf))
net_dec_egress_queue();
#endif #endif
nf_static_key_dec(reg, pf); nf_static_key_dec(reg, pf);
} else { } else {
......
...@@ -1330,12 +1330,15 @@ handle_response(int af, struct sk_buff *skb, struct ip_vs_proto_data *pd, ...@@ -1330,12 +1330,15 @@ handle_response(int af, struct sk_buff *skb, struct ip_vs_proto_data *pd,
* Check if outgoing packet belongs to the established ip_vs_conn. * Check if outgoing packet belongs to the established ip_vs_conn.
*/ */
static unsigned int static unsigned int
ip_vs_out(struct netns_ipvs *ipvs, unsigned int hooknum, struct sk_buff *skb, int af) ip_vs_out_hook(void *priv, struct sk_buff *skb, const struct nf_hook_state *state)
{ {
struct netns_ipvs *ipvs = net_ipvs(state->net);
unsigned int hooknum = state->hook;
struct ip_vs_iphdr iph; struct ip_vs_iphdr iph;
struct ip_vs_protocol *pp; struct ip_vs_protocol *pp;
struct ip_vs_proto_data *pd; struct ip_vs_proto_data *pd;
struct ip_vs_conn *cp; struct ip_vs_conn *cp;
int af = state->pf;
struct sock *sk; struct sock *sk;
EnterFunction(11); EnterFunction(11);
...@@ -1468,56 +1471,6 @@ ip_vs_out(struct netns_ipvs *ipvs, unsigned int hooknum, struct sk_buff *skb, in ...@@ -1468,56 +1471,6 @@ ip_vs_out(struct netns_ipvs *ipvs, unsigned int hooknum, struct sk_buff *skb, in
return NF_ACCEPT; return NF_ACCEPT;
} }
/*
* It is hooked at the NF_INET_FORWARD and NF_INET_LOCAL_IN chain,
* used only for VS/NAT.
* Check if packet is reply for established ip_vs_conn.
*/
static unsigned int
ip_vs_reply4(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip_vs_out(net_ipvs(state->net), state->hook, skb, AF_INET);
}
/*
* It is hooked at the NF_INET_LOCAL_OUT chain, used only for VS/NAT.
* Check if packet is reply for established ip_vs_conn.
*/
static unsigned int
ip_vs_local_reply4(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip_vs_out(net_ipvs(state->net), state->hook, skb, AF_INET);
}
#ifdef CONFIG_IP_VS_IPV6
/*
* It is hooked at the NF_INET_FORWARD and NF_INET_LOCAL_IN chain,
* used only for VS/NAT.
* Check if packet is reply for established ip_vs_conn.
*/
static unsigned int
ip_vs_reply6(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip_vs_out(net_ipvs(state->net), state->hook, skb, AF_INET6);
}
/*
* It is hooked at the NF_INET_LOCAL_OUT chain, used only for VS/NAT.
* Check if packet is reply for established ip_vs_conn.
*/
static unsigned int
ip_vs_local_reply6(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip_vs_out(net_ipvs(state->net), state->hook, skb, AF_INET6);
}
#endif
static unsigned int static unsigned int
ip_vs_try_to_schedule(struct netns_ipvs *ipvs, int af, struct sk_buff *skb, ip_vs_try_to_schedule(struct netns_ipvs *ipvs, int af, struct sk_buff *skb,
struct ip_vs_proto_data *pd, struct ip_vs_proto_data *pd,
...@@ -1957,8 +1910,10 @@ static int ip_vs_in_icmp_v6(struct netns_ipvs *ipvs, struct sk_buff *skb, ...@@ -1957,8 +1910,10 @@ static int ip_vs_in_icmp_v6(struct netns_ipvs *ipvs, struct sk_buff *skb,
* and send it on its way... * and send it on its way...
*/ */
static unsigned int static unsigned int
ip_vs_in(struct netns_ipvs *ipvs, unsigned int hooknum, struct sk_buff *skb, int af) ip_vs_in_hook(void *priv, struct sk_buff *skb, const struct nf_hook_state *state)
{ {
struct netns_ipvs *ipvs = net_ipvs(state->net);
unsigned int hooknum = state->hook;
struct ip_vs_iphdr iph; struct ip_vs_iphdr iph;
struct ip_vs_protocol *pp; struct ip_vs_protocol *pp;
struct ip_vs_proto_data *pd; struct ip_vs_proto_data *pd;
...@@ -1966,6 +1921,7 @@ ip_vs_in(struct netns_ipvs *ipvs, unsigned int hooknum, struct sk_buff *skb, int ...@@ -1966,6 +1921,7 @@ ip_vs_in(struct netns_ipvs *ipvs, unsigned int hooknum, struct sk_buff *skb, int
int ret, pkts; int ret, pkts;
int conn_reuse_mode; int conn_reuse_mode;
struct sock *sk; struct sock *sk;
int af = state->pf;
/* Already marked as IPVS request or reply? */ /* Already marked as IPVS request or reply? */
if (skb->ipvs_property) if (skb->ipvs_property)
...@@ -2137,55 +2093,6 @@ ip_vs_in(struct netns_ipvs *ipvs, unsigned int hooknum, struct sk_buff *skb, int ...@@ -2137,55 +2093,6 @@ ip_vs_in(struct netns_ipvs *ipvs, unsigned int hooknum, struct sk_buff *skb, int
return ret; return ret;
} }
/*
* AF_INET handler in NF_INET_LOCAL_IN chain
* Schedule and forward packets from remote clients
*/
static unsigned int
ip_vs_remote_request4(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip_vs_in(net_ipvs(state->net), state->hook, skb, AF_INET);
}
/*
* AF_INET handler in NF_INET_LOCAL_OUT chain
* Schedule and forward packets from local clients
*/
static unsigned int
ip_vs_local_request4(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip_vs_in(net_ipvs(state->net), state->hook, skb, AF_INET);
}
#ifdef CONFIG_IP_VS_IPV6
/*
* AF_INET6 handler in NF_INET_LOCAL_IN chain
* Schedule and forward packets from remote clients
*/
static unsigned int
ip_vs_remote_request6(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip_vs_in(net_ipvs(state->net), state->hook, skb, AF_INET6);
}
/*
* AF_INET6 handler in NF_INET_LOCAL_OUT chain
* Schedule and forward packets from local clients
*/
static unsigned int
ip_vs_local_request6(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state)
{
return ip_vs_in(net_ipvs(state->net), state->hook, skb, AF_INET6);
}
#endif
/* /*
* It is hooked at the NF_INET_FORWARD chain, in order to catch ICMP * It is hooked at the NF_INET_FORWARD chain, in order to catch ICMP
* related packets destined for 0.0.0.0/0. * related packets destined for 0.0.0.0/0.
...@@ -2199,45 +2106,36 @@ static unsigned int ...@@ -2199,45 +2106,36 @@ static unsigned int
ip_vs_forward_icmp(void *priv, struct sk_buff *skb, ip_vs_forward_icmp(void *priv, struct sk_buff *skb,
const struct nf_hook_state *state) const struct nf_hook_state *state)
{ {
int r;
struct netns_ipvs *ipvs = net_ipvs(state->net); struct netns_ipvs *ipvs = net_ipvs(state->net);
int r;
if (ip_hdr(skb)->protocol != IPPROTO_ICMP)
return NF_ACCEPT;
/* ipvs enabled in this netns ? */ /* ipvs enabled in this netns ? */
if (unlikely(sysctl_backup_only(ipvs) || !ipvs->enable)) if (unlikely(sysctl_backup_only(ipvs) || !ipvs->enable))
return NF_ACCEPT; return NF_ACCEPT;
return ip_vs_in_icmp(ipvs, skb, &r, state->hook); if (state->pf == NFPROTO_IPV4) {
} if (ip_hdr(skb)->protocol != IPPROTO_ICMP)
return NF_ACCEPT;
#ifdef CONFIG_IP_VS_IPV6 #ifdef CONFIG_IP_VS_IPV6
static unsigned int } else {
ip_vs_forward_icmp_v6(void *priv, struct sk_buff *skb, struct ip_vs_iphdr iphdr;
const struct nf_hook_state *state)
{
int r;
struct netns_ipvs *ipvs = net_ipvs(state->net);
struct ip_vs_iphdr iphdr;
ip_vs_fill_iph_skb(AF_INET6, skb, false, &iphdr); ip_vs_fill_iph_skb(AF_INET6, skb, false, &iphdr);
if (iphdr.protocol != IPPROTO_ICMPV6)
return NF_ACCEPT;
/* ipvs enabled in this netns ? */ if (iphdr.protocol != IPPROTO_ICMPV6)
if (unlikely(sysctl_backup_only(ipvs) || !ipvs->enable)) return NF_ACCEPT;
return NF_ACCEPT;
return ip_vs_in_icmp_v6(ipvs, skb, &r, state->hook, &iphdr); return ip_vs_in_icmp_v6(ipvs, skb, &r, state->hook, &iphdr);
}
#endif #endif
}
return ip_vs_in_icmp(ipvs, skb, &r, state->hook);
}
static const struct nf_hook_ops ip_vs_ops4[] = { static const struct nf_hook_ops ip_vs_ops4[] = {
/* After packet filtering, change source only for VS/NAT */ /* After packet filtering, change source only for VS/NAT */
{ {
.hook = ip_vs_reply4, .hook = ip_vs_out_hook,
.pf = NFPROTO_IPV4, .pf = NFPROTO_IPV4,
.hooknum = NF_INET_LOCAL_IN, .hooknum = NF_INET_LOCAL_IN,
.priority = NF_IP_PRI_NAT_SRC - 2, .priority = NF_IP_PRI_NAT_SRC - 2,
...@@ -2246,21 +2144,21 @@ static const struct nf_hook_ops ip_vs_ops4[] = { ...@@ -2246,21 +2144,21 @@ static const struct nf_hook_ops ip_vs_ops4[] = {
* or VS/NAT(change destination), so that filtering rules can be * or VS/NAT(change destination), so that filtering rules can be
* applied to IPVS. */ * applied to IPVS. */
{ {
.hook = ip_vs_remote_request4, .hook = ip_vs_in_hook,
.pf = NFPROTO_IPV4, .pf = NFPROTO_IPV4,
.hooknum = NF_INET_LOCAL_IN, .hooknum = NF_INET_LOCAL_IN,
.priority = NF_IP_PRI_NAT_SRC - 1, .priority = NF_IP_PRI_NAT_SRC - 1,
}, },
/* Before ip_vs_in, change source only for VS/NAT */ /* Before ip_vs_in, change source only for VS/NAT */
{ {
.hook = ip_vs_local_reply4, .hook = ip_vs_out_hook,
.pf = NFPROTO_IPV4, .pf = NFPROTO_IPV4,
.hooknum = NF_INET_LOCAL_OUT, .hooknum = NF_INET_LOCAL_OUT,
.priority = NF_IP_PRI_NAT_DST + 1, .priority = NF_IP_PRI_NAT_DST + 1,
}, },
/* After mangle, schedule and forward local requests */ /* After mangle, schedule and forward local requests */
{ {
.hook = ip_vs_local_request4, .hook = ip_vs_in_hook,
.pf = NFPROTO_IPV4, .pf = NFPROTO_IPV4,
.hooknum = NF_INET_LOCAL_OUT, .hooknum = NF_INET_LOCAL_OUT,
.priority = NF_IP_PRI_NAT_DST + 2, .priority = NF_IP_PRI_NAT_DST + 2,
...@@ -2275,7 +2173,7 @@ static const struct nf_hook_ops ip_vs_ops4[] = { ...@@ -2275,7 +2173,7 @@ static const struct nf_hook_ops ip_vs_ops4[] = {
}, },
/* After packet filtering, change source only for VS/NAT */ /* After packet filtering, change source only for VS/NAT */
{ {
.hook = ip_vs_reply4, .hook = ip_vs_out_hook,
.pf = NFPROTO_IPV4, .pf = NFPROTO_IPV4,
.hooknum = NF_INET_FORWARD, .hooknum = NF_INET_FORWARD,
.priority = 100, .priority = 100,
...@@ -2286,7 +2184,7 @@ static const struct nf_hook_ops ip_vs_ops4[] = { ...@@ -2286,7 +2184,7 @@ static const struct nf_hook_ops ip_vs_ops4[] = {
static const struct nf_hook_ops ip_vs_ops6[] = { static const struct nf_hook_ops ip_vs_ops6[] = {
/* After packet filtering, change source only for VS/NAT */ /* After packet filtering, change source only for VS/NAT */
{ {
.hook = ip_vs_reply6, .hook = ip_vs_out_hook,
.pf = NFPROTO_IPV6, .pf = NFPROTO_IPV6,
.hooknum = NF_INET_LOCAL_IN, .hooknum = NF_INET_LOCAL_IN,
.priority = NF_IP6_PRI_NAT_SRC - 2, .priority = NF_IP6_PRI_NAT_SRC - 2,
...@@ -2295,21 +2193,21 @@ static const struct nf_hook_ops ip_vs_ops6[] = { ...@@ -2295,21 +2193,21 @@ static const struct nf_hook_ops ip_vs_ops6[] = {
* or VS/NAT(change destination), so that filtering rules can be * or VS/NAT(change destination), so that filtering rules can be
* applied to IPVS. */ * applied to IPVS. */
{ {
.hook = ip_vs_remote_request6, .hook = ip_vs_in_hook,
.pf = NFPROTO_IPV6, .pf = NFPROTO_IPV6,
.hooknum = NF_INET_LOCAL_IN, .hooknum = NF_INET_LOCAL_IN,
.priority = NF_IP6_PRI_NAT_SRC - 1, .priority = NF_IP6_PRI_NAT_SRC - 1,
}, },
/* Before ip_vs_in, change source only for VS/NAT */ /* Before ip_vs_in, change source only for VS/NAT */
{ {
.hook = ip_vs_local_reply6, .hook = ip_vs_out_hook,
.pf = NFPROTO_IPV6, .pf = NFPROTO_IPV6,
.hooknum = NF_INET_LOCAL_OUT, .hooknum = NF_INET_LOCAL_OUT,
.priority = NF_IP6_PRI_NAT_DST + 1, .priority = NF_IP6_PRI_NAT_DST + 1,
}, },
/* After mangle, schedule and forward local requests */ /* After mangle, schedule and forward local requests */
{ {
.hook = ip_vs_local_request6, .hook = ip_vs_in_hook,
.pf = NFPROTO_IPV6, .pf = NFPROTO_IPV6,
.hooknum = NF_INET_LOCAL_OUT, .hooknum = NF_INET_LOCAL_OUT,
.priority = NF_IP6_PRI_NAT_DST + 2, .priority = NF_IP6_PRI_NAT_DST + 2,
...@@ -2317,14 +2215,14 @@ static const struct nf_hook_ops ip_vs_ops6[] = { ...@@ -2317,14 +2215,14 @@ static const struct nf_hook_ops ip_vs_ops6[] = {
/* After packet filtering (but before ip_vs_out_icmp), catch icmp /* After packet filtering (but before ip_vs_out_icmp), catch icmp
* destined for 0.0.0.0/0, which is for incoming IPVS connections */ * destined for 0.0.0.0/0, which is for incoming IPVS connections */
{ {
.hook = ip_vs_forward_icmp_v6, .hook = ip_vs_forward_icmp,
.pf = NFPROTO_IPV6, .pf = NFPROTO_IPV6,
.hooknum = NF_INET_FORWARD, .hooknum = NF_INET_FORWARD,
.priority = 99, .priority = 99,
}, },
/* After packet filtering, change source only for VS/NAT */ /* After packet filtering, change source only for VS/NAT */
{ {
.hook = ip_vs_reply6, .hook = ip_vs_out_hook,
.pf = NFPROTO_IPV6, .pf = NFPROTO_IPV6,
.hooknum = NF_INET_FORWARD, .hooknum = NF_INET_FORWARD,
.priority = 100, .priority = 100,
......
...@@ -2017,6 +2017,12 @@ static struct ctl_table vs_vars[] = { ...@@ -2017,6 +2017,12 @@ static struct ctl_table vs_vars[] = {
.mode = 0644, .mode = 0644,
.proc_handler = proc_dointvec, .proc_handler = proc_dointvec,
}, },
{
.procname = "run_estimation",
.maxlen = sizeof(int),
.mode = 0644,
.proc_handler = proc_dointvec,
},
#ifdef CONFIG_IP_VS_DEBUG #ifdef CONFIG_IP_VS_DEBUG
{ {
.procname = "debug_level", .procname = "debug_level",
...@@ -4090,6 +4096,8 @@ static int __net_init ip_vs_control_net_init_sysctl(struct netns_ipvs *ipvs) ...@@ -4090,6 +4096,8 @@ static int __net_init ip_vs_control_net_init_sysctl(struct netns_ipvs *ipvs)
tbl[idx++].data = &ipvs->sysctl_conn_reuse_mode; tbl[idx++].data = &ipvs->sysctl_conn_reuse_mode;
tbl[idx++].data = &ipvs->sysctl_schedule_icmp; tbl[idx++].data = &ipvs->sysctl_schedule_icmp;
tbl[idx++].data = &ipvs->sysctl_ignore_tunneled; tbl[idx++].data = &ipvs->sysctl_ignore_tunneled;
ipvs->sysctl_run_estimation = 1;
tbl[idx++].data = &ipvs->sysctl_run_estimation;
ipvs->sysctl_hdr = register_net_sysctl(net, "net/ipv4/vs", tbl); ipvs->sysctl_hdr = register_net_sysctl(net, "net/ipv4/vs", tbl);
if (ipvs->sysctl_hdr == NULL) { if (ipvs->sysctl_hdr == NULL) {
......
...@@ -100,6 +100,9 @@ static void estimation_timer(struct timer_list *t) ...@@ -100,6 +100,9 @@ static void estimation_timer(struct timer_list *t)
u64 rate; u64 rate;
struct netns_ipvs *ipvs = from_timer(ipvs, t, est_timer); struct netns_ipvs *ipvs = from_timer(ipvs, t, est_timer);
if (!sysctl_run_estimation(ipvs))
goto skip;
spin_lock(&ipvs->est_lock); spin_lock(&ipvs->est_lock);
list_for_each_entry(e, &ipvs->est_list, list) { list_for_each_entry(e, &ipvs->est_list, list) {
s = container_of(e, struct ip_vs_stats, est); s = container_of(e, struct ip_vs_stats, est);
...@@ -131,6 +134,8 @@ static void estimation_timer(struct timer_list *t) ...@@ -131,6 +134,8 @@ static void estimation_timer(struct timer_list *t)
spin_unlock(&s->lock); spin_unlock(&s->lock);
} }
spin_unlock(&ipvs->est_lock); spin_unlock(&ipvs->est_lock);
skip:
mod_timer(&ipvs->est_timer, jiffies + 2*HZ); mod_timer(&ipvs->est_timer, jiffies + 2*HZ);
} }
......
...@@ -185,7 +185,7 @@ static const struct nf_hook_entries * ...@@ -185,7 +185,7 @@ static const struct nf_hook_entries *
nfnl_hook_entries_head(u8 pf, unsigned int hook, struct net *net, const char *dev) nfnl_hook_entries_head(u8 pf, unsigned int hook, struct net *net, const char *dev)
{ {
const struct nf_hook_entries *hook_head = NULL; const struct nf_hook_entries *hook_head = NULL;
#ifdef CONFIG_NETFILTER_INGRESS #if defined(CONFIG_NETFILTER_INGRESS) || defined(CONFIG_NETFILTER_EGRESS)
struct net_device *netdev; struct net_device *netdev;
#endif #endif
...@@ -221,9 +221,9 @@ nfnl_hook_entries_head(u8 pf, unsigned int hook, struct net *net, const char *de ...@@ -221,9 +221,9 @@ nfnl_hook_entries_head(u8 pf, unsigned int hook, struct net *net, const char *de
hook_head = rcu_dereference(net->nf.hooks_decnet[hook]); hook_head = rcu_dereference(net->nf.hooks_decnet[hook]);
break; break;
#endif #endif
#ifdef CONFIG_NETFILTER_INGRESS #if defined(CONFIG_NETFILTER_INGRESS) || defined(CONFIG_NETFILTER_EGRESS)
case NFPROTO_NETDEV: case NFPROTO_NETDEV:
if (hook != NF_NETDEV_INGRESS) if (hook >= NF_NETDEV_NUMHOOKS)
return ERR_PTR(-EOPNOTSUPP); return ERR_PTR(-EOPNOTSUPP);
if (!dev) if (!dev)
...@@ -233,7 +233,15 @@ nfnl_hook_entries_head(u8 pf, unsigned int hook, struct net *net, const char *de ...@@ -233,7 +233,15 @@ nfnl_hook_entries_head(u8 pf, unsigned int hook, struct net *net, const char *de
if (!netdev) if (!netdev)
return ERR_PTR(-ENODEV); return ERR_PTR(-ENODEV);
return rcu_dereference(netdev->nf_hooks_ingress); #ifdef CONFIG_NETFILTER_INGRESS
if (hook == NF_NETDEV_INGRESS)
return rcu_dereference(netdev->nf_hooks_ingress);
#endif
#ifdef CONFIG_NETFILTER_EGRESS
if (hook == NF_NETDEV_EGRESS)
return rcu_dereference(netdev->nf_hooks_egress);
#endif
fallthrough;
#endif #endif
default: default:
return ERR_PTR(-EPROTONOSUPPORT); return ERR_PTR(-EPROTONOSUPPORT);
......
...@@ -310,9 +310,11 @@ static const struct nft_chain_type nft_chain_filter_netdev = { ...@@ -310,9 +310,11 @@ static const struct nft_chain_type nft_chain_filter_netdev = {
.name = "filter", .name = "filter",
.type = NFT_CHAIN_T_DEFAULT, .type = NFT_CHAIN_T_DEFAULT,
.family = NFPROTO_NETDEV, .family = NFPROTO_NETDEV,
.hook_mask = (1 << NF_NETDEV_INGRESS), .hook_mask = (1 << NF_NETDEV_INGRESS) |
(1 << NF_NETDEV_EGRESS),
.hooks = { .hooks = {
[NF_NETDEV_INGRESS] = nft_do_chain_netdev, [NF_NETDEV_INGRESS] = nft_do_chain_netdev,
[NF_NETDEV_EGRESS] = nft_do_chain_netdev,
}, },
}; };
......
...@@ -198,17 +198,8 @@ static int nft_dynset_init(const struct nft_ctx *ctx, ...@@ -198,17 +198,8 @@ static int nft_dynset_init(const struct nft_ctx *ctx,
return -EBUSY; return -EBUSY;
priv->op = ntohl(nla_get_be32(tb[NFTA_DYNSET_OP])); priv->op = ntohl(nla_get_be32(tb[NFTA_DYNSET_OP]));
switch (priv->op) { if (priv->op > NFT_DYNSET_OP_DELETE)
case NFT_DYNSET_OP_ADD:
case NFT_DYNSET_OP_DELETE:
break;
case NFT_DYNSET_OP_UPDATE:
if (!(set->flags & NFT_SET_TIMEOUT))
return -EOPNOTSUPP;
break;
default:
return -EOPNOTSUPP; return -EOPNOTSUPP;
}
timeout = 0; timeout = 0;
if (tb[NFTA_DYNSET_TIMEOUT] != NULL) { if (tb[NFTA_DYNSET_TIMEOUT] != NULL) {
......
...@@ -91,6 +91,7 @@ ...@@ -91,6 +91,7 @@
#endif #endif
#include <linux/bpf.h> #include <linux/bpf.h>
#include <net/compat.h> #include <net/compat.h>
#include <linux/netfilter_netdev.h>
#include "internal.h" #include "internal.h"
...@@ -241,8 +242,42 @@ struct packet_skb_cb { ...@@ -241,8 +242,42 @@ struct packet_skb_cb {
static void __fanout_unlink(struct sock *sk, struct packet_sock *po); static void __fanout_unlink(struct sock *sk, struct packet_sock *po);
static void __fanout_link(struct sock *sk, struct packet_sock *po); static void __fanout_link(struct sock *sk, struct packet_sock *po);
#ifdef CONFIG_NETFILTER_EGRESS
static noinline struct sk_buff *nf_hook_direct_egress(struct sk_buff *skb)
{
struct sk_buff *next, *head = NULL, *tail;
int rc;
rcu_read_lock();
for (; skb != NULL; skb = next) {
next = skb->next;
skb_mark_not_on_list(skb);
if (!nf_hook_egress(skb, &rc, skb->dev))
continue;
if (!head)
head = skb;
else
tail->next = skb;
tail = skb;
}
rcu_read_unlock();
return head;
}
#endif
static int packet_direct_xmit(struct sk_buff *skb) static int packet_direct_xmit(struct sk_buff *skb)
{ {
#ifdef CONFIG_NETFILTER_EGRESS
if (nf_hook_egress_active()) {
skb = nf_hook_direct_egress(skb);
if (!skb)
return NET_XMIT_DROP;
}
#endif
return dev_direct_xmit(skb, packet_pick_tx_queue(skb)); return dev_direct_xmit(skb, packet_pick_tx_queue(skb));
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment