net: add CONFIG_NET_INGRESS to enable ingress filtering
[deliverable/linux.git] / net / netfilter / core.c
CommitLineData
601e68e1 1/* netfilter.c: look after the filters for various protocols.
f6ebe77f
HW
2 * Heavily influenced by the old firewall.c by David Bonn and Alan Cox.
3 *
4 * Thanks to Rob `CmdrTaco' Malda for not influencing this code in any
5 * way.
6 *
7 * Rusty Russell (C)2000 -- This code is GPL.
f229f6ce 8 * Patrick McHardy (c) 2006-2012
f6ebe77f 9 */
f6ebe77f
HW
10#include <linux/kernel.h>
11#include <linux/netfilter.h>
12#include <net/protocol.h>
13#include <linux/init.h>
14#include <linux/skbuff.h>
15#include <linux/wait.h>
16#include <linux/module.h>
17#include <linux/interrupt.h>
18#include <linux/if.h>
19#include <linux/netdevice.h>
56768644 20#include <linux/netfilter_ipv6.h>
f6ebe77f
HW
21#include <linux/inetdevice.h>
22#include <linux/proc_fs.h>
d486dd1f 23#include <linux/mutex.h>
5a0e3ad6 24#include <linux/slab.h>
457c4cbc 25#include <net/net_namespace.h>
f6ebe77f
HW
26#include <net/sock.h>
27
28#include "nf_internals.h"
29
/* Held while nf_register_afinfo()/nf_unregister_afinfo() update nf_afinfo[]. */
d486dd1f 30static DEFINE_MUTEX(afinfo_mutex);
bce8032e 31
/* Per-family nf_afinfo pointers, indexed by afinfo->family. A slot is set by
 * nf_register_afinfo() and reset to NULL by nf_unregister_afinfo(). */
0906a372 32const struct nf_afinfo __rcu *nf_afinfo[NFPROTO_NUMPROTO] __read_mostly;
bce8032e 33EXPORT_SYMBOL(nf_afinfo);
2a7851bf
FW
/* NOTE(review): never written in this part of the file; presumably installed
 * by the IPv6 netfilter code -- confirm against its users. */
34const struct nf_ipv6_ops __rcu *nf_ipv6_ops __read_mostly;
35EXPORT_SYMBOL_GPL(nf_ipv6_ops);
bce8032e 36
1e796fda 37int nf_register_afinfo(const struct nf_afinfo *afinfo)
bce8032e 38{
7926dbfa 39 mutex_lock(&afinfo_mutex);
a9b3cd7f 40 RCU_INIT_POINTER(nf_afinfo[afinfo->family], afinfo);
d486dd1f 41 mutex_unlock(&afinfo_mutex);
bce8032e
PM
42 return 0;
43}
44EXPORT_SYMBOL_GPL(nf_register_afinfo);
45
1e796fda 46void nf_unregister_afinfo(const struct nf_afinfo *afinfo)
bce8032e 47{
d486dd1f 48 mutex_lock(&afinfo_mutex);
a9b3cd7f 49 RCU_INIT_POINTER(nf_afinfo[afinfo->family], NULL);
d486dd1f 50 mutex_unlock(&afinfo_mutex);
bce8032e
PM
51 synchronize_rcu();
52}
53EXPORT_SYMBOL_GPL(nf_unregister_afinfo);
54
/* Hook lists, one per [protocol family][hook number]. nf_register_hook()
 * inserts entries so that each list stays sorted by ascending priority. */
7e9c6eeb 55struct list_head nf_hooks[NFPROTO_NUMPROTO][NF_MAX_HOOKS] __read_mostly;
f6ebe77f 56EXPORT_SYMBOL(nf_hooks);
a2d7ec58 57
d1c85c2e 58#ifdef HAVE_JUMP_LABEL
/* One static key per hook list: incremented when a hook is registered on that
 * list and decremented when one is unregistered. */
c5905afb 59struct static_key nf_hooks_needed[NFPROTO_NUMPROTO][NF_MAX_HOOKS];
a2d7ec58
ED
60EXPORT_SYMBOL(nf_hooks_needed);
61#endif
62
/* Held while entries are added to or removed from the nf_hooks lists. */
fd706d69 63static DEFINE_MUTEX(nf_hook_mutex);
f6ebe77f
HW
64
65int nf_register_hook(struct nf_hook_ops *reg)
66{
4c610979 67 struct nf_hook_ops *elem;
f6ebe77f 68
7926dbfa 69 mutex_lock(&nf_hook_mutex);
4c610979
LZ
70 list_for_each_entry(elem, &nf_hooks[reg->pf][reg->hooknum], list) {
71 if (reg->priority < elem->priority)
f6ebe77f
HW
72 break;
73 }
4c610979 74 list_add_rcu(&reg->list, elem->list.prev);
fd706d69 75 mutex_unlock(&nf_hook_mutex);
d1c85c2e 76#ifdef HAVE_JUMP_LABEL
c5905afb 77 static_key_slow_inc(&nf_hooks_needed[reg->pf][reg->hooknum]);
a2d7ec58 78#endif
f6ebe77f
HW
79 return 0;
80}
81EXPORT_SYMBOL(nf_register_hook);
82
83void nf_unregister_hook(struct nf_hook_ops *reg)
84{
fd706d69 85 mutex_lock(&nf_hook_mutex);
f6ebe77f 86 list_del_rcu(&reg->list);
fd706d69 87 mutex_unlock(&nf_hook_mutex);
d1c85c2e 88#ifdef HAVE_JUMP_LABEL
c5905afb 89 static_key_slow_dec(&nf_hooks_needed[reg->pf][reg->hooknum]);
a2d7ec58 90#endif
f6ebe77f
HW
91 synchronize_net();
92}
93EXPORT_SYMBOL(nf_unregister_hook);
94
972d1cb1
PM
95int nf_register_hooks(struct nf_hook_ops *reg, unsigned int n)
96{
97 unsigned int i;
98 int err = 0;
99
100 for (i = 0; i < n; i++) {
101 err = nf_register_hook(&reg[i]);
102 if (err)
103 goto err;
104 }
105 return err;
106
107err:
108 if (i > 0)
109 nf_unregister_hooks(reg, i);
110 return err;
111}
112EXPORT_SYMBOL(nf_register_hooks);
113
114void nf_unregister_hooks(struct nf_hook_ops *reg, unsigned int n)
115{
f68c5301
CG
116 while (n-- > 0)
117 nf_unregister_hook(&reg[n]);
972d1cb1
PM
118}
119EXPORT_SYMBOL(nf_unregister_hooks);
120
f6ebe77f 121unsigned int nf_iterate(struct list_head *head,
3db05fea 122 struct sk_buff *skb,
cfdfab31
DM
123 struct nf_hook_state *state,
124 struct nf_hook_ops **elemp)
f6ebe77f
HW
125{
126 unsigned int verdict;
127
128 /*
129 * The caller must not block between calls to this
130 * function because of risk of continuing from deleted element.
131 */
2a6decfd 132 list_for_each_entry_continue_rcu((*elemp), head, list) {
cfdfab31 133 if (state->thresh > (*elemp)->priority)
f6ebe77f
HW
134 continue;
135
136 /* Optimization: we don't need to hold module
601e68e1 137 reference here, since function can't sleep. --RR */
de9963f0 138repeat:
238e54c9 139 verdict = (*elemp)->hook(*elemp, skb, state);
f6ebe77f
HW
140 if (verdict != NF_ACCEPT) {
141#ifdef CONFIG_NETFILTER_DEBUG
142 if (unlikely((verdict & NF_VERDICT_MASK)
143 > NF_MAX_VERDICT)) {
144 NFDEBUG("Evil return from %p(%u).\n",
cfdfab31 145 (*elemp)->hook, state->hook);
f6ebe77f
HW
146 continue;
147 }
148#endif
2a6decfd 149 if (verdict != NF_REPEAT)
f6ebe77f 150 return verdict;
de9963f0 151 goto repeat;
f6ebe77f
HW
152 }
153 }
154 return NF_ACCEPT;
155}
156
157
158/* Returns 1 if okfn() needs to be executed by the caller,
159 * -EPERM for NF_DROP, 0 otherwise. */
cfdfab31 160int nf_hook_slow(struct sk_buff *skb, struct nf_hook_state *state)
f6ebe77f 161{
2a6decfd 162 struct nf_hook_ops *elem;
f6ebe77f
HW
163 unsigned int verdict;
164 int ret = 0;
165
166 /* We may already have this, but read-locks nest anyway */
167 rcu_read_lock();
168
f7191483 169 elem = list_entry_rcu(state->hook_list, struct nf_hook_ops, list);
f6ebe77f 170next_hook:
f7191483 171 verdict = nf_iterate(state->hook_list, skb, state, &elem);
f6ebe77f
HW
172 if (verdict == NF_ACCEPT || verdict == NF_STOP) {
173 ret = 1;
da683650 174 } else if ((verdict & NF_VERDICT_MASK) == NF_DROP) {
3db05fea 175 kfree_skb(skb);
f615df76 176 ret = NF_DROP_GETERR(verdict);
da683650
EP
177 if (ret == 0)
178 ret = -EPERM;
f9c63990 179 } else if ((verdict & NF_VERDICT_MASK) == NF_QUEUE) {
cfdfab31
DM
180 int err = nf_queue(skb, elem, state,
181 verdict >> NF_VERDICT_QBITS);
563e1232
FW
182 if (err < 0) {
183 if (err == -ECANCELED)
06cdb634 184 goto next_hook;
563e1232 185 if (err == -ESRCH &&
94b27cc3
FW
186 (verdict & NF_VERDICT_FLAG_QUEUE_BYPASS))
187 goto next_hook;
06cdb634
FW
188 kfree_skb(skb);
189 }
f6ebe77f 190 }
f6ebe77f
HW
191 rcu_read_unlock();
192 return ret;
193}
194EXPORT_SYMBOL(nf_hook_slow);
195
196
37d41879 197int skb_make_writable(struct sk_buff *skb, unsigned int writable_len)
f6ebe77f 198{
37d41879 199 if (writable_len > skb->len)
f6ebe77f
HW
200 return 0;
201
202 /* Not exclusive use of packet? Must copy. */
37d41879
HX
203 if (!skb_cloned(skb)) {
204 if (writable_len <= skb_headlen(skb))
205 return 1;
206 } else if (skb_clone_writable(skb, writable_len))
207 return 1;
208
209 if (writable_len <= skb_headlen(skb))
210 writable_len = 0;
211 else
212 writable_len -= skb_headlen(skb);
213
214 return !!__pskb_pull_tail(skb, writable_len);
f6ebe77f
HW
215}
216EXPORT_SYMBOL(skb_make_writable);
217
c0cd1156 218#if IS_ENABLED(CONFIG_NF_CONNTRACK)
f6ebe77f
HW
219/* This does not belong here, but locally generated errors need it if connection
220 tracking in use: without this, connection may not be in hash table, and hence
221 manufactured ICMP or RST packets will not be associated with it. */
312a0c16
PM
222void (*ip_ct_attach)(struct sk_buff *, const struct sk_buff *)
223 __rcu __read_mostly;
f6ebe77f
HW
224EXPORT_SYMBOL(ip_ct_attach);
225
312a0c16 226void nf_ct_attach(struct sk_buff *new, const struct sk_buff *skb)
f6ebe77f 227{
312a0c16 228 void (*attach)(struct sk_buff *, const struct sk_buff *);
f6ebe77f 229
c3a47ab3
PM
230 if (skb->nfct) {
231 rcu_read_lock();
232 attach = rcu_dereference(ip_ct_attach);
233 if (attach)
234 attach(new, skb);
235 rcu_read_unlock();
f6ebe77f
HW
236 }
237}
238EXPORT_SYMBOL(nf_ct_attach);
de6e05c4 239
/* Destructor callback invoked by nf_conntrack_destroy(), which BUG()s if
 * this pointer is still NULL when it runs. */
0e60ebe0 240void (*nf_ct_destroy)(struct nf_conntrack *) __rcu __read_mostly;
de6e05c4
YK
241EXPORT_SYMBOL(nf_ct_destroy);
242
243void nf_conntrack_destroy(struct nf_conntrack *nfct)
244{
245 void (*destroy)(struct nf_conntrack *);
246
247 rcu_read_lock();
248 destroy = rcu_dereference(nf_ct_destroy);
249 BUG_ON(destroy == NULL);
250 destroy(nfct);
251 rcu_read_unlock();
252}
253EXPORT_SYMBOL(nf_conntrack_destroy);
9cb01766 254
/* NOTE(review): nothing in this part of the file reads or writes this
 * pointer; presumably installed by the conntrack side for the queueing
 * code -- confirm against its users. */
5a05fae5 255struct nfq_ct_hook __rcu *nfq_ct_hook __read_mostly;
9cb01766
PNA
256EXPORT_SYMBOL_GPL(nfq_ct_hook);
257
d584a61a
PNA
/* NOTE(review): likewise unreferenced here; presumably the NAT counterpart
 * of nfq_ct_hook -- confirm. */
258struct nfq_ct_nat_hook __rcu *nfq_ct_nat_hook __read_mostly;
259EXPORT_SYMBOL_GPL(nfq_ct_nat_hook);
260
de6e05c4 261#endif /* CONFIG_NF_CONNTRACK */
f6ebe77f 262
c7232c99
PM
263#ifdef CONFIG_NF_NAT_NEEDED
/* Exported callback pointer, only built with CONFIG_NF_NAT_NEEDED.
 * NOTE(review): not referenced elsewhere in this part of the file;
 * presumably set by the NAT code -- confirm. */
264void (*nf_nat_decode_session_hook)(struct sk_buff *, struct flowi *);
265EXPORT_SYMBOL(nf_nat_decode_session_hook);
266#endif
267
f3c1a44a
G
268static int __net_init netfilter_net_init(struct net *net)
269{
270#ifdef CONFIG_PROC_FS
271 net->nf.proc_netfilter = proc_net_mkdir(net, "netfilter",
272 net->proc_net);
12202fa7
PNA
273 if (!net->nf.proc_netfilter) {
274 if (!net_eq(net, &init_net))
275 pr_err("cannot create netfilter proc entry");
276
f3c1a44a
G
277 return -ENOMEM;
278 }
279#endif
280 return 0;
281}
282
283static void __net_exit netfilter_net_exit(struct net *net)
284{
285 remove_proc_entry("netfilter", net->proc_net);
286}
287
/* Per-network-namespace init/exit callbacks; registered by netfilter_init(). */
288static struct pernet_operations netfilter_net_ops = {
289 .init = netfilter_net_init,
290 .exit = netfilter_net_exit,
291};
292
6d11cfdb 293int __init netfilter_init(void)
f6ebe77f 294{
6d11cfdb
PNA
295 int i, h, ret;
296
7e9c6eeb 297 for (i = 0; i < ARRAY_SIZE(nf_hooks); i++) {
f6ebe77f
HW
298 for (h = 0; h < NF_MAX_HOOKS; h++)
299 INIT_LIST_HEAD(&nf_hooks[i][h]);
300 }
301
6d11cfdb
PNA
302 ret = register_pernet_subsys(&netfilter_net_ops);
303 if (ret < 0)
304 goto err;
305
306 ret = netfilter_log_init();
307 if (ret < 0)
308 goto err_pernet;
f6ebe77f 309
6d11cfdb
PNA
310 return 0;
311err_pernet:
312 unregister_pernet_subsys(&netfilter_net_ops);
313err:
314 return ret;
f6ebe77f 315}
This page took 0.985567 seconds and 5 git commands to generate.