perf tools: Don't clone maps from parent when synthesizing forks
[linux/fpc-iii.git] / net / netfilter / nf_queue.c
blobd67a96a25a681e4ff99c3873cee6d856e3604812
1 /*
2 * Rusty Russell (C)2000 -- This code is GPL.
3 * Patrick McHardy (c) 2006-2012
4 */
6 #include <linux/kernel.h>
7 #include <linux/slab.h>
8 #include <linux/init.h>
9 #include <linux/module.h>
10 #include <linux/proc_fs.h>
11 #include <linux/skbuff.h>
12 #include <linux/netfilter.h>
13 #include <linux/netfilter_ipv4.h>
14 #include <linux/netfilter_ipv6.h>
15 #include <linux/netfilter_bridge.h>
16 #include <linux/seq_file.h>
17 #include <linux/rcupdate.h>
18 #include <net/protocol.h>
19 #include <net/netfilter/nf_queue.h>
20 #include <net/dst.h>
22 #include "nf_internals.h"
25 * Hook for nfnetlink_queue to register its queue handler.
26 * We do this so that most of the NFQUEUE code can be modular.
28 * Once the queue is registered it must reinject all packets it
29 * receives, no matter what.
32 /* return EBUSY when somebody else is registered, return EEXIST if the
33 * same handler is registered, return 0 in case of success. */
34 void nf_register_queue_handler(struct net *net, const struct nf_queue_handler *qh)
36 /* should never happen, we only have one queueing backend in kernel */
37 WARN_ON(rcu_access_pointer(net->nf.queue_handler));
38 rcu_assign_pointer(net->nf.queue_handler, qh);
40 EXPORT_SYMBOL(nf_register_queue_handler);
42 /* The caller must flush their queue before this */
43 void nf_unregister_queue_handler(struct net *net)
45 RCU_INIT_POINTER(net->nf.queue_handler, NULL);
47 EXPORT_SYMBOL(nf_unregister_queue_handler);
49 void nf_queue_entry_release_refs(struct nf_queue_entry *entry)
51 struct nf_hook_state *state = &entry->state;
53 /* Release those devices we held, or Alexey will kill me. */
54 if (state->in)
55 dev_put(state->in);
56 if (state->out)
57 dev_put(state->out);
58 if (state->sk)
59 sock_put(state->sk);
60 #if IS_ENABLED(CONFIG_BRIDGE_NETFILTER)
61 if (entry->skb->nf_bridge) {
62 struct net_device *physdev;
64 physdev = nf_bridge_get_physindev(entry->skb);
65 if (physdev)
66 dev_put(physdev);
67 physdev = nf_bridge_get_physoutdev(entry->skb);
68 if (physdev)
69 dev_put(physdev);
71 #endif
73 EXPORT_SYMBOL_GPL(nf_queue_entry_release_refs);
75 /* Bump dev refs so they don't vanish while packet is out */
76 void nf_queue_entry_get_refs(struct nf_queue_entry *entry)
78 struct nf_hook_state *state = &entry->state;
80 if (state->in)
81 dev_hold(state->in);
82 if (state->out)
83 dev_hold(state->out);
84 if (state->sk)
85 sock_hold(state->sk);
86 #if IS_ENABLED(CONFIG_BRIDGE_NETFILTER)
87 if (entry->skb->nf_bridge) {
88 struct net_device *physdev;
90 physdev = nf_bridge_get_physindev(entry->skb);
91 if (physdev)
92 dev_hold(physdev);
93 physdev = nf_bridge_get_physoutdev(entry->skb);
94 if (physdev)
95 dev_hold(physdev);
97 #endif
99 EXPORT_SYMBOL_GPL(nf_queue_entry_get_refs);
101 void nf_queue_nf_hook_drop(struct net *net)
103 const struct nf_queue_handler *qh;
105 rcu_read_lock();
106 qh = rcu_dereference(net->nf.queue_handler);
107 if (qh)
108 qh->nf_hook_drop(net);
109 rcu_read_unlock();
111 EXPORT_SYMBOL_GPL(nf_queue_nf_hook_drop);
113 static void nf_ip_saveroute(const struct sk_buff *skb,
114 struct nf_queue_entry *entry)
116 struct ip_rt_info *rt_info = nf_queue_entry_reroute(entry);
118 if (entry->state.hook == NF_INET_LOCAL_OUT) {
119 const struct iphdr *iph = ip_hdr(skb);
121 rt_info->tos = iph->tos;
122 rt_info->daddr = iph->daddr;
123 rt_info->saddr = iph->saddr;
124 rt_info->mark = skb->mark;
128 static void nf_ip6_saveroute(const struct sk_buff *skb,
129 struct nf_queue_entry *entry)
131 struct ip6_rt_info *rt_info = nf_queue_entry_reroute(entry);
133 if (entry->state.hook == NF_INET_LOCAL_OUT) {
134 const struct ipv6hdr *iph = ipv6_hdr(skb);
136 rt_info->daddr = iph->daddr;
137 rt_info->saddr = iph->saddr;
138 rt_info->mark = skb->mark;
142 static int __nf_queue(struct sk_buff *skb, const struct nf_hook_state *state,
143 const struct nf_hook_entries *entries,
144 unsigned int index, unsigned int queuenum)
146 int status = -ENOENT;
147 struct nf_queue_entry *entry = NULL;
148 const struct nf_queue_handler *qh;
149 struct net *net = state->net;
150 unsigned int route_key_size;
152 /* QUEUE == DROP if no one is waiting, to be safe. */
153 qh = rcu_dereference(net->nf.queue_handler);
154 if (!qh) {
155 status = -ESRCH;
156 goto err;
159 switch (state->pf) {
160 case AF_INET:
161 route_key_size = sizeof(struct ip_rt_info);
162 break;
163 case AF_INET6:
164 route_key_size = sizeof(struct ip6_rt_info);
165 break;
166 default:
167 route_key_size = 0;
168 break;
171 entry = kmalloc(sizeof(*entry) + route_key_size, GFP_ATOMIC);
172 if (!entry) {
173 status = -ENOMEM;
174 goto err;
177 *entry = (struct nf_queue_entry) {
178 .skb = skb,
179 .state = *state,
180 .hook_index = index,
181 .size = sizeof(*entry) + route_key_size,
184 nf_queue_entry_get_refs(entry);
185 skb_dst_force(skb);
187 switch (entry->state.pf) {
188 case AF_INET:
189 nf_ip_saveroute(skb, entry);
190 break;
191 case AF_INET6:
192 nf_ip6_saveroute(skb, entry);
193 break;
196 status = qh->outfn(entry, queuenum);
198 if (status < 0) {
199 nf_queue_entry_release_refs(entry);
200 goto err;
203 return 0;
205 err:
206 kfree(entry);
207 return status;
210 /* Packets leaving via this function must come back through nf_reinject(). */
211 int nf_queue(struct sk_buff *skb, struct nf_hook_state *state,
212 const struct nf_hook_entries *entries, unsigned int index,
213 unsigned int verdict)
215 int ret;
217 ret = __nf_queue(skb, state, entries, index, verdict >> NF_VERDICT_QBITS);
218 if (ret < 0) {
219 if (ret == -ESRCH &&
220 (verdict & NF_VERDICT_FLAG_QUEUE_BYPASS))
221 return 1;
222 kfree_skb(skb);
225 return 0;
228 static unsigned int nf_iterate(struct sk_buff *skb,
229 struct nf_hook_state *state,
230 const struct nf_hook_entries *hooks,
231 unsigned int *index)
233 const struct nf_hook_entry *hook;
234 unsigned int verdict, i = *index;
236 while (i < hooks->num_hook_entries) {
237 hook = &hooks->hooks[i];
238 repeat:
239 verdict = nf_hook_entry_hookfn(hook, skb, state);
240 if (verdict != NF_ACCEPT) {
241 if (verdict != NF_REPEAT)
242 return verdict;
243 goto repeat;
245 i++;
248 *index = i;
249 return NF_ACCEPT;
252 static struct nf_hook_entries *nf_hook_entries_head(const struct net *net, u8 pf, u8 hooknum)
254 switch (pf) {
255 #ifdef CONFIG_NETFILTER_FAMILY_BRIDGE
256 case NFPROTO_BRIDGE:
257 return rcu_dereference(net->nf.hooks_bridge[hooknum]);
258 #endif
259 case NFPROTO_IPV4:
260 return rcu_dereference(net->nf.hooks_ipv4[hooknum]);
261 case NFPROTO_IPV6:
262 return rcu_dereference(net->nf.hooks_ipv6[hooknum]);
263 default:
264 WARN_ON_ONCE(1);
265 return NULL;
268 return NULL;
271 /* Caller must hold rcu read-side lock */
272 void nf_reinject(struct nf_queue_entry *entry, unsigned int verdict)
274 const struct nf_hook_entry *hook_entry;
275 const struct nf_hook_entries *hooks;
276 struct sk_buff *skb = entry->skb;
277 const struct net *net;
278 unsigned int i;
279 int err;
280 u8 pf;
282 net = entry->state.net;
283 pf = entry->state.pf;
285 hooks = nf_hook_entries_head(net, pf, entry->state.hook);
287 nf_queue_entry_release_refs(entry);
289 i = entry->hook_index;
290 if (WARN_ON_ONCE(!hooks || i >= hooks->num_hook_entries)) {
291 kfree_skb(skb);
292 kfree(entry);
293 return;
296 hook_entry = &hooks->hooks[i];
298 /* Continue traversal iff userspace said ok... */
299 if (verdict == NF_REPEAT)
300 verdict = nf_hook_entry_hookfn(hook_entry, skb, &entry->state);
302 if (verdict == NF_ACCEPT) {
303 if (nf_reroute(skb, entry) < 0)
304 verdict = NF_DROP;
307 if (verdict == NF_ACCEPT) {
308 next_hook:
309 ++i;
310 verdict = nf_iterate(skb, &entry->state, hooks, &i);
313 switch (verdict & NF_VERDICT_MASK) {
314 case NF_ACCEPT:
315 case NF_STOP:
316 local_bh_disable();
317 entry->state.okfn(entry->state.net, entry->state.sk, skb);
318 local_bh_enable();
319 break;
320 case NF_QUEUE:
321 err = nf_queue(skb, &entry->state, hooks, i, verdict);
322 if (err == 1)
323 goto next_hook;
324 break;
325 case NF_STOLEN:
326 break;
327 default:
328 kfree_skb(skb);
331 kfree(entry);
333 EXPORT_SYMBOL(nf_reinject);