Merge tag 'pci-v4.21-changes' of git://git.kernel.org/pub/scm/linux/kernel/git/helgaa...
[linux] / net / netfilter / nf_queue.c
1 /*
2  * Rusty Russell (C)2000 -- This code is GPL.
3  * Patrick McHardy (c) 2006-2012
4  */
5
6 #include <linux/kernel.h>
7 #include <linux/slab.h>
8 #include <linux/init.h>
9 #include <linux/module.h>
10 #include <linux/proc_fs.h>
11 #include <linux/skbuff.h>
12 #include <linux/netfilter.h>
13 #include <linux/netfilter_ipv4.h>
14 #include <linux/netfilter_ipv6.h>
15 #include <linux/netfilter_bridge.h>
16 #include <linux/seq_file.h>
17 #include <linux/rcupdate.h>
18 #include <net/protocol.h>
19 #include <net/netfilter/nf_queue.h>
20 #include <net/dst.h>
21
22 #include "nf_internals.h"
23
24 /*
25  * Hook for nfnetlink_queue to register its queue handler.
26  * We do this so that most of the NFQUEUE code can be modular.
27  *
28  * Once the queue is registered it must reinject all packets it
29  * receives, no matter what.
30  */
31
32 /* return EBUSY when somebody else is registered, return EEXIST if the
33  * same handler is registered, return 0 in case of success. */
34 void nf_register_queue_handler(struct net *net, const struct nf_queue_handler *qh)
35 {
36         /* should never happen, we only have one queueing backend in kernel */
37         WARN_ON(rcu_access_pointer(net->nf.queue_handler));
38         rcu_assign_pointer(net->nf.queue_handler, qh);
39 }
40 EXPORT_SYMBOL(nf_register_queue_handler);
41
42 /* The caller must flush their queue before this */
43 void nf_unregister_queue_handler(struct net *net)
44 {
45         RCU_INIT_POINTER(net->nf.queue_handler, NULL);
46 }
47 EXPORT_SYMBOL(nf_unregister_queue_handler);
48
49 static void nf_queue_entry_release_br_nf_refs(struct sk_buff *skb)
50 {
51 #if IS_ENABLED(CONFIG_BRIDGE_NETFILTER)
52         struct nf_bridge_info *nf_bridge = nf_bridge_info_get(skb);
53
54         if (nf_bridge) {
55                 struct net_device *physdev;
56
57                 physdev = nf_bridge_get_physindev(skb);
58                 if (physdev)
59                         dev_put(physdev);
60                 physdev = nf_bridge_get_physoutdev(skb);
61                 if (physdev)
62                         dev_put(physdev);
63         }
64 #endif
65 }
66
67 void nf_queue_entry_release_refs(struct nf_queue_entry *entry)
68 {
69         struct nf_hook_state *state = &entry->state;
70
71         /* Release those devices we held, or Alexey will kill me. */
72         if (state->in)
73                 dev_put(state->in);
74         if (state->out)
75                 dev_put(state->out);
76         if (state->sk)
77                 sock_put(state->sk);
78
79         nf_queue_entry_release_br_nf_refs(entry->skb);
80 }
81 EXPORT_SYMBOL_GPL(nf_queue_entry_release_refs);
82
83 static void nf_queue_entry_get_br_nf_refs(struct sk_buff *skb)
84 {
85 #if IS_ENABLED(CONFIG_BRIDGE_NETFILTER)
86         struct nf_bridge_info *nf_bridge = nf_bridge_info_get(skb);
87
88         if (nf_bridge) {
89                 struct net_device *physdev;
90
91                 physdev = nf_bridge_get_physindev(skb);
92                 if (physdev)
93                         dev_hold(physdev);
94                 physdev = nf_bridge_get_physoutdev(skb);
95                 if (physdev)
96                         dev_hold(physdev);
97         }
98 #endif
99 }
100
101 /* Bump dev refs so they don't vanish while packet is out */
102 void nf_queue_entry_get_refs(struct nf_queue_entry *entry)
103 {
104         struct nf_hook_state *state = &entry->state;
105
106         if (state->in)
107                 dev_hold(state->in);
108         if (state->out)
109                 dev_hold(state->out);
110         if (state->sk)
111                 sock_hold(state->sk);
112
113         nf_queue_entry_get_br_nf_refs(entry->skb);
114 }
115 EXPORT_SYMBOL_GPL(nf_queue_entry_get_refs);
116
117 void nf_queue_nf_hook_drop(struct net *net)
118 {
119         const struct nf_queue_handler *qh;
120
121         rcu_read_lock();
122         qh = rcu_dereference(net->nf.queue_handler);
123         if (qh)
124                 qh->nf_hook_drop(net);
125         rcu_read_unlock();
126 }
127 EXPORT_SYMBOL_GPL(nf_queue_nf_hook_drop);
128
129 static void nf_ip_saveroute(const struct sk_buff *skb,
130                             struct nf_queue_entry *entry)
131 {
132         struct ip_rt_info *rt_info = nf_queue_entry_reroute(entry);
133
134         if (entry->state.hook == NF_INET_LOCAL_OUT) {
135                 const struct iphdr *iph = ip_hdr(skb);
136
137                 rt_info->tos = iph->tos;
138                 rt_info->daddr = iph->daddr;
139                 rt_info->saddr = iph->saddr;
140                 rt_info->mark = skb->mark;
141         }
142 }
143
144 static void nf_ip6_saveroute(const struct sk_buff *skb,
145                              struct nf_queue_entry *entry)
146 {
147         struct ip6_rt_info *rt_info = nf_queue_entry_reroute(entry);
148
149         if (entry->state.hook == NF_INET_LOCAL_OUT) {
150                 const struct ipv6hdr *iph = ipv6_hdr(skb);
151
152                 rt_info->daddr = iph->daddr;
153                 rt_info->saddr = iph->saddr;
154                 rt_info->mark = skb->mark;
155         }
156 }
157
158 static int __nf_queue(struct sk_buff *skb, const struct nf_hook_state *state,
159                       const struct nf_hook_entries *entries,
160                       unsigned int index, unsigned int queuenum)
161 {
162         int status = -ENOENT;
163         struct nf_queue_entry *entry = NULL;
164         const struct nf_queue_handler *qh;
165         struct net *net = state->net;
166         unsigned int route_key_size;
167
168         /* QUEUE == DROP if no one is waiting, to be safe. */
169         qh = rcu_dereference(net->nf.queue_handler);
170         if (!qh) {
171                 status = -ESRCH;
172                 goto err;
173         }
174
175         switch (state->pf) {
176         case AF_INET:
177                 route_key_size = sizeof(struct ip_rt_info);
178                 break;
179         case AF_INET6:
180                 route_key_size = sizeof(struct ip6_rt_info);
181                 break;
182         default:
183                 route_key_size = 0;
184                 break;
185         }
186
187         entry = kmalloc(sizeof(*entry) + route_key_size, GFP_ATOMIC);
188         if (!entry) {
189                 status = -ENOMEM;
190                 goto err;
191         }
192
193         *entry = (struct nf_queue_entry) {
194                 .skb    = skb,
195                 .state  = *state,
196                 .hook_index = index,
197                 .size   = sizeof(*entry) + route_key_size,
198         };
199
200         nf_queue_entry_get_refs(entry);
201         skb_dst_force(skb);
202
203         switch (entry->state.pf) {
204         case AF_INET:
205                 nf_ip_saveroute(skb, entry);
206                 break;
207         case AF_INET6:
208                 nf_ip6_saveroute(skb, entry);
209                 break;
210         }
211
212         status = qh->outfn(entry, queuenum);
213
214         if (status < 0) {
215                 nf_queue_entry_release_refs(entry);
216                 goto err;
217         }
218
219         return 0;
220
221 err:
222         kfree(entry);
223         return status;
224 }
225
226 /* Packets leaving via this function must come back through nf_reinject(). */
227 int nf_queue(struct sk_buff *skb, struct nf_hook_state *state,
228              const struct nf_hook_entries *entries, unsigned int index,
229              unsigned int verdict)
230 {
231         int ret;
232
233         ret = __nf_queue(skb, state, entries, index, verdict >> NF_VERDICT_QBITS);
234         if (ret < 0) {
235                 if (ret == -ESRCH &&
236                     (verdict & NF_VERDICT_FLAG_QUEUE_BYPASS))
237                         return 1;
238                 kfree_skb(skb);
239         }
240
241         return 0;
242 }
243
244 static unsigned int nf_iterate(struct sk_buff *skb,
245                                struct nf_hook_state *state,
246                                const struct nf_hook_entries *hooks,
247                                unsigned int *index)
248 {
249         const struct nf_hook_entry *hook;
250         unsigned int verdict, i = *index;
251
252         while (i < hooks->num_hook_entries) {
253                 hook = &hooks->hooks[i];
254 repeat:
255                 verdict = nf_hook_entry_hookfn(hook, skb, state);
256                 if (verdict != NF_ACCEPT) {
257                         if (verdict != NF_REPEAT)
258                                 return verdict;
259                         goto repeat;
260                 }
261                 i++;
262         }
263
264         *index = i;
265         return NF_ACCEPT;
266 }
267
268 static struct nf_hook_entries *nf_hook_entries_head(const struct net *net, u8 pf, u8 hooknum)
269 {
270         switch (pf) {
271 #ifdef CONFIG_NETFILTER_FAMILY_BRIDGE
272         case NFPROTO_BRIDGE:
273                 return rcu_dereference(net->nf.hooks_bridge[hooknum]);
274 #endif
275         case NFPROTO_IPV4:
276                 return rcu_dereference(net->nf.hooks_ipv4[hooknum]);
277         case NFPROTO_IPV6:
278                 return rcu_dereference(net->nf.hooks_ipv6[hooknum]);
279         default:
280                 WARN_ON_ONCE(1);
281                 return NULL;
282         }
283
284         return NULL;
285 }
286
287 /* Caller must hold rcu read-side lock */
288 void nf_reinject(struct nf_queue_entry *entry, unsigned int verdict)
289 {
290         const struct nf_hook_entry *hook_entry;
291         const struct nf_hook_entries *hooks;
292         struct sk_buff *skb = entry->skb;
293         const struct net *net;
294         unsigned int i;
295         int err;
296         u8 pf;
297
298         net = entry->state.net;
299         pf = entry->state.pf;
300
301         hooks = nf_hook_entries_head(net, pf, entry->state.hook);
302
303         nf_queue_entry_release_refs(entry);
304
305         i = entry->hook_index;
306         if (WARN_ON_ONCE(!hooks || i >= hooks->num_hook_entries)) {
307                 kfree_skb(skb);
308                 kfree(entry);
309                 return;
310         }
311
312         hook_entry = &hooks->hooks[i];
313
314         /* Continue traversal iff userspace said ok... */
315         if (verdict == NF_REPEAT)
316                 verdict = nf_hook_entry_hookfn(hook_entry, skb, &entry->state);
317
318         if (verdict == NF_ACCEPT) {
319                 if (nf_reroute(skb, entry) < 0)
320                         verdict = NF_DROP;
321         }
322
323         if (verdict == NF_ACCEPT) {
324 next_hook:
325                 ++i;
326                 verdict = nf_iterate(skb, &entry->state, hooks, &i);
327         }
328
329         switch (verdict & NF_VERDICT_MASK) {
330         case NF_ACCEPT:
331         case NF_STOP:
332                 local_bh_disable();
333                 entry->state.okfn(entry->state.net, entry->state.sk, skb);
334                 local_bh_enable();
335                 break;
336         case NF_QUEUE:
337                 err = nf_queue(skb, &entry->state, hooks, i, verdict);
338                 if (err == 1)
339                         goto next_hook;
340                 break;
341         case NF_STOLEN:
342                 break;
343         default:
344                 kfree_skb(skb);
345         }
346
347         kfree(entry);
348 }
349 EXPORT_SYMBOL(nf_reinject);