[IPCOMP]: Fetch nexthdr before ipch is destroyed
[powerpc.git] / net / ipv6 / netfilter / nf_conntrack_l3proto_ipv6.c
1 /*
2  * Copyright (C)2004 USAGI/WIDE Project
3  *
4  * This program is free software; you can redistribute it and/or modify
5  * it under the terms of the GNU General Public License version 2 as
6  * published by the Free Software Foundation.
7  *
8  * Author:
9  *      Yasuyuki Kozakai @USAGI <yasuyuki.kozakai@toshiba.co.jp>
10  */
11
12 #include <linux/types.h>
13 #include <linux/ipv6.h>
14 #include <linux/in6.h>
15 #include <linux/netfilter.h>
16 #include <linux/module.h>
17 #include <linux/skbuff.h>
18 #include <linux/icmp.h>
19 #include <linux/sysctl.h>
20 #include <net/ipv6.h>
21 #include <net/inet_frag.h>
22
23 #include <linux/netfilter_ipv6.h>
24 #include <net/netfilter/nf_conntrack.h>
25 #include <net/netfilter/nf_conntrack_helper.h>
26 #include <net/netfilter/nf_conntrack_l4proto.h>
27 #include <net/netfilter/nf_conntrack_l3proto.h>
28 #include <net/netfilter/nf_conntrack_core.h>
29
30 static int ipv6_pkt_to_tuple(const struct sk_buff *skb, unsigned int nhoff,
31                              struct nf_conntrack_tuple *tuple)
32 {
33         u_int32_t _addrs[8], *ap;
34
35         ap = skb_header_pointer(skb, nhoff + offsetof(struct ipv6hdr, saddr),
36                                 sizeof(_addrs), _addrs);
37         if (ap == NULL)
38                 return 0;
39
40         memcpy(tuple->src.u3.ip6, ap, sizeof(tuple->src.u3.ip6));
41         memcpy(tuple->dst.u3.ip6, ap + 4, sizeof(tuple->dst.u3.ip6));
42
43         return 1;
44 }
45
46 static int ipv6_invert_tuple(struct nf_conntrack_tuple *tuple,
47                              const struct nf_conntrack_tuple *orig)
48 {
49         memcpy(tuple->src.u3.ip6, orig->dst.u3.ip6, sizeof(tuple->src.u3.ip6));
50         memcpy(tuple->dst.u3.ip6, orig->src.u3.ip6, sizeof(tuple->dst.u3.ip6));
51
52         return 1;
53 }
54
55 static int ipv6_print_tuple(struct seq_file *s,
56                             const struct nf_conntrack_tuple *tuple)
57 {
58         return seq_printf(s, "src=" NIP6_FMT " dst=" NIP6_FMT " ",
59                           NIP6(*((struct in6_addr *)tuple->src.u3.ip6)),
60                           NIP6(*((struct in6_addr *)tuple->dst.u3.ip6)));
61 }
62
63 /*
64  * Based on ipv6_skip_exthdr() in net/ipv6/exthdr.c
65  *
66  * This function parses (probably truncated) exthdr set "hdr"
67  * of length "len". "nexthdrp" initially points to some place,
68  * where type of the first header can be found.
69  *
70  * It skips all well-known exthdrs, and returns pointer to the start
71  * of unparsable area i.e. the first header with unknown type.
72  * if success, *nexthdr is updated by type/protocol of this header.
73  *
74  * NOTES: - it may return pointer pointing beyond end of packet,
75  *          if the last recognized header is truncated in the middle.
76  *        - if packet is truncated, so that all parsed headers are skipped,
77  *          it returns -1.
78  *        - if packet is fragmented, return pointer of the fragment header.
79  *        - ESP is unparsable for now and considered like
80  *          normal payload protocol.
81  *        - Note also special handling of AUTH header. Thanks to IPsec wizards.
82  */
83
84 static int nf_ct_ipv6_skip_exthdr(const struct sk_buff *skb, int start,
85                                   u8 *nexthdrp, int len)
86 {
87         u8 nexthdr = *nexthdrp;
88
89         while (ipv6_ext_hdr(nexthdr)) {
90                 struct ipv6_opt_hdr hdr;
91                 int hdrlen;
92
93                 if (len < (int)sizeof(struct ipv6_opt_hdr))
94                         return -1;
95                 if (nexthdr == NEXTHDR_NONE)
96                         break;
97                 if (nexthdr == NEXTHDR_FRAGMENT)
98                         break;
99                 if (skb_copy_bits(skb, start, &hdr, sizeof(hdr)))
100                         BUG();
101                 if (nexthdr == NEXTHDR_AUTH)
102                         hdrlen = (hdr.hdrlen+2)<<2;
103                 else
104                         hdrlen = ipv6_optlen(&hdr);
105
106                 nexthdr = hdr.nexthdr;
107                 len -= hdrlen;
108                 start += hdrlen;
109         }
110
111         *nexthdrp = nexthdr;
112         return start;
113 }
114
115 static int ipv6_get_l4proto(const struct sk_buff *skb, unsigned int nhoff,
116                             unsigned int *dataoff, u_int8_t *protonum)
117 {
118         unsigned int extoff = nhoff + sizeof(struct ipv6hdr);
119         unsigned char pnum;
120         int protoff;
121
122         if (skb_copy_bits(skb, nhoff + offsetof(struct ipv6hdr, nexthdr),
123                           &pnum, sizeof(pnum)) != 0) {
124                 pr_debug("ip6_conntrack_core: can't get nexthdr\n");
125                 return -NF_ACCEPT;
126         }
127         protoff = nf_ct_ipv6_skip_exthdr(skb, extoff, &pnum, skb->len - extoff);
128         /*
129          * (protoff == skb->len) mean that the packet doesn't have no data
130          * except of IPv6 & ext headers. but it's tracked anyway. - YK
131          */
132         if ((protoff < 0) || (protoff > skb->len)) {
133                 pr_debug("ip6_conntrack_core: can't find proto in pkt\n");
134                 return -NF_ACCEPT;
135         }
136
137         *dataoff = protoff;
138         *protonum = pnum;
139         return NF_ACCEPT;
140 }
141
142 static unsigned int ipv6_confirm(unsigned int hooknum,
143                                  struct sk_buff *skb,
144                                  const struct net_device *in,
145                                  const struct net_device *out,
146                                  int (*okfn)(struct sk_buff *))
147 {
148         struct nf_conn *ct;
149         struct nf_conn_help *help;
150         struct nf_conntrack_helper *helper;
151         enum ip_conntrack_info ctinfo;
152         unsigned int ret, protoff;
153         unsigned int extoff = (u8 *)(ipv6_hdr(skb) + 1) - skb->data;
154         unsigned char pnum = ipv6_hdr(skb)->nexthdr;
155
156
157         /* This is where we call the helper: as the packet goes out. */
158         ct = nf_ct_get(skb, &ctinfo);
159         if (!ct || ctinfo == IP_CT_RELATED + IP_CT_IS_REPLY)
160                 goto out;
161
162         help = nfct_help(ct);
163         if (!help)
164                 goto out;
165         /* rcu_read_lock()ed by nf_hook_slow */
166         helper = rcu_dereference(help->helper);
167         if (!helper)
168                 goto out;
169
170         protoff = nf_ct_ipv6_skip_exthdr(skb, extoff, &pnum,
171                                          skb->len - extoff);
172         if (protoff > skb->len || pnum == NEXTHDR_FRAGMENT) {
173                 pr_debug("proto header not found\n");
174                 return NF_ACCEPT;
175         }
176
177         ret = helper->help(skb, protoff, ct, ctinfo);
178         if (ret != NF_ACCEPT)
179                 return ret;
180 out:
181         /* We've seen it coming out the other side: confirm it */
182         return nf_conntrack_confirm(skb);
183 }
184
185 static unsigned int ipv6_defrag(unsigned int hooknum,
186                                 struct sk_buff *skb,
187                                 const struct net_device *in,
188                                 const struct net_device *out,
189                                 int (*okfn)(struct sk_buff *))
190 {
191         struct sk_buff *reasm;
192
193         /* Previously seen (loopback)?  */
194         if (skb->nfct)
195                 return NF_ACCEPT;
196
197         reasm = nf_ct_frag6_gather(skb);
198
199         /* queued */
200         if (reasm == NULL)
201                 return NF_STOLEN;
202
203         /* error occured or not fragmented */
204         if (reasm == skb)
205                 return NF_ACCEPT;
206
207         nf_ct_frag6_output(hooknum, reasm, (struct net_device *)in,
208                            (struct net_device *)out, okfn);
209
210         return NF_STOLEN;
211 }
212
213 static unsigned int ipv6_conntrack_in(unsigned int hooknum,
214                                       struct sk_buff *skb,
215                                       const struct net_device *in,
216                                       const struct net_device *out,
217                                       int (*okfn)(struct sk_buff *))
218 {
219         struct sk_buff *reasm = skb->nfct_reasm;
220
221         /* This packet is fragmented and has reassembled packet. */
222         if (reasm) {
223                 /* Reassembled packet isn't parsed yet ? */
224                 if (!reasm->nfct) {
225                         unsigned int ret;
226
227                         ret = nf_conntrack_in(PF_INET6, hooknum, reasm);
228                         if (ret != NF_ACCEPT)
229                                 return ret;
230                 }
231                 nf_conntrack_get(reasm->nfct);
232                 skb->nfct = reasm->nfct;
233                 skb->nfctinfo = reasm->nfctinfo;
234                 return NF_ACCEPT;
235         }
236
237         return nf_conntrack_in(PF_INET6, hooknum, skb);
238 }
239
240 static unsigned int ipv6_conntrack_local(unsigned int hooknum,
241                                          struct sk_buff *skb,
242                                          const struct net_device *in,
243                                          const struct net_device *out,
244                                          int (*okfn)(struct sk_buff *))
245 {
246         /* root is playing with raw sockets. */
247         if (skb->len < sizeof(struct ipv6hdr)) {
248                 if (net_ratelimit())
249                         printk("ipv6_conntrack_local: packet too short\n");
250                 return NF_ACCEPT;
251         }
252         return ipv6_conntrack_in(hooknum, skb, in, out, okfn);
253 }
254
255 static struct nf_hook_ops ipv6_conntrack_ops[] __read_mostly = {
256         {
257                 .hook           = ipv6_defrag,
258                 .owner          = THIS_MODULE,
259                 .pf             = PF_INET6,
260                 .hooknum        = NF_INET_PRE_ROUTING,
261                 .priority       = NF_IP6_PRI_CONNTRACK_DEFRAG,
262         },
263         {
264                 .hook           = ipv6_conntrack_in,
265                 .owner          = THIS_MODULE,
266                 .pf             = PF_INET6,
267                 .hooknum        = NF_INET_PRE_ROUTING,
268                 .priority       = NF_IP6_PRI_CONNTRACK,
269         },
270         {
271                 .hook           = ipv6_conntrack_local,
272                 .owner          = THIS_MODULE,
273                 .pf             = PF_INET6,
274                 .hooknum        = NF_INET_LOCAL_OUT,
275                 .priority       = NF_IP6_PRI_CONNTRACK,
276         },
277         {
278                 .hook           = ipv6_defrag,
279                 .owner          = THIS_MODULE,
280                 .pf             = PF_INET6,
281                 .hooknum        = NF_INET_LOCAL_OUT,
282                 .priority       = NF_IP6_PRI_CONNTRACK_DEFRAG,
283         },
284         {
285                 .hook           = ipv6_confirm,
286                 .owner          = THIS_MODULE,
287                 .pf             = PF_INET6,
288                 .hooknum        = NF_INET_POST_ROUTING,
289                 .priority       = NF_IP6_PRI_LAST,
290         },
291         {
292                 .hook           = ipv6_confirm,
293                 .owner          = THIS_MODULE,
294                 .pf             = PF_INET6,
295                 .hooknum        = NF_INET_LOCAL_IN,
296                 .priority       = NF_IP6_PRI_LAST-1,
297         },
298 };
299
300 #if defined(CONFIG_NF_CT_NETLINK) || defined(CONFIG_NF_CT_NETLINK_MODULE)
301
302 #include <linux/netfilter/nfnetlink.h>
303 #include <linux/netfilter/nfnetlink_conntrack.h>
304
305 static int ipv6_tuple_to_nlattr(struct sk_buff *skb,
306                                 const struct nf_conntrack_tuple *tuple)
307 {
308         NLA_PUT(skb, CTA_IP_V6_SRC, sizeof(u_int32_t) * 4,
309                 &tuple->src.u3.ip6);
310         NLA_PUT(skb, CTA_IP_V6_DST, sizeof(u_int32_t) * 4,
311                 &tuple->dst.u3.ip6);
312         return 0;
313
314 nla_put_failure:
315         return -1;
316 }
317
318 static const struct nla_policy ipv6_nla_policy[CTA_IP_MAX+1] = {
319         [CTA_IP_V6_SRC] = { .len = sizeof(u_int32_t)*4 },
320         [CTA_IP_V6_DST] = { .len = sizeof(u_int32_t)*4 },
321 };
322
323 static int ipv6_nlattr_to_tuple(struct nlattr *tb[],
324                                 struct nf_conntrack_tuple *t)
325 {
326         if (!tb[CTA_IP_V6_SRC] || !tb[CTA_IP_V6_DST])
327                 return -EINVAL;
328
329         memcpy(&t->src.u3.ip6, nla_data(tb[CTA_IP_V6_SRC]),
330                sizeof(u_int32_t) * 4);
331         memcpy(&t->dst.u3.ip6, nla_data(tb[CTA_IP_V6_DST]),
332                sizeof(u_int32_t) * 4);
333
334         return 0;
335 }
336 #endif
337
338 struct nf_conntrack_l3proto nf_conntrack_l3proto_ipv6 __read_mostly = {
339         .l3proto                = PF_INET6,
340         .name                   = "ipv6",
341         .pkt_to_tuple           = ipv6_pkt_to_tuple,
342         .invert_tuple           = ipv6_invert_tuple,
343         .print_tuple            = ipv6_print_tuple,
344         .get_l4proto            = ipv6_get_l4proto,
345 #if defined(CONFIG_NF_CT_NETLINK) || defined(CONFIG_NF_CT_NETLINK_MODULE)
346         .tuple_to_nlattr        = ipv6_tuple_to_nlattr,
347         .nlattr_to_tuple        = ipv6_nlattr_to_tuple,
348         .nla_policy             = ipv6_nla_policy,
349 #endif
350 #ifdef CONFIG_SYSCTL
351         .ctl_table_path         = nf_net_netfilter_sysctl_path,
352         .ctl_table              = nf_ct_ipv6_sysctl_table,
353 #endif
354         .me                     = THIS_MODULE,
355 };
356
357 MODULE_ALIAS("nf_conntrack-" __stringify(AF_INET6));
358 MODULE_LICENSE("GPL");
359 MODULE_AUTHOR("Yasuyuki KOZAKAI @USAGI <yasuyuki.kozakai@toshiba.co.jp>");
360
361 static int __init nf_conntrack_l3proto_ipv6_init(void)
362 {
363         int ret = 0;
364
365         need_conntrack();
366
367         ret = nf_ct_frag6_init();
368         if (ret < 0) {
369                 printk("nf_conntrack_ipv6: can't initialize frag6.\n");
370                 return ret;
371         }
372         ret = nf_conntrack_l4proto_register(&nf_conntrack_l4proto_tcp6);
373         if (ret < 0) {
374                 printk("nf_conntrack_ipv6: can't register tcp.\n");
375                 goto cleanup_frag6;
376         }
377
378         ret = nf_conntrack_l4proto_register(&nf_conntrack_l4proto_udp6);
379         if (ret < 0) {
380                 printk("nf_conntrack_ipv6: can't register udp.\n");
381                 goto cleanup_tcp;
382         }
383
384         ret = nf_conntrack_l4proto_register(&nf_conntrack_l4proto_icmpv6);
385         if (ret < 0) {
386                 printk("nf_conntrack_ipv6: can't register icmpv6.\n");
387                 goto cleanup_udp;
388         }
389
390         ret = nf_conntrack_l3proto_register(&nf_conntrack_l3proto_ipv6);
391         if (ret < 0) {
392                 printk("nf_conntrack_ipv6: can't register ipv6\n");
393                 goto cleanup_icmpv6;
394         }
395
396         ret = nf_register_hooks(ipv6_conntrack_ops,
397                                 ARRAY_SIZE(ipv6_conntrack_ops));
398         if (ret < 0) {
399                 printk("nf_conntrack_ipv6: can't register pre-routing defrag "
400                        "hook.\n");
401                 goto cleanup_ipv6;
402         }
403         return ret;
404
405  cleanup_ipv6:
406         nf_conntrack_l3proto_unregister(&nf_conntrack_l3proto_ipv6);
407  cleanup_icmpv6:
408         nf_conntrack_l4proto_unregister(&nf_conntrack_l4proto_icmpv6);
409  cleanup_udp:
410         nf_conntrack_l4proto_unregister(&nf_conntrack_l4proto_udp6);
411  cleanup_tcp:
412         nf_conntrack_l4proto_unregister(&nf_conntrack_l4proto_tcp6);
413  cleanup_frag6:
414         nf_ct_frag6_cleanup();
415         return ret;
416 }
417
418 static void __exit nf_conntrack_l3proto_ipv6_fini(void)
419 {
420         synchronize_net();
421         nf_unregister_hooks(ipv6_conntrack_ops, ARRAY_SIZE(ipv6_conntrack_ops));
422         nf_conntrack_l3proto_unregister(&nf_conntrack_l3proto_ipv6);
423         nf_conntrack_l4proto_unregister(&nf_conntrack_l4proto_icmpv6);
424         nf_conntrack_l4proto_unregister(&nf_conntrack_l4proto_udp6);
425         nf_conntrack_l4proto_unregister(&nf_conntrack_l4proto_tcp6);
426         nf_ct_frag6_cleanup();
427 }
428
429 module_init(nf_conntrack_l3proto_ipv6_init);
430 module_exit(nf_conntrack_l3proto_ipv6_fini);