1 /*
2 * Copyright (c) 2011 Patrick McHardy <kaber@trash.net>
3 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License version 2 as
6 * published by the Free Software Foundation.
7 *
8 * Based on Rusty Russell's IPv4 NAT code. Development of IPv6 NAT
9 * funded by Astaro.
10 */
11
12 #include <linux/module.h>
13 #include <linux/netfilter.h>
14 #include <linux/netfilter_ipv6.h>
15 #include <linux/netfilter_ipv6/ip6_tables.h>
16 #include <linux/ipv6.h>
17 #include <net/ipv6.h>
18
19 #include <net/netfilter/nf_nat.h>
20 #include <net/netfilter/nf_nat_core.h>
21 #include <net/netfilter/nf_nat_l3proto.h>
22
23 static const struct xt_table nf_nat_ipv6_table = {
24 .name = "nat",
25 .valid_hooks = (1 << NF_INET_PRE_ROUTING) |
26 (1 << NF_INET_POST_ROUTING) |
27 (1 << NF_INET_LOCAL_OUT) |
28 (1 << NF_INET_LOCAL_IN),
29 .me = THIS_MODULE,
30 .af = NFPROTO_IPV6,
31 };
32
alloc_null_binding(struct nf_conn * ct,unsigned int hooknum)33 static unsigned int alloc_null_binding(struct nf_conn *ct, unsigned int hooknum)
34 {
35 /* Force range to this IP; let proto decide mapping for
36 * per-proto parts (hence not IP_NAT_RANGE_PROTO_SPECIFIED).
37 */
38 struct nf_nat_range range;
39
40 range.flags = 0;
41 pr_debug("Allocating NULL binding for %p (%pI6)\n", ct,
42 HOOK2MANIP(hooknum) == NF_NAT_MANIP_SRC ?
43 &ct->tuplehash[IP_CT_DIR_REPLY].tuple.dst.u3.ip6 :
44 &ct->tuplehash[IP_CT_DIR_REPLY].tuple.src.u3.ip6);
45
46 return nf_nat_setup_info(ct, &range, HOOK2MANIP(hooknum));
47 }
48
nf_nat_rule_find(struct sk_buff * skb,unsigned int hooknum,const struct net_device * in,const struct net_device * out,struct nf_conn * ct)49 static unsigned int nf_nat_rule_find(struct sk_buff *skb, unsigned int hooknum,
50 const struct net_device *in,
51 const struct net_device *out,
52 struct nf_conn *ct)
53 {
54 struct net *net = nf_ct_net(ct);
55 unsigned int ret;
56
57 ret = ip6t_do_table(skb, hooknum, in, out, net->ipv6.ip6table_nat);
58 if (ret == NF_ACCEPT) {
59 if (!nf_nat_initialized(ct, HOOK2MANIP(hooknum)))
60 ret = alloc_null_binding(ct, hooknum);
61 }
62 return ret;
63 }
64
65 static unsigned int
nf_nat_ipv6_fn(unsigned int hooknum,struct sk_buff * skb,const struct net_device * in,const struct net_device * out,int (* okfn)(struct sk_buff *))66 nf_nat_ipv6_fn(unsigned int hooknum,
67 struct sk_buff *skb,
68 const struct net_device *in,
69 const struct net_device *out,
70 int (*okfn)(struct sk_buff *))
71 {
72 struct nf_conn *ct;
73 enum ip_conntrack_info ctinfo;
74 struct nf_conn_nat *nat;
75 enum nf_nat_manip_type maniptype = HOOK2MANIP(hooknum);
76 __be16 frag_off;
77 int hdrlen;
78 u8 nexthdr;
79
80 ct = nf_ct_get(skb, &ctinfo);
81 /* Can't track? It's not due to stress, or conntrack would
82 * have dropped it. Hence it's the user's responsibilty to
83 * packet filter it out, or implement conntrack/NAT for that
84 * protocol. 8) --RR
85 */
86 if (!ct)
87 return NF_ACCEPT;
88
89 /* Don't try to NAT if this packet is not conntracked */
90 if (nf_ct_is_untracked(ct))
91 return NF_ACCEPT;
92
93 nat = nfct_nat(ct);
94 if (!nat) {
95 /* NAT module was loaded late. */
96 if (nf_ct_is_confirmed(ct))
97 return NF_ACCEPT;
98 nat = nf_ct_ext_add(ct, NF_CT_EXT_NAT, GFP_ATOMIC);
99 if (nat == NULL) {
100 pr_debug("failed to add NAT extension\n");
101 return NF_ACCEPT;
102 }
103 }
104
105 switch (ctinfo) {
106 case IP_CT_RELATED:
107 case IP_CT_RELATED_REPLY:
108 nexthdr = ipv6_hdr(skb)->nexthdr;
109 hdrlen = ipv6_skip_exthdr(skb, sizeof(struct ipv6hdr),
110 &nexthdr, &frag_off);
111
112 if (hdrlen >= 0 && nexthdr == IPPROTO_ICMPV6) {
113 if (!nf_nat_icmpv6_reply_translation(skb, ct, ctinfo,
114 hooknum, hdrlen))
115 return NF_DROP;
116 else
117 return NF_ACCEPT;
118 }
119 /* Fall thru... (Only ICMPs can be IP_CT_IS_REPLY) */
120 case IP_CT_NEW:
121 /* Seen it before? This can happen for loopback, retrans,
122 * or local packets.
123 */
124 if (!nf_nat_initialized(ct, maniptype)) {
125 unsigned int ret;
126
127 ret = nf_nat_rule_find(skb, hooknum, in, out, ct);
128 if (ret != NF_ACCEPT)
129 return ret;
130 } else {
131 pr_debug("Already setup manip %s for ct %p\n",
132 maniptype == NF_NAT_MANIP_SRC ? "SRC" : "DST",
133 ct);
134 if (nf_nat_oif_changed(hooknum, ctinfo, nat, out))
135 goto oif_changed;
136 }
137 break;
138
139 default:
140 /* ESTABLISHED */
141 NF_CT_ASSERT(ctinfo == IP_CT_ESTABLISHED ||
142 ctinfo == IP_CT_ESTABLISHED_REPLY);
143 if (nf_nat_oif_changed(hooknum, ctinfo, nat, out))
144 goto oif_changed;
145 }
146
147 return nf_nat_packet(ct, ctinfo, hooknum, skb);
148
149 oif_changed:
150 nf_ct_kill_acct(ct, ctinfo, skb);
151 return NF_DROP;
152 }
153
154 static unsigned int
nf_nat_ipv6_in(unsigned int hooknum,struct sk_buff * skb,const struct net_device * in,const struct net_device * out,int (* okfn)(struct sk_buff *))155 nf_nat_ipv6_in(unsigned int hooknum,
156 struct sk_buff *skb,
157 const struct net_device *in,
158 const struct net_device *out,
159 int (*okfn)(struct sk_buff *))
160 {
161 unsigned int ret;
162 struct in6_addr daddr = ipv6_hdr(skb)->daddr;
163
164 ret = nf_nat_ipv6_fn(hooknum, skb, in, out, okfn);
165 if (ret != NF_DROP && ret != NF_STOLEN &&
166 ipv6_addr_cmp(&daddr, &ipv6_hdr(skb)->daddr))
167 skb_dst_drop(skb);
168
169 return ret;
170 }
171
172 static unsigned int
nf_nat_ipv6_out(unsigned int hooknum,struct sk_buff * skb,const struct net_device * in,const struct net_device * out,int (* okfn)(struct sk_buff *))173 nf_nat_ipv6_out(unsigned int hooknum,
174 struct sk_buff *skb,
175 const struct net_device *in,
176 const struct net_device *out,
177 int (*okfn)(struct sk_buff *))
178 {
179 #ifdef CONFIG_XFRM
180 const struct nf_conn *ct;
181 enum ip_conntrack_info ctinfo;
182 int err;
183 #endif
184 unsigned int ret;
185
186 /* root is playing with raw sockets. */
187 if (skb->len < sizeof(struct ipv6hdr))
188 return NF_ACCEPT;
189
190 ret = nf_nat_ipv6_fn(hooknum, skb, in, out, okfn);
191 #ifdef CONFIG_XFRM
192 if (ret != NF_DROP && ret != NF_STOLEN &&
193 !(IP6CB(skb)->flags & IP6SKB_XFRM_TRANSFORMED) &&
194 (ct = nf_ct_get(skb, &ctinfo)) != NULL) {
195 enum ip_conntrack_dir dir = CTINFO2DIR(ctinfo);
196
197 if (!nf_inet_addr_cmp(&ct->tuplehash[dir].tuple.src.u3,
198 &ct->tuplehash[!dir].tuple.dst.u3) ||
199 (ct->tuplehash[dir].tuple.dst.protonum != IPPROTO_ICMPV6 &&
200 ct->tuplehash[dir].tuple.src.u.all !=
201 ct->tuplehash[!dir].tuple.dst.u.all)) {
202 err = nf_xfrm_me_harder(skb, AF_INET6);
203 if (err < 0)
204 ret = NF_DROP_ERR(err);
205 }
206 }
207 #endif
208 return ret;
209 }
210
211 static unsigned int
nf_nat_ipv6_local_fn(unsigned int hooknum,struct sk_buff * skb,const struct net_device * in,const struct net_device * out,int (* okfn)(struct sk_buff *))212 nf_nat_ipv6_local_fn(unsigned int hooknum,
213 struct sk_buff *skb,
214 const struct net_device *in,
215 const struct net_device *out,
216 int (*okfn)(struct sk_buff *))
217 {
218 const struct nf_conn *ct;
219 enum ip_conntrack_info ctinfo;
220 unsigned int ret;
221 int err;
222
223 /* root is playing with raw sockets. */
224 if (skb->len < sizeof(struct ipv6hdr))
225 return NF_ACCEPT;
226
227 ret = nf_nat_ipv6_fn(hooknum, skb, in, out, okfn);
228 if (ret != NF_DROP && ret != NF_STOLEN &&
229 (ct = nf_ct_get(skb, &ctinfo)) != NULL) {
230 enum ip_conntrack_dir dir = CTINFO2DIR(ctinfo);
231
232 if (!nf_inet_addr_cmp(&ct->tuplehash[dir].tuple.dst.u3,
233 &ct->tuplehash[!dir].tuple.src.u3)) {
234 err = ip6_route_me_harder(skb);
235 if (err < 0)
236 ret = NF_DROP_ERR(err);
237 }
238 #ifdef CONFIG_XFRM
239 else if (!(IP6CB(skb)->flags & IP6SKB_XFRM_TRANSFORMED) &&
240 ct->tuplehash[dir].tuple.dst.protonum != IPPROTO_ICMPV6 &&
241 ct->tuplehash[dir].tuple.dst.u.all !=
242 ct->tuplehash[!dir].tuple.src.u.all) {
243 err = nf_xfrm_me_harder(skb, AF_INET6);
244 if (err < 0)
245 ret = NF_DROP_ERR(err);
246 }
247 #endif
248 }
249 return ret;
250 }
251
252 static struct nf_hook_ops nf_nat_ipv6_ops[] __read_mostly = {
253 /* Before packet filtering, change destination */
254 {
255 .hook = nf_nat_ipv6_in,
256 .owner = THIS_MODULE,
257 .pf = NFPROTO_IPV6,
258 .hooknum = NF_INET_PRE_ROUTING,
259 .priority = NF_IP6_PRI_NAT_DST,
260 },
261 /* After packet filtering, change source */
262 {
263 .hook = nf_nat_ipv6_out,
264 .owner = THIS_MODULE,
265 .pf = NFPROTO_IPV6,
266 .hooknum = NF_INET_POST_ROUTING,
267 .priority = NF_IP6_PRI_NAT_SRC,
268 },
269 /* Before packet filtering, change destination */
270 {
271 .hook = nf_nat_ipv6_local_fn,
272 .owner = THIS_MODULE,
273 .pf = NFPROTO_IPV6,
274 .hooknum = NF_INET_LOCAL_OUT,
275 .priority = NF_IP6_PRI_NAT_DST,
276 },
277 /* After packet filtering, change source */
278 {
279 .hook = nf_nat_ipv6_fn,
280 .owner = THIS_MODULE,
281 .pf = NFPROTO_IPV6,
282 .hooknum = NF_INET_LOCAL_IN,
283 .priority = NF_IP6_PRI_NAT_SRC,
284 },
285 };
286
ip6table_nat_net_init(struct net * net)287 static int __net_init ip6table_nat_net_init(struct net *net)
288 {
289 struct ip6t_replace *repl;
290
291 repl = ip6t_alloc_initial_table(&nf_nat_ipv6_table);
292 if (repl == NULL)
293 return -ENOMEM;
294 net->ipv6.ip6table_nat = ip6t_register_table(net, &nf_nat_ipv6_table, repl);
295 kfree(repl);
296 return PTR_RET(net->ipv6.ip6table_nat);
297 }
298
ip6table_nat_net_exit(struct net * net)299 static void __net_exit ip6table_nat_net_exit(struct net *net)
300 {
301 ip6t_unregister_table(net, net->ipv6.ip6table_nat);
302 }
303
304 static struct pernet_operations ip6table_nat_net_ops = {
305 .init = ip6table_nat_net_init,
306 .exit = ip6table_nat_net_exit,
307 };
308
ip6table_nat_init(void)309 static int __init ip6table_nat_init(void)
310 {
311 int err;
312
313 err = register_pernet_subsys(&ip6table_nat_net_ops);
314 if (err < 0)
315 goto err1;
316
317 err = nf_register_hooks(nf_nat_ipv6_ops, ARRAY_SIZE(nf_nat_ipv6_ops));
318 if (err < 0)
319 goto err2;
320 return 0;
321
322 err2:
323 unregister_pernet_subsys(&ip6table_nat_net_ops);
324 err1:
325 return err;
326 }
327
ip6table_nat_exit(void)328 static void __exit ip6table_nat_exit(void)
329 {
330 nf_unregister_hooks(nf_nat_ipv6_ops, ARRAY_SIZE(nf_nat_ipv6_ops));
331 unregister_pernet_subsys(&ip6table_nat_net_ops);
332 }
333
334 module_init(ip6table_nat_init);
335 module_exit(ip6table_nat_exit);
336
337 MODULE_LICENSE("GPL");
338