x86/smpboot: Init apic mapping before usage
[cascardo/linux.git] / net / netfilter / nf_synproxy_core.c
1 /*
2  * Copyright (c) 2013 Patrick McHardy <kaber@trash.net>
3  *
4  * This program is free software; you can redistribute it and/or modify
5  * it under the terms of the GNU General Public License version 2 as
6  * published by the Free Software Foundation.
7  */
8
9 #include <linux/module.h>
10 #include <linux/skbuff.h>
11 #include <asm/unaligned.h>
12 #include <net/tcp.h>
13 #include <net/netns/generic.h>
14 #include <linux/proc_fs.h>
15
16 #include <linux/netfilter_ipv4/ip_tables.h>
17 #include <linux/netfilter/x_tables.h>
18 #include <linux/netfilter/xt_tcpudp.h>
19 #include <linux/netfilter/xt_SYNPROXY.h>
20
21 #include <net/netfilter/nf_conntrack.h>
22 #include <net/netfilter/nf_conntrack_extend.h>
23 #include <net/netfilter/nf_conntrack_seqadj.h>
24 #include <net/netfilter/nf_conntrack_synproxy.h>
25 #include <net/netfilter/nf_conntrack_zones.h>
26
/*
 * Per-network-namespace id for synproxy state; handed to the pernet
 * subsystem through synproxy_net_ops.id and exported for other modules.
 */
int synproxy_net_id;
EXPORT_SYMBOL_GPL(synproxy_net_id);
29
30 bool
31 synproxy_parse_options(const struct sk_buff *skb, unsigned int doff,
32                        const struct tcphdr *th, struct synproxy_options *opts)
33 {
34         int length = (th->doff * 4) - sizeof(*th);
35         u8 buf[40], *ptr;
36
37         ptr = skb_header_pointer(skb, doff + sizeof(*th), length, buf);
38         if (ptr == NULL)
39                 return false;
40
41         opts->options = 0;
42         while (length > 0) {
43                 int opcode = *ptr++;
44                 int opsize;
45
46                 switch (opcode) {
47                 case TCPOPT_EOL:
48                         return true;
49                 case TCPOPT_NOP:
50                         length--;
51                         continue;
52                 default:
53                         opsize = *ptr++;
54                         if (opsize < 2)
55                                 return true;
56                         if (opsize > length)
57                                 return true;
58
59                         switch (opcode) {
60                         case TCPOPT_MSS:
61                                 if (opsize == TCPOLEN_MSS) {
62                                         opts->mss = get_unaligned_be16(ptr);
63                                         opts->options |= XT_SYNPROXY_OPT_MSS;
64                                 }
65                                 break;
66                         case TCPOPT_WINDOW:
67                                 if (opsize == TCPOLEN_WINDOW) {
68                                         opts->wscale = *ptr;
69                                         if (opts->wscale > 14)
70                                                 opts->wscale = 14;
71                                         opts->options |= XT_SYNPROXY_OPT_WSCALE;
72                                 }
73                                 break;
74                         case TCPOPT_TIMESTAMP:
75                                 if (opsize == TCPOLEN_TIMESTAMP) {
76                                         opts->tsval = get_unaligned_be32(ptr);
77                                         opts->tsecr = get_unaligned_be32(ptr + 4);
78                                         opts->options |= XT_SYNPROXY_OPT_TIMESTAMP;
79                                 }
80                                 break;
81                         case TCPOPT_SACK_PERM:
82                                 if (opsize == TCPOLEN_SACK_PERM)
83                                         opts->options |= XT_SYNPROXY_OPT_SACK_PERM;
84                                 break;
85                         }
86
87                         ptr += opsize - 2;
88                         length -= opsize;
89                 }
90         }
91         return true;
92 }
93 EXPORT_SYMBOL_GPL(synproxy_parse_options);
94
95 unsigned int synproxy_options_size(const struct synproxy_options *opts)
96 {
97         unsigned int size = 0;
98
99         if (opts->options & XT_SYNPROXY_OPT_MSS)
100                 size += TCPOLEN_MSS_ALIGNED;
101         if (opts->options & XT_SYNPROXY_OPT_TIMESTAMP)
102                 size += TCPOLEN_TSTAMP_ALIGNED;
103         else if (opts->options & XT_SYNPROXY_OPT_SACK_PERM)
104                 size += TCPOLEN_SACKPERM_ALIGNED;
105         if (opts->options & XT_SYNPROXY_OPT_WSCALE)
106                 size += TCPOLEN_WSCALE_ALIGNED;
107
108         return size;
109 }
110 EXPORT_SYMBOL_GPL(synproxy_options_size);
111
112 void
113 synproxy_build_options(struct tcphdr *th, const struct synproxy_options *opts)
114 {
115         __be32 *ptr = (__be32 *)(th + 1);
116         u8 options = opts->options;
117
118         if (options & XT_SYNPROXY_OPT_MSS)
119                 *ptr++ = htonl((TCPOPT_MSS << 24) |
120                                (TCPOLEN_MSS << 16) |
121                                opts->mss);
122
123         if (options & XT_SYNPROXY_OPT_TIMESTAMP) {
124                 if (options & XT_SYNPROXY_OPT_SACK_PERM)
125                         *ptr++ = htonl((TCPOPT_SACK_PERM << 24) |
126                                        (TCPOLEN_SACK_PERM << 16) |
127                                        (TCPOPT_TIMESTAMP << 8) |
128                                        TCPOLEN_TIMESTAMP);
129                 else
130                         *ptr++ = htonl((TCPOPT_NOP << 24) |
131                                        (TCPOPT_NOP << 16) |
132                                        (TCPOPT_TIMESTAMP << 8) |
133                                        TCPOLEN_TIMESTAMP);
134
135                 *ptr++ = htonl(opts->tsval);
136                 *ptr++ = htonl(opts->tsecr);
137         } else if (options & XT_SYNPROXY_OPT_SACK_PERM)
138                 *ptr++ = htonl((TCPOPT_NOP << 24) |
139                                (TCPOPT_NOP << 16) |
140                                (TCPOPT_SACK_PERM << 8) |
141                                TCPOLEN_SACK_PERM);
142
143         if (options & XT_SYNPROXY_OPT_WSCALE)
144                 *ptr++ = htonl((TCPOPT_NOP << 24) |
145                                (TCPOPT_WINDOW << 16) |
146                                (TCPOLEN_WINDOW << 8) |
147                                opts->wscale);
148 }
149 EXPORT_SYMBOL_GPL(synproxy_build_options);
150
151 void synproxy_init_timestamp_cookie(const struct xt_synproxy_info *info,
152                                     struct synproxy_options *opts)
153 {
154         opts->tsecr = opts->tsval;
155         opts->tsval = tcp_time_stamp & ~0x3f;
156
157         if (opts->options & XT_SYNPROXY_OPT_WSCALE) {
158                 opts->tsval |= opts->wscale;
159                 opts->wscale = info->wscale;
160         } else
161                 opts->tsval |= 0xf;
162
163         if (opts->options & XT_SYNPROXY_OPT_SACK_PERM)
164                 opts->tsval |= 1 << 4;
165
166         if (opts->options & XT_SYNPROXY_OPT_ECN)
167                 opts->tsval |= 1 << 5;
168 }
169 EXPORT_SYMBOL_GPL(synproxy_init_timestamp_cookie);
170
171 void synproxy_check_timestamp_cookie(struct synproxy_options *opts)
172 {
173         opts->wscale = opts->tsecr & 0xf;
174         if (opts->wscale != 0xf)
175                 opts->options |= XT_SYNPROXY_OPT_WSCALE;
176
177         opts->options |= opts->tsecr & (1 << 4) ? XT_SYNPROXY_OPT_SACK_PERM : 0;
178
179         opts->options |= opts->tsecr & (1 << 5) ? XT_SYNPROXY_OPT_ECN : 0;
180 }
181 EXPORT_SYMBOL_GPL(synproxy_check_timestamp_cookie);
182
183 unsigned int synproxy_tstamp_adjust(struct sk_buff *skb,
184                                     unsigned int protoff,
185                                     struct tcphdr *th,
186                                     struct nf_conn *ct,
187                                     enum ip_conntrack_info ctinfo,
188                                     const struct nf_conn_synproxy *synproxy)
189 {
190         unsigned int optoff, optend;
191         __be32 *ptr, old;
192
193         if (synproxy->tsoff == 0)
194                 return 1;
195
196         optoff = protoff + sizeof(struct tcphdr);
197         optend = protoff + th->doff * 4;
198
199         if (!skb_make_writable(skb, optend))
200                 return 0;
201
202         while (optoff < optend) {
203                 unsigned char *op = skb->data + optoff;
204
205                 switch (op[0]) {
206                 case TCPOPT_EOL:
207                         return 1;
208                 case TCPOPT_NOP:
209                         optoff++;
210                         continue;
211                 default:
212                         if (optoff + 1 == optend ||
213                             optoff + op[1] > optend ||
214                             op[1] < 2)
215                                 return 0;
216                         if (op[0] == TCPOPT_TIMESTAMP &&
217                             op[1] == TCPOLEN_TIMESTAMP) {
218                                 if (CTINFO2DIR(ctinfo) == IP_CT_DIR_REPLY) {
219                                         ptr = (__be32 *)&op[2];
220                                         old = *ptr;
221                                         *ptr = htonl(ntohl(*ptr) -
222                                                      synproxy->tsoff);
223                                 } else {
224                                         ptr = (__be32 *)&op[6];
225                                         old = *ptr;
226                                         *ptr = htonl(ntohl(*ptr) +
227                                                      synproxy->tsoff);
228                                 }
229                                 inet_proto_csum_replace4(&th->check, skb,
230                                                          old, *ptr, false);
231                                 return 1;
232                         }
233                         optoff += op[1];
234                 }
235         }
236         return 1;
237 }
238 EXPORT_SYMBOL_GPL(synproxy_tstamp_adjust);
239
240 static struct nf_ct_ext_type nf_ct_synproxy_extend __read_mostly = {
241         .len            = sizeof(struct nf_conn_synproxy),
242         .align          = __alignof__(struct nf_conn_synproxy),
243         .id             = NF_CT_EXT_SYNPROXY,
244 };
245
246 #ifdef CONFIG_PROC_FS
247 static void *synproxy_cpu_seq_start(struct seq_file *seq, loff_t *pos)
248 {
249         struct synproxy_net *snet = synproxy_pernet(seq_file_net(seq));
250         int cpu;
251
252         if (*pos == 0)
253                 return SEQ_START_TOKEN;
254
255         for (cpu = *pos - 1; cpu < nr_cpu_ids; cpu++) {
256                 if (!cpu_possible(cpu))
257                         continue;
258                 *pos = cpu + 1;
259                 return per_cpu_ptr(snet->stats, cpu);
260         }
261
262         return NULL;
263 }
264
265 static void *synproxy_cpu_seq_next(struct seq_file *seq, void *v, loff_t *pos)
266 {
267         struct synproxy_net *snet = synproxy_pernet(seq_file_net(seq));
268         int cpu;
269
270         for (cpu = *pos; cpu < nr_cpu_ids; cpu++) {
271                 if (!cpu_possible(cpu))
272                         continue;
273                 *pos = cpu + 1;
274                 return per_cpu_ptr(snet->stats, cpu);
275         }
276
277         return NULL;
278 }
279
/* seq_file ->stop: start/next acquire nothing, so there is nothing to undo. */
static void synproxy_cpu_seq_stop(struct seq_file *seq, void *v)
{
}
284
285 static int synproxy_cpu_seq_show(struct seq_file *seq, void *v)
286 {
287         struct synproxy_stats *stats = v;
288
289         if (v == SEQ_START_TOKEN) {
290                 seq_printf(seq, "entries\t\tsyn_received\t"
291                                 "cookie_invalid\tcookie_valid\t"
292                                 "cookie_retrans\tconn_reopened\n");
293                 return 0;
294         }
295
296         seq_printf(seq, "%08x\t%08x\t%08x\t%08x\t%08x\t%08x\n", 0,
297                    stats->syn_received,
298                    stats->cookie_invalid,
299                    stats->cookie_valid,
300                    stats->cookie_retrans,
301                    stats->conn_reopened);
302
303         return 0;
304 }
305
306 static const struct seq_operations synproxy_cpu_seq_ops = {
307         .start          = synproxy_cpu_seq_start,
308         .next           = synproxy_cpu_seq_next,
309         .stop           = synproxy_cpu_seq_stop,
310         .show           = synproxy_cpu_seq_show,
311 };
312
313 static int synproxy_cpu_seq_open(struct inode *inode, struct file *file)
314 {
315         return seq_open_net(inode, file, &synproxy_cpu_seq_ops,
316                             sizeof(struct seq_net_private));
317 }
318
319 static const struct file_operations synproxy_cpu_seq_fops = {
320         .owner          = THIS_MODULE,
321         .open           = synproxy_cpu_seq_open,
322         .read           = seq_read,
323         .llseek         = seq_lseek,
324         .release        = seq_release_net,
325 };
326
327 static int __net_init synproxy_proc_init(struct net *net)
328 {
329         if (!proc_create("synproxy", S_IRUGO, net->proc_net_stat,
330                          &synproxy_cpu_seq_fops))
331                 return -ENOMEM;
332         return 0;
333 }
334
335 static void __net_exit synproxy_proc_exit(struct net *net)
336 {
337         remove_proc_entry("synproxy", net->proc_net_stat);
338 }
339 #else
340 static int __net_init synproxy_proc_init(struct net *net)
341 {
342         return 0;
343 }
344
345 static void __net_exit synproxy_proc_exit(struct net *net)
346 {
347         return;
348 }
349 #endif /* CONFIG_PROC_FS */
350
351 static int __net_init synproxy_net_init(struct net *net)
352 {
353         struct synproxy_net *snet = synproxy_pernet(net);
354         struct nf_conn *ct;
355         int err = -ENOMEM;
356
357         ct = nf_ct_tmpl_alloc(net, &nf_ct_zone_dflt, GFP_KERNEL);
358         if (!ct)
359                 goto err1;
360
361         if (!nfct_seqadj_ext_add(ct))
362                 goto err2;
363         if (!nfct_synproxy_ext_add(ct))
364                 goto err2;
365
366         __set_bit(IPS_CONFIRMED_BIT, &ct->status);
367         nf_conntrack_get(&ct->ct_general);
368         snet->tmpl = ct;
369
370         snet->stats = alloc_percpu(struct synproxy_stats);
371         if (snet->stats == NULL)
372                 goto err2;
373
374         err = synproxy_proc_init(net);
375         if (err < 0)
376                 goto err3;
377
378         return 0;
379
380 err3:
381         free_percpu(snet->stats);
382 err2:
383         nf_ct_tmpl_free(ct);
384 err1:
385         return err;
386 }
387
388 static void __net_exit synproxy_net_exit(struct net *net)
389 {
390         struct synproxy_net *snet = synproxy_pernet(net);
391
392         nf_ct_put(snet->tmpl);
393         synproxy_proc_exit(net);
394         free_percpu(snet->stats);
395 }
396
397 static struct pernet_operations synproxy_net_ops = {
398         .init           = synproxy_net_init,
399         .exit           = synproxy_net_exit,
400         .id             = &synproxy_net_id,
401         .size           = sizeof(struct synproxy_net),
402 };
403
404 static int __init synproxy_core_init(void)
405 {
406         int err;
407
408         err = nf_ct_extend_register(&nf_ct_synproxy_extend);
409         if (err < 0)
410                 goto err1;
411
412         err = register_pernet_subsys(&synproxy_net_ops);
413         if (err < 0)
414                 goto err2;
415
416         return 0;
417
418 err2:
419         nf_ct_extend_unregister(&nf_ct_synproxy_extend);
420 err1:
421         return err;
422 }
423
424 static void __exit synproxy_core_exit(void)
425 {
426         unregister_pernet_subsys(&synproxy_net_ops);
427         nf_ct_extend_unregister(&nf_ct_synproxy_extend);
428 }
429
/* Hook the init/exit routines into module load and unload. */
module_init(synproxy_core_init);
module_exit(synproxy_core_exit);

/* Module metadata. */
MODULE_LICENSE("GPL");
MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");