]> git.kernelconcepts.de Git - karo-tx-linux.git/blob - net/ipv4/ipcomp.c
Merge branch 'for-linus' of git://git.kernel.dk/linux-2.6-block
[karo-tx-linux.git] / net / ipv4 / ipcomp.c
1 /*
2  * IP Payload Compression Protocol (IPComp) - RFC3173.
3  *
4  * Copyright (c) 2003 James Morris <jmorris@intercode.com.au>
5  *
6  * This program is free software; you can redistribute it and/or modify it
7  * under the terms of the GNU General Public License as published by the Free
8  * Software Foundation; either version 2 of the License, or (at your option)
9  * any later version.
10  *
11  * Todo:
12  *   - Tunable compression parameters.
13  *   - Compression stats.
14  *   - Adaptive compression.
15  */
16 #include <linux/module.h>
17 #include <asm/semaphore.h>
18 #include <linux/crypto.h>
19 #include <linux/err.h>
20 #include <linux/pfkeyv2.h>
21 #include <linux/percpu.h>
22 #include <linux/smp.h>
23 #include <linux/list.h>
24 #include <linux/vmalloc.h>
25 #include <linux/rtnetlink.h>
26 #include <linux/mutex.h>
27 #include <net/ip.h>
28 #include <net/xfrm.h>
29 #include <net/icmp.h>
30 #include <net/ipcomp.h>
31 #include <net/protocol.h>
32
33 struct ipcomp_tfms {
34         struct list_head list;
35         struct crypto_comp **tfms;
36         int users;
37 };
38
39 static DEFINE_MUTEX(ipcomp_resource_mutex);
40 static void **ipcomp_scratches;
41 static int ipcomp_scratch_users;
42 static LIST_HEAD(ipcomp_tfms_list);
43
44 static int ipcomp_decompress(struct xfrm_state *x, struct sk_buff *skb)
45 {
46         struct ipcomp_data *ipcd = x->data;
47         const int plen = skb->len;
48         int dlen = IPCOMP_SCRATCH_SIZE;
49         const u8 *start = skb->data;
50         const int cpu = get_cpu();
51         u8 *scratch = *per_cpu_ptr(ipcomp_scratches, cpu);
52         struct crypto_comp *tfm = *per_cpu_ptr(ipcd->tfms, cpu);
53         int err = crypto_comp_decompress(tfm, start, plen, scratch, &dlen);
54
55         if (err)
56                 goto out;
57
58         if (dlen < (plen + sizeof(struct ip_comp_hdr))) {
59                 err = -EINVAL;
60                 goto out;
61         }
62
63         err = pskb_expand_head(skb, 0, dlen - plen, GFP_ATOMIC);
64         if (err)
65                 goto out;
66
67         skb->truesize += dlen - plen;
68         __skb_put(skb, dlen - plen);
69         skb_copy_to_linear_data(skb, scratch, dlen);
70 out:
71         put_cpu();
72         return err;
73 }
74
75 static int ipcomp_input(struct xfrm_state *x, struct sk_buff *skb)
76 {
77         int err = -ENOMEM;
78         struct ip_comp_hdr *ipch;
79
80         if (skb_linearize_cow(skb))
81                 goto out;
82
83         skb->ip_summed = CHECKSUM_NONE;
84
85         /* Remove ipcomp header and decompress original payload */
86         ipch = (void *)skb->data;
87         skb->transport_header = skb->network_header + sizeof(*ipch);
88         __skb_pull(skb, sizeof(*ipch));
89         err = ipcomp_decompress(x, skb);
90         if (err)
91                 goto out;
92
93         err = ipch->nexthdr;
94
95 out:
96         return err;
97 }
98
99 static int ipcomp_compress(struct xfrm_state *x, struct sk_buff *skb)
100 {
101         struct ipcomp_data *ipcd = x->data;
102         const int plen = skb->len;
103         int dlen = IPCOMP_SCRATCH_SIZE;
104         u8 *start = skb->data;
105         const int cpu = get_cpu();
106         u8 *scratch = *per_cpu_ptr(ipcomp_scratches, cpu);
107         struct crypto_comp *tfm = *per_cpu_ptr(ipcd->tfms, cpu);
108         int err = crypto_comp_compress(tfm, start, plen, scratch, &dlen);
109
110         if (err)
111                 goto out;
112
113         if ((dlen + sizeof(struct ip_comp_hdr)) >= plen) {
114                 err = -EMSGSIZE;
115                 goto out;
116         }
117
118         memcpy(start + sizeof(struct ip_comp_hdr), scratch, dlen);
119         put_cpu();
120
121         pskb_trim(skb, dlen + sizeof(struct ip_comp_hdr));
122         return 0;
123
124 out:
125         put_cpu();
126         return err;
127 }
128
129 static int ipcomp_output(struct xfrm_state *x, struct sk_buff *skb)
130 {
131         int err;
132         struct ip_comp_hdr *ipch;
133         struct ipcomp_data *ipcd = x->data;
134
135         if (skb->len < ipcd->threshold) {
136                 /* Don't bother compressing */
137                 goto out_ok;
138         }
139
140         if (skb_linearize_cow(skb))
141                 goto out_ok;
142
143         err = ipcomp_compress(x, skb);
144
145         if (err) {
146                 goto out_ok;
147         }
148
149         /* Install ipcomp header, convert into ipcomp datagram. */
150         ipch = ip_comp_hdr(skb);
151         ipch->nexthdr = *skb_mac_header(skb);
152         ipch->flags = 0;
153         ipch->cpi = htons((u16 )ntohl(x->id.spi));
154         *skb_mac_header(skb) = IPPROTO_COMP;
155 out_ok:
156         skb_push(skb, -skb_network_offset(skb));
157         return 0;
158 }
159
160 static void ipcomp4_err(struct sk_buff *skb, u32 info)
161 {
162         __be32 spi;
163         struct iphdr *iph = (struct iphdr *)skb->data;
164         struct ip_comp_hdr *ipch = (struct ip_comp_hdr *)(skb->data+(iph->ihl<<2));
165         struct xfrm_state *x;
166
167         if (icmp_hdr(skb)->type != ICMP_DEST_UNREACH ||
168             icmp_hdr(skb)->code != ICMP_FRAG_NEEDED)
169                 return;
170
171         spi = htonl(ntohs(ipch->cpi));
172         x = xfrm_state_lookup((xfrm_address_t *)&iph->daddr,
173                               spi, IPPROTO_COMP, AF_INET);
174         if (!x)
175                 return;
176         NETDEBUG(KERN_DEBUG "pmtu discovery on SA IPCOMP/%08x/%u.%u.%u.%u\n",
177                  spi, NIPQUAD(iph->daddr));
178         xfrm_state_put(x);
179 }
180
181 /* We always hold one tunnel user reference to indicate a tunnel */
182 static struct xfrm_state *ipcomp_tunnel_create(struct xfrm_state *x)
183 {
184         struct xfrm_state *t;
185         u8 mode = XFRM_MODE_TUNNEL;
186
187         t = xfrm_state_alloc();
188         if (t == NULL)
189                 goto out;
190
191         t->id.proto = IPPROTO_IPIP;
192         t->id.spi = x->props.saddr.a4;
193         t->id.daddr.a4 = x->id.daddr.a4;
194         memcpy(&t->sel, &x->sel, sizeof(t->sel));
195         t->props.family = AF_INET;
196         if (x->props.mode == XFRM_MODE_BEET)
197                 mode = x->props.mode;
198         t->props.mode = mode;
199         t->props.saddr.a4 = x->props.saddr.a4;
200         t->props.flags = x->props.flags;
201
202         if (xfrm_init_state(t))
203                 goto error;
204
205         atomic_set(&t->tunnel_users, 1);
206 out:
207         return t;
208
209 error:
210         t->km.state = XFRM_STATE_DEAD;
211         xfrm_state_put(t);
212         t = NULL;
213         goto out;
214 }
215
216 /*
217  * Must be protected by xfrm_cfg_mutex.  State and tunnel user references are
218  * always incremented on success.
219  */
220 static int ipcomp_tunnel_attach(struct xfrm_state *x)
221 {
222         int err = 0;
223         struct xfrm_state *t;
224
225         t = xfrm_state_lookup((xfrm_address_t *)&x->id.daddr.a4,
226                               x->props.saddr.a4, IPPROTO_IPIP, AF_INET);
227         if (!t) {
228                 t = ipcomp_tunnel_create(x);
229                 if (!t) {
230                         err = -EINVAL;
231                         goto out;
232                 }
233                 xfrm_state_insert(t);
234                 xfrm_state_hold(t);
235         }
236         x->tunnel = t;
237         atomic_inc(&t->tunnel_users);
238 out:
239         return err;
240 }
241
242 static void ipcomp_free_scratches(void)
243 {
244         int i;
245         void **scratches;
246
247         if (--ipcomp_scratch_users)
248                 return;
249
250         scratches = ipcomp_scratches;
251         if (!scratches)
252                 return;
253
254         for_each_possible_cpu(i)
255                 vfree(*per_cpu_ptr(scratches, i));
256
257         free_percpu(scratches);
258 }
259
260 static void **ipcomp_alloc_scratches(void)
261 {
262         int i;
263         void **scratches;
264
265         if (ipcomp_scratch_users++)
266                 return ipcomp_scratches;
267
268         scratches = alloc_percpu(void *);
269         if (!scratches)
270                 return NULL;
271
272         ipcomp_scratches = scratches;
273
274         for_each_possible_cpu(i) {
275                 void *scratch = vmalloc(IPCOMP_SCRATCH_SIZE);
276                 if (!scratch)
277                         return NULL;
278                 *per_cpu_ptr(scratches, i) = scratch;
279         }
280
281         return scratches;
282 }
283
284 static void ipcomp_free_tfms(struct crypto_comp **tfms)
285 {
286         struct ipcomp_tfms *pos;
287         int cpu;
288
289         list_for_each_entry(pos, &ipcomp_tfms_list, list) {
290                 if (pos->tfms == tfms)
291                         break;
292         }
293
294         BUG_TRAP(pos);
295
296         if (--pos->users)
297                 return;
298
299         list_del(&pos->list);
300         kfree(pos);
301
302         if (!tfms)
303                 return;
304
305         for_each_possible_cpu(cpu) {
306                 struct crypto_comp *tfm = *per_cpu_ptr(tfms, cpu);
307                 crypto_free_comp(tfm);
308         }
309         free_percpu(tfms);
310 }
311
312 static struct crypto_comp **ipcomp_alloc_tfms(const char *alg_name)
313 {
314         struct ipcomp_tfms *pos;
315         struct crypto_comp **tfms;
316         int cpu;
317
318         /* This can be any valid CPU ID so we don't need locking. */
319         cpu = raw_smp_processor_id();
320
321         list_for_each_entry(pos, &ipcomp_tfms_list, list) {
322                 struct crypto_comp *tfm;
323
324                 tfms = pos->tfms;
325                 tfm = *per_cpu_ptr(tfms, cpu);
326
327                 if (!strcmp(crypto_comp_name(tfm), alg_name)) {
328                         pos->users++;
329                         return tfms;
330                 }
331         }
332
333         pos = kmalloc(sizeof(*pos), GFP_KERNEL);
334         if (!pos)
335                 return NULL;
336
337         pos->users = 1;
338         INIT_LIST_HEAD(&pos->list);
339         list_add(&pos->list, &ipcomp_tfms_list);
340
341         pos->tfms = tfms = alloc_percpu(struct crypto_comp *);
342         if (!tfms)
343                 goto error;
344
345         for_each_possible_cpu(cpu) {
346                 struct crypto_comp *tfm = crypto_alloc_comp(alg_name, 0,
347                                                             CRYPTO_ALG_ASYNC);
348                 if (IS_ERR(tfm))
349                         goto error;
350                 *per_cpu_ptr(tfms, cpu) = tfm;
351         }
352
353         return tfms;
354
355 error:
356         ipcomp_free_tfms(tfms);
357         return NULL;
358 }
359
360 static void ipcomp_free_data(struct ipcomp_data *ipcd)
361 {
362         if (ipcd->tfms)
363                 ipcomp_free_tfms(ipcd->tfms);
364         ipcomp_free_scratches();
365 }
366
367 static void ipcomp_destroy(struct xfrm_state *x)
368 {
369         struct ipcomp_data *ipcd = x->data;
370         if (!ipcd)
371                 return;
372         xfrm_state_delete_tunnel(x);
373         mutex_lock(&ipcomp_resource_mutex);
374         ipcomp_free_data(ipcd);
375         mutex_unlock(&ipcomp_resource_mutex);
376         kfree(ipcd);
377 }
378
379 static int ipcomp_init_state(struct xfrm_state *x)
380 {
381         int err;
382         struct ipcomp_data *ipcd;
383         struct xfrm_algo_desc *calg_desc;
384
385         err = -EINVAL;
386         if (!x->calg)
387                 goto out;
388
389         if (x->encap)
390                 goto out;
391
392         err = -ENOMEM;
393         ipcd = kzalloc(sizeof(*ipcd), GFP_KERNEL);
394         if (!ipcd)
395                 goto out;
396
397         x->props.header_len = 0;
398         if (x->props.mode == XFRM_MODE_TUNNEL)
399                 x->props.header_len += sizeof(struct iphdr);
400
401         mutex_lock(&ipcomp_resource_mutex);
402         if (!ipcomp_alloc_scratches())
403                 goto error;
404
405         ipcd->tfms = ipcomp_alloc_tfms(x->calg->alg_name);
406         if (!ipcd->tfms)
407                 goto error;
408         mutex_unlock(&ipcomp_resource_mutex);
409
410         if (x->props.mode == XFRM_MODE_TUNNEL) {
411                 err = ipcomp_tunnel_attach(x);
412                 if (err)
413                         goto error_tunnel;
414         }
415
416         calg_desc = xfrm_calg_get_byname(x->calg->alg_name, 0);
417         BUG_ON(!calg_desc);
418         ipcd->threshold = calg_desc->uinfo.comp.threshold;
419         x->data = ipcd;
420         err = 0;
421 out:
422         return err;
423
424 error_tunnel:
425         mutex_lock(&ipcomp_resource_mutex);
426 error:
427         ipcomp_free_data(ipcd);
428         mutex_unlock(&ipcomp_resource_mutex);
429         kfree(ipcd);
430         goto out;
431 }
432
433 static struct xfrm_type ipcomp_type = {
434         .description    = "IPCOMP4",
435         .owner          = THIS_MODULE,
436         .proto          = IPPROTO_COMP,
437         .init_state     = ipcomp_init_state,
438         .destructor     = ipcomp_destroy,
439         .input          = ipcomp_input,
440         .output         = ipcomp_output
441 };
442
443 static struct net_protocol ipcomp4_protocol = {
444         .handler        =       xfrm4_rcv,
445         .err_handler    =       ipcomp4_err,
446         .no_policy      =       1,
447 };
448
449 static int __init ipcomp4_init(void)
450 {
451         if (xfrm_register_type(&ipcomp_type, AF_INET) < 0) {
452                 printk(KERN_INFO "ipcomp init: can't add xfrm type\n");
453                 return -EAGAIN;
454         }
455         if (inet_add_protocol(&ipcomp4_protocol, IPPROTO_COMP) < 0) {
456                 printk(KERN_INFO "ipcomp init: can't add protocol\n");
457                 xfrm_unregister_type(&ipcomp_type, AF_INET);
458                 return -EAGAIN;
459         }
460         return 0;
461 }
462
463 static void __exit ipcomp4_fini(void)
464 {
465         if (inet_del_protocol(&ipcomp4_protocol, IPPROTO_COMP) < 0)
466                 printk(KERN_INFO "ip ipcomp close: can't remove protocol\n");
467         if (xfrm_unregister_type(&ipcomp_type, AF_INET) < 0)
468                 printk(KERN_INFO "ip ipcomp close: can't remove xfrm type\n");
469 }
470
471 module_init(ipcomp4_init);
472 module_exit(ipcomp4_fini);
473
474 MODULE_LICENSE("GPL");
475 MODULE_DESCRIPTION("IP Payload Compression Protocol (IPComp) - RFC3173");
476 MODULE_AUTHOR("James Morris <jmorris@intercode.com.au>");
477
478 MODULE_ALIAS_XFRM_TYPE(AF_INET, XFRM_PROTO_COMP);