[PATCH] slab: cache_reap(): further reduction in interrupt holdoff
[linux-2.6/linux-2.6-openrd.git] / net / ipv4 / ipcomp.c
blobc95020f7c81e38a2bdb0672fc7ecf5660c2f78d6
1 /*
2 * IP Payload Compression Protocol (IPComp) - RFC3173.
4 * Copyright (c) 2003 James Morris <jmorris@intercode.com.au>
6 * This program is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU General Public License as published by the Free
8 * Software Foundation; either version 2 of the License, or (at your option)
9 * any later version.
11 * Todo:
12 * - Tunable compression parameters.
13 * - Compression stats.
14 * - Adaptive compression.
16 #include <linux/config.h>
17 #include <linux/module.h>
18 #include <asm/scatterlist.h>
19 #include <asm/semaphore.h>
20 #include <linux/crypto.h>
21 #include <linux/pfkeyv2.h>
22 #include <linux/percpu.h>
23 #include <linux/smp.h>
24 #include <linux/list.h>
25 #include <linux/vmalloc.h>
26 #include <linux/rtnetlink.h>
27 #include <linux/mutex.h>
28 #include <net/ip.h>
29 #include <net/xfrm.h>
30 #include <net/icmp.h>
31 #include <net/ipcomp.h>
32 #include <net/protocol.h>
34 struct ipcomp_tfms {
35 struct list_head list;
36 struct crypto_tfm **tfms;
37 int users;
/* Taken around allocation and release of the scratch buffers and tfm sets. */
static DEFINE_MUTEX(ipcomp_resource_mutex);

/* Per-CPU array of scratch buffers, each IPCOMP_SCRATCH_SIZE bytes. */
static void **ipcomp_scratches;

/* Number of current users of ipcomp_scratches. */
static int ipcomp_scratch_users;

/* Every struct ipcomp_tfms that is currently allocated. */
static LIST_HEAD(ipcomp_tfms_list);
45 static int ipcomp_decompress(struct xfrm_state *x, struct sk_buff *skb)
47 int err, plen, dlen;
48 struct iphdr *iph;
49 struct ipcomp_data *ipcd = x->data;
50 u8 *start, *scratch;
51 struct crypto_tfm *tfm;
52 int cpu;
54 plen = skb->len;
55 dlen = IPCOMP_SCRATCH_SIZE;
56 start = skb->data;
58 cpu = get_cpu();
59 scratch = *per_cpu_ptr(ipcomp_scratches, cpu);
60 tfm = *per_cpu_ptr(ipcd->tfms, cpu);
62 err = crypto_comp_decompress(tfm, start, plen, scratch, &dlen);
63 if (err)
64 goto out;
66 if (dlen < (plen + sizeof(struct ip_comp_hdr))) {
67 err = -EINVAL;
68 goto out;
71 err = pskb_expand_head(skb, 0, dlen - plen, GFP_ATOMIC);
72 if (err)
73 goto out;
75 skb_put(skb, dlen - plen);
76 memcpy(skb->data, scratch, dlen);
77 iph = skb->nh.iph;
78 iph->tot_len = htons(dlen + iph->ihl * 4);
79 out:
80 put_cpu();
81 return err;
84 static int ipcomp_input(struct xfrm_state *x,
85 struct xfrm_decap_state *decap, struct sk_buff *skb)
87 u8 nexthdr;
88 int err = 0;
89 struct iphdr *iph;
90 union {
91 struct iphdr iph;
92 char buf[60];
93 } tmp_iph;
96 if ((skb_is_nonlinear(skb) || skb_cloned(skb)) &&
97 skb_linearize(skb, GFP_ATOMIC) != 0) {
98 err = -ENOMEM;
99 goto out;
102 skb->ip_summed = CHECKSUM_NONE;
104 /* Remove ipcomp header and decompress original payload */
105 iph = skb->nh.iph;
106 memcpy(&tmp_iph, iph, iph->ihl * 4);
107 nexthdr = *(u8 *)skb->data;
108 skb_pull(skb, sizeof(struct ip_comp_hdr));
109 skb->nh.raw += sizeof(struct ip_comp_hdr);
110 memcpy(skb->nh.raw, &tmp_iph, tmp_iph.iph.ihl * 4);
111 iph = skb->nh.iph;
112 iph->tot_len = htons(ntohs(iph->tot_len) - sizeof(struct ip_comp_hdr));
113 iph->protocol = nexthdr;
114 skb->h.raw = skb->data;
115 err = ipcomp_decompress(x, skb);
117 out:
118 return err;
121 static int ipcomp_compress(struct xfrm_state *x, struct sk_buff *skb)
123 int err, plen, dlen, ihlen;
124 struct iphdr *iph = skb->nh.iph;
125 struct ipcomp_data *ipcd = x->data;
126 u8 *start, *scratch;
127 struct crypto_tfm *tfm;
128 int cpu;
130 ihlen = iph->ihl * 4;
131 plen = skb->len - ihlen;
132 dlen = IPCOMP_SCRATCH_SIZE;
133 start = skb->data + ihlen;
135 cpu = get_cpu();
136 scratch = *per_cpu_ptr(ipcomp_scratches, cpu);
137 tfm = *per_cpu_ptr(ipcd->tfms, cpu);
139 err = crypto_comp_compress(tfm, start, plen, scratch, &dlen);
140 if (err)
141 goto out;
143 if ((dlen + sizeof(struct ip_comp_hdr)) >= plen) {
144 err = -EMSGSIZE;
145 goto out;
148 memcpy(start + sizeof(struct ip_comp_hdr), scratch, dlen);
149 put_cpu();
151 pskb_trim(skb, ihlen + dlen + sizeof(struct ip_comp_hdr));
152 return 0;
154 out:
155 put_cpu();
156 return err;
159 static int ipcomp_output(struct xfrm_state *x, struct sk_buff *skb)
161 int err;
162 struct iphdr *iph;
163 struct ip_comp_hdr *ipch;
164 struct ipcomp_data *ipcd = x->data;
165 int hdr_len = 0;
167 iph = skb->nh.iph;
168 iph->tot_len = htons(skb->len);
169 hdr_len = iph->ihl * 4;
170 if ((skb->len - hdr_len) < ipcd->threshold) {
171 /* Don't bother compressing */
172 goto out_ok;
175 if ((skb_is_nonlinear(skb) || skb_cloned(skb)) &&
176 skb_linearize(skb, GFP_ATOMIC) != 0) {
177 goto out_ok;
180 err = ipcomp_compress(x, skb);
181 iph = skb->nh.iph;
183 if (err) {
184 goto out_ok;
187 /* Install ipcomp header, convert into ipcomp datagram. */
188 iph->tot_len = htons(skb->len);
189 ipch = (struct ip_comp_hdr *)((char *)iph + iph->ihl * 4);
190 ipch->nexthdr = iph->protocol;
191 ipch->flags = 0;
192 ipch->cpi = htons((u16 )ntohl(x->id.spi));
193 iph->protocol = IPPROTO_COMP;
194 ip_send_check(iph);
195 return 0;
197 out_ok:
198 if (x->props.mode)
199 ip_send_check(iph);
200 return 0;
203 static void ipcomp4_err(struct sk_buff *skb, u32 info)
205 u32 spi;
206 struct iphdr *iph = (struct iphdr *)skb->data;
207 struct ip_comp_hdr *ipch = (struct ip_comp_hdr *)(skb->data+(iph->ihl<<2));
208 struct xfrm_state *x;
210 if (skb->h.icmph->type != ICMP_DEST_UNREACH ||
211 skb->h.icmph->code != ICMP_FRAG_NEEDED)
212 return;
214 spi = ntohl(ntohs(ipch->cpi));
215 x = xfrm_state_lookup((xfrm_address_t *)&iph->daddr,
216 spi, IPPROTO_COMP, AF_INET);
217 if (!x)
218 return;
219 NETDEBUG(KERN_DEBUG "pmtu discovery on SA IPCOMP/%08x/%u.%u.%u.%u\n",
220 spi, NIPQUAD(iph->daddr));
221 xfrm_state_put(x);
224 /* We always hold one tunnel user reference to indicate a tunnel */
225 static struct xfrm_state *ipcomp_tunnel_create(struct xfrm_state *x)
227 struct xfrm_state *t;
229 t = xfrm_state_alloc();
230 if (t == NULL)
231 goto out;
233 t->id.proto = IPPROTO_IPIP;
234 t->id.spi = x->props.saddr.a4;
235 t->id.daddr.a4 = x->id.daddr.a4;
236 memcpy(&t->sel, &x->sel, sizeof(t->sel));
237 t->props.family = AF_INET;
238 t->props.mode = 1;
239 t->props.saddr.a4 = x->props.saddr.a4;
240 t->props.flags = x->props.flags;
242 if (xfrm_init_state(t))
243 goto error;
245 atomic_set(&t->tunnel_users, 1);
246 out:
247 return t;
249 error:
250 t->km.state = XFRM_STATE_DEAD;
251 xfrm_state_put(t);
252 t = NULL;
253 goto out;
257 * Must be protected by xfrm_cfg_mutex. State and tunnel user references are
258 * always incremented on success.
260 static int ipcomp_tunnel_attach(struct xfrm_state *x)
262 int err = 0;
263 struct xfrm_state *t;
265 t = xfrm_state_lookup((xfrm_address_t *)&x->id.daddr.a4,
266 x->props.saddr.a4, IPPROTO_IPIP, AF_INET);
267 if (!t) {
268 t = ipcomp_tunnel_create(x);
269 if (!t) {
270 err = -EINVAL;
271 goto out;
273 xfrm_state_insert(t);
274 xfrm_state_hold(t);
276 x->tunnel = t;
277 atomic_inc(&t->tunnel_users);
278 out:
279 return err;
282 static void ipcomp_free_scratches(void)
284 int i;
285 void **scratches;
287 if (--ipcomp_scratch_users)
288 return;
290 scratches = ipcomp_scratches;
291 if (!scratches)
292 return;
294 for_each_cpu(i) {
295 void *scratch = *per_cpu_ptr(scratches, i);
296 if (scratch)
297 vfree(scratch);
300 free_percpu(scratches);
303 static void **ipcomp_alloc_scratches(void)
305 int i;
306 void **scratches;
308 if (ipcomp_scratch_users++)
309 return ipcomp_scratches;
311 scratches = alloc_percpu(void *);
312 if (!scratches)
313 return NULL;
315 ipcomp_scratches = scratches;
317 for_each_cpu(i) {
318 void *scratch = vmalloc(IPCOMP_SCRATCH_SIZE);
319 if (!scratch)
320 return NULL;
321 *per_cpu_ptr(scratches, i) = scratch;
324 return scratches;
327 static void ipcomp_free_tfms(struct crypto_tfm **tfms)
329 struct ipcomp_tfms *pos;
330 int cpu;
332 list_for_each_entry(pos, &ipcomp_tfms_list, list) {
333 if (pos->tfms == tfms)
334 break;
337 BUG_TRAP(pos);
339 if (--pos->users)
340 return;
342 list_del(&pos->list);
343 kfree(pos);
345 if (!tfms)
346 return;
348 for_each_cpu(cpu) {
349 struct crypto_tfm *tfm = *per_cpu_ptr(tfms, cpu);
350 crypto_free_tfm(tfm);
352 free_percpu(tfms);
355 static struct crypto_tfm **ipcomp_alloc_tfms(const char *alg_name)
357 struct ipcomp_tfms *pos;
358 struct crypto_tfm **tfms;
359 int cpu;
361 /* This can be any valid CPU ID so we don't need locking. */
362 cpu = raw_smp_processor_id();
364 list_for_each_entry(pos, &ipcomp_tfms_list, list) {
365 struct crypto_tfm *tfm;
367 tfms = pos->tfms;
368 tfm = *per_cpu_ptr(tfms, cpu);
370 if (!strcmp(crypto_tfm_alg_name(tfm), alg_name)) {
371 pos->users++;
372 return tfms;
376 pos = kmalloc(sizeof(*pos), GFP_KERNEL);
377 if (!pos)
378 return NULL;
380 pos->users = 1;
381 INIT_LIST_HEAD(&pos->list);
382 list_add(&pos->list, &ipcomp_tfms_list);
384 pos->tfms = tfms = alloc_percpu(struct crypto_tfm *);
385 if (!tfms)
386 goto error;
388 for_each_cpu(cpu) {
389 struct crypto_tfm *tfm = crypto_alloc_tfm(alg_name, 0);
390 if (!tfm)
391 goto error;
392 *per_cpu_ptr(tfms, cpu) = tfm;
395 return tfms;
397 error:
398 ipcomp_free_tfms(tfms);
399 return NULL;
402 static void ipcomp_free_data(struct ipcomp_data *ipcd)
404 if (ipcd->tfms)
405 ipcomp_free_tfms(ipcd->tfms);
406 ipcomp_free_scratches();
409 static void ipcomp_destroy(struct xfrm_state *x)
411 struct ipcomp_data *ipcd = x->data;
412 if (!ipcd)
413 return;
414 xfrm_state_delete_tunnel(x);
415 mutex_lock(&ipcomp_resource_mutex);
416 ipcomp_free_data(ipcd);
417 mutex_unlock(&ipcomp_resource_mutex);
418 kfree(ipcd);
421 static int ipcomp_init_state(struct xfrm_state *x)
423 int err;
424 struct ipcomp_data *ipcd;
425 struct xfrm_algo_desc *calg_desc;
427 err = -EINVAL;
428 if (!x->calg)
429 goto out;
431 if (x->encap)
432 goto out;
434 err = -ENOMEM;
435 ipcd = kmalloc(sizeof(*ipcd), GFP_KERNEL);
436 if (!ipcd)
437 goto out;
439 memset(ipcd, 0, sizeof(*ipcd));
440 x->props.header_len = 0;
441 if (x->props.mode)
442 x->props.header_len += sizeof(struct iphdr);
444 mutex_lock(&ipcomp_resource_mutex);
445 if (!ipcomp_alloc_scratches())
446 goto error;
448 ipcd->tfms = ipcomp_alloc_tfms(x->calg->alg_name);
449 if (!ipcd->tfms)
450 goto error;
451 mutex_unlock(&ipcomp_resource_mutex);
453 if (x->props.mode) {
454 err = ipcomp_tunnel_attach(x);
455 if (err)
456 goto error_tunnel;
459 calg_desc = xfrm_calg_get_byname(x->calg->alg_name, 0);
460 BUG_ON(!calg_desc);
461 ipcd->threshold = calg_desc->uinfo.comp.threshold;
462 x->data = ipcd;
463 err = 0;
464 out:
465 return err;
467 error_tunnel:
468 mutex_lock(&ipcomp_resource_mutex);
469 error:
470 ipcomp_free_data(ipcd);
471 mutex_unlock(&ipcomp_resource_mutex);
472 kfree(ipcd);
473 goto out;
476 static struct xfrm_type ipcomp_type = {
477 .description = "IPCOMP4",
478 .owner = THIS_MODULE,
479 .proto = IPPROTO_COMP,
480 .init_state = ipcomp_init_state,
481 .destructor = ipcomp_destroy,
482 .input = ipcomp_input,
483 .output = ipcomp_output
486 static struct net_protocol ipcomp4_protocol = {
487 .handler = xfrm4_rcv,
488 .err_handler = ipcomp4_err,
489 .no_policy = 1,
492 static int __init ipcomp4_init(void)
494 if (xfrm_register_type(&ipcomp_type, AF_INET) < 0) {
495 printk(KERN_INFO "ipcomp init: can't add xfrm type\n");
496 return -EAGAIN;
498 if (inet_add_protocol(&ipcomp4_protocol, IPPROTO_COMP) < 0) {
499 printk(KERN_INFO "ipcomp init: can't add protocol\n");
500 xfrm_unregister_type(&ipcomp_type, AF_INET);
501 return -EAGAIN;
503 return 0;
506 static void __exit ipcomp4_fini(void)
508 if (inet_del_protocol(&ipcomp4_protocol, IPPROTO_COMP) < 0)
509 printk(KERN_INFO "ip ipcomp close: can't remove protocol\n");
510 if (xfrm_unregister_type(&ipcomp_type, AF_INET) < 0)
511 printk(KERN_INFO "ip ipcomp close: can't remove xfrm type\n");
514 module_init(ipcomp4_init);
515 module_exit(ipcomp4_fini);
517 MODULE_LICENSE("GPL");
518 MODULE_DESCRIPTION("IP Payload Compression Protocol (IPComp) - RFC3173");
519 MODULE_AUTHOR("James Morris <jmorris@intercode.com.au>");