blob: aa704b88f014fa7118a8ccfc92fc067b65108c48 [file] [log] [blame]
/*
 * IP Payload Compression Protocol (IPComp) - RFC3173.
 *
 * Copyright (c) 2003 James Morris <jmorris@intercode.com.au>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License as published by the Free
 * Software Foundation; either version 2 of the License, or (at your option)
 * any later version.
 *
 * Todo:
 *   - Tunable compression parameters.
 *   - Compression stats.
 *   - Adaptive compression.
 */
#include <linux/module.h>
#include <asm/scatterlist.h>
#include <asm/semaphore.h>
#include <linux/crypto.h>
#include <linux/err.h>
#include <linux/pfkeyv2.h>
#include <linux/percpu.h>
#include <linux/smp.h>
#include <linux/list.h>
#include <linux/vmalloc.h>
#include <linux/rtnetlink.h>
#include <linux/mutex.h>
#include <net/ip.h>
#include <net/xfrm.h>
#include <net/icmp.h>
#include <net/ipcomp.h>
#include <net/protocol.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032
33struct ipcomp_tfms {
34 struct list_head list;
Herbert Xue4d5b792006-08-26 18:12:40 +100035 struct crypto_comp **tfms;
Linus Torvalds1da177e2005-04-16 15:20:36 -070036 int users;
37};
38
/*
 * Shared resources.  ipcomp_resource_mutex is taken by ipcomp_init_state()
 * and ipcomp_destroy() around every allocation or release of the scratch
 * buffers and of the transform sets below.
 */
static DEFINE_MUTEX(ipcomp_resource_mutex);

/* Per-CPU pointers to scratch buffers of IPCOMP_SCRATCH_SIZE bytes. */
static void **ipcomp_scratches;

/* Number of users currently holding a reference on ipcomp_scratches. */
static int ipcomp_scratch_users;

/* All live struct ipcomp_tfms entries. */
static LIST_HEAD(ipcomp_tfms_list);
43
44static int ipcomp_decompress(struct xfrm_state *x, struct sk_buff *skb)
45{
46 int err, plen, dlen;
Linus Torvalds1da177e2005-04-16 15:20:36 -070047 struct ipcomp_data *ipcd = x->data;
48 u8 *start, *scratch;
Herbert Xue4d5b792006-08-26 18:12:40 +100049 struct crypto_comp *tfm;
Linus Torvalds1da177e2005-04-16 15:20:36 -070050 int cpu;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090051
Linus Torvalds1da177e2005-04-16 15:20:36 -070052 plen = skb->len;
53 dlen = IPCOMP_SCRATCH_SIZE;
54 start = skb->data;
55
56 cpu = get_cpu();
57 scratch = *per_cpu_ptr(ipcomp_scratches, cpu);
58 tfm = *per_cpu_ptr(ipcd->tfms, cpu);
59
60 err = crypto_comp_decompress(tfm, start, plen, scratch, &dlen);
61 if (err)
62 goto out;
63
64 if (dlen < (plen + sizeof(struct ip_comp_hdr))) {
65 err = -EINVAL;
66 goto out;
67 }
68
69 err = pskb_expand_head(skb, 0, dlen - plen, GFP_ATOMIC);
70 if (err)
71 goto out;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090072
Herbert Xuda952312006-07-11 13:50:09 -070073 skb->truesize += dlen - plen;
74 __skb_put(skb, dlen - plen);
Linus Torvalds1da177e2005-04-16 15:20:36 -070075 memcpy(skb->data, scratch, dlen);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090076out:
Linus Torvalds1da177e2005-04-16 15:20:36 -070077 put_cpu();
78 return err;
79}
80
Herbert Xue6956332006-04-01 00:52:46 -080081static int ipcomp_input(struct xfrm_state *x, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -070082{
Herbert Xu364c6ba2006-06-09 16:10:40 -070083 int err = -ENOMEM;
Linus Torvalds1da177e2005-04-16 15:20:36 -070084 struct iphdr *iph;
Herbert Xu31a4ab92006-05-27 23:06:13 -070085 struct ip_comp_hdr *ipch;
Linus Torvalds1da177e2005-04-16 15:20:36 -070086
Herbert Xu364c6ba2006-06-09 16:10:40 -070087 if (skb_linearize_cow(skb))
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090088 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -070089
90 skb->ip_summed = CHECKSUM_NONE;
91
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090092 /* Remove ipcomp header and decompress original payload */
Linus Torvalds1da177e2005-04-16 15:20:36 -070093 iph = skb->nh.iph;
Herbert Xu31a4ab92006-05-27 23:06:13 -070094 ipch = (void *)skb->data;
95 iph->protocol = ipch->nexthdr;
96 skb->h.raw = skb->nh.raw + sizeof(*ipch);
97 __skb_pull(skb, sizeof(*ipch));
Linus Torvalds1da177e2005-04-16 15:20:36 -070098 err = ipcomp_decompress(x, skb);
99
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900100out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700101 return err;
102}
103
104static int ipcomp_compress(struct xfrm_state *x, struct sk_buff *skb)
105{
106 int err, plen, dlen, ihlen;
107 struct iphdr *iph = skb->nh.iph;
108 struct ipcomp_data *ipcd = x->data;
109 u8 *start, *scratch;
Herbert Xue4d5b792006-08-26 18:12:40 +1000110 struct crypto_comp *tfm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111 int cpu;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900112
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113 ihlen = iph->ihl * 4;
114 plen = skb->len - ihlen;
115 dlen = IPCOMP_SCRATCH_SIZE;
116 start = skb->data + ihlen;
117
118 cpu = get_cpu();
119 scratch = *per_cpu_ptr(ipcomp_scratches, cpu);
120 tfm = *per_cpu_ptr(ipcd->tfms, cpu);
121
122 err = crypto_comp_compress(tfm, start, plen, scratch, &dlen);
123 if (err)
124 goto out;
125
126 if ((dlen + sizeof(struct ip_comp_hdr)) >= plen) {
127 err = -EMSGSIZE;
128 goto out;
129 }
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900130
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131 memcpy(start + sizeof(struct ip_comp_hdr), scratch, dlen);
132 put_cpu();
133
134 pskb_trim(skb, ihlen + dlen + sizeof(struct ip_comp_hdr));
135 return 0;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900136
137out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700138 put_cpu();
139 return err;
140}
141
142static int ipcomp_output(struct xfrm_state *x, struct sk_buff *skb)
143{
144 int err;
145 struct iphdr *iph;
146 struct ip_comp_hdr *ipch;
147 struct ipcomp_data *ipcd = x->data;
148 int hdr_len = 0;
149
150 iph = skb->nh.iph;
151 iph->tot_len = htons(skb->len);
152 hdr_len = iph->ihl * 4;
153 if ((skb->len - hdr_len) < ipcd->threshold) {
154 /* Don't bother compressing */
155 goto out_ok;
156 }
157
Herbert Xu364c6ba2006-06-09 16:10:40 -0700158 if (skb_linearize_cow(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700159 goto out_ok;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900160
Linus Torvalds1da177e2005-04-16 15:20:36 -0700161 err = ipcomp_compress(x, skb);
162 iph = skb->nh.iph;
163
164 if (err) {
165 goto out_ok;
166 }
167
168 /* Install ipcomp header, convert into ipcomp datagram. */
169 iph->tot_len = htons(skb->len);
170 ipch = (struct ip_comp_hdr *)((char *)iph + iph->ihl * 4);
171 ipch->nexthdr = iph->protocol;
172 ipch->flags = 0;
173 ipch->cpi = htons((u16 )ntohl(x->id.spi));
174 iph->protocol = IPPROTO_COMP;
175 ip_send_check(iph);
176 return 0;
177
178out_ok:
Masahide NAKAMURA7e49e6d2006-09-22 15:05:15 -0700179 if (x->props.mode == XFRM_MODE_TUNNEL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180 ip_send_check(iph);
181 return 0;
182}
183
184static void ipcomp4_err(struct sk_buff *skb, u32 info)
185{
Al Viroa94cfd12006-09-27 18:47:24 -0700186 __be32 spi;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700187 struct iphdr *iph = (struct iphdr *)skb->data;
188 struct ip_comp_hdr *ipch = (struct ip_comp_hdr *)(skb->data+(iph->ihl<<2));
189 struct xfrm_state *x;
190
191 if (skb->h.icmph->type != ICMP_DEST_UNREACH ||
192 skb->h.icmph->code != ICMP_FRAG_NEEDED)
193 return;
194
Alexey Dobriyan4195f812006-05-22 16:53:22 -0700195 spi = htonl(ntohs(ipch->cpi));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700196 x = xfrm_state_lookup((xfrm_address_t *)&iph->daddr,
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900197 spi, IPPROTO_COMP, AF_INET);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700198 if (!x)
199 return;
Patrick McHardy64ce2072005-08-09 20:50:53 -0700200 NETDEBUG(KERN_DEBUG "pmtu discovery on SA IPCOMP/%08x/%u.%u.%u.%u\n",
201 spi, NIPQUAD(iph->daddr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700202 xfrm_state_put(x);
203}
204
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900205/* We always hold one tunnel user reference to indicate a tunnel */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206static struct xfrm_state *ipcomp_tunnel_create(struct xfrm_state *x)
207{
208 struct xfrm_state *t;
Diego Beltrami0a69452c2006-10-03 23:47:05 -0700209 u8 mode = XFRM_MODE_TUNNEL;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900210
Linus Torvalds1da177e2005-04-16 15:20:36 -0700211 t = xfrm_state_alloc();
212 if (t == NULL)
213 goto out;
214
215 t->id.proto = IPPROTO_IPIP;
216 t->id.spi = x->props.saddr.a4;
217 t->id.daddr.a4 = x->id.daddr.a4;
218 memcpy(&t->sel, &x->sel, sizeof(t->sel));
219 t->props.family = AF_INET;
Diego Beltrami0a69452c2006-10-03 23:47:05 -0700220 if (x->props.mode == XFRM_MODE_BEET)
221 mode = x->props.mode;
222 t->props.mode = mode;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223 t->props.saddr.a4 = x->props.saddr.a4;
224 t->props.flags = x->props.flags;
Herbert Xu72cb6962005-06-20 13:18:08 -0700225
226 if (xfrm_init_state(t))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227 goto error;
228
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 atomic_set(&t->tunnel_users, 1);
230out:
231 return t;
232
233error:
234 t->km.state = XFRM_STATE_DEAD;
235 xfrm_state_put(t);
236 t = NULL;
237 goto out;
238}
239
240/*
Arjan van de Ven4a3e2f72006-03-20 22:33:17 -0800241 * Must be protected by xfrm_cfg_mutex. State and tunnel user references are
Linus Torvalds1da177e2005-04-16 15:20:36 -0700242 * always incremented on success.
243 */
244static int ipcomp_tunnel_attach(struct xfrm_state *x)
245{
246 int err = 0;
247 struct xfrm_state *t;
248
249 t = xfrm_state_lookup((xfrm_address_t *)&x->id.daddr.a4,
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900250 x->props.saddr.a4, IPPROTO_IPIP, AF_INET);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251 if (!t) {
252 t = ipcomp_tunnel_create(x);
253 if (!t) {
254 err = -EINVAL;
255 goto out;
256 }
257 xfrm_state_insert(t);
258 xfrm_state_hold(t);
259 }
260 x->tunnel = t;
261 atomic_inc(&t->tunnel_users);
262out:
263 return err;
264}
265
266static void ipcomp_free_scratches(void)
267{
268 int i;
269 void **scratches;
270
271 if (--ipcomp_scratch_users)
272 return;
273
274 scratches = ipcomp_scratches;
275 if (!scratches)
276 return;
277
Jesper Juhl63903ca2006-04-18 14:51:44 -0700278 for_each_possible_cpu(i)
279 vfree(*per_cpu_ptr(scratches, i));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280
281 free_percpu(scratches);
282}
283
284static void **ipcomp_alloc_scratches(void)
285{
286 int i;
287 void **scratches;
288
289 if (ipcomp_scratch_users++)
290 return ipcomp_scratches;
291
292 scratches = alloc_percpu(void *);
293 if (!scratches)
294 return NULL;
295
296 ipcomp_scratches = scratches;
297
KAMEZAWA Hiroyuki6f912042006-04-10 22:52:50 -0700298 for_each_possible_cpu(i) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700299 void *scratch = vmalloc(IPCOMP_SCRATCH_SIZE);
300 if (!scratch)
301 return NULL;
302 *per_cpu_ptr(scratches, i) = scratch;
303 }
304
305 return scratches;
306}
307
Herbert Xue4d5b792006-08-26 18:12:40 +1000308static void ipcomp_free_tfms(struct crypto_comp **tfms)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700309{
310 struct ipcomp_tfms *pos;
311 int cpu;
312
313 list_for_each_entry(pos, &ipcomp_tfms_list, list) {
314 if (pos->tfms == tfms)
315 break;
316 }
317
318 BUG_TRAP(pos);
319
320 if (--pos->users)
321 return;
322
323 list_del(&pos->list);
324 kfree(pos);
325
326 if (!tfms)
327 return;
328
KAMEZAWA Hiroyuki6f912042006-04-10 22:52:50 -0700329 for_each_possible_cpu(cpu) {
Herbert Xue4d5b792006-08-26 18:12:40 +1000330 struct crypto_comp *tfm = *per_cpu_ptr(tfms, cpu);
331 crypto_free_comp(tfm);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332 }
333 free_percpu(tfms);
334}
335
Herbert Xue4d5b792006-08-26 18:12:40 +1000336static struct crypto_comp **ipcomp_alloc_tfms(const char *alg_name)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700337{
338 struct ipcomp_tfms *pos;
Herbert Xue4d5b792006-08-26 18:12:40 +1000339 struct crypto_comp **tfms;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340 int cpu;
341
342 /* This can be any valid CPU ID so we don't need locking. */
Herbert Xu6fc8b9e2005-08-18 14:36:59 -0700343 cpu = raw_smp_processor_id();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344
345 list_for_each_entry(pos, &ipcomp_tfms_list, list) {
Herbert Xue4d5b792006-08-26 18:12:40 +1000346 struct crypto_comp *tfm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700347
348 tfms = pos->tfms;
349 tfm = *per_cpu_ptr(tfms, cpu);
350
Herbert Xue4d5b792006-08-26 18:12:40 +1000351 if (!strcmp(crypto_comp_name(tfm), alg_name)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700352 pos->users++;
353 return tfms;
354 }
355 }
356
357 pos = kmalloc(sizeof(*pos), GFP_KERNEL);
358 if (!pos)
359 return NULL;
360
361 pos->users = 1;
362 INIT_LIST_HEAD(&pos->list);
363 list_add(&pos->list, &ipcomp_tfms_list);
364
Herbert Xue4d5b792006-08-26 18:12:40 +1000365 pos->tfms = tfms = alloc_percpu(struct crypto_comp *);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700366 if (!tfms)
367 goto error;
368
KAMEZAWA Hiroyuki6f912042006-04-10 22:52:50 -0700369 for_each_possible_cpu(cpu) {
Herbert Xue4d5b792006-08-26 18:12:40 +1000370 struct crypto_comp *tfm = crypto_alloc_comp(alg_name, 0,
371 CRYPTO_ALG_ASYNC);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372 if (!tfm)
373 goto error;
374 *per_cpu_ptr(tfms, cpu) = tfm;
375 }
376
377 return tfms;
378
379error:
380 ipcomp_free_tfms(tfms);
381 return NULL;
382}
383
384static void ipcomp_free_data(struct ipcomp_data *ipcd)
385{
386 if (ipcd->tfms)
387 ipcomp_free_tfms(ipcd->tfms);
388 ipcomp_free_scratches();
389}
390
391static void ipcomp_destroy(struct xfrm_state *x)
392{
393 struct ipcomp_data *ipcd = x->data;
394 if (!ipcd)
395 return;
396 xfrm_state_delete_tunnel(x);
Arjan van de Ven4a3e2f72006-03-20 22:33:17 -0800397 mutex_lock(&ipcomp_resource_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700398 ipcomp_free_data(ipcd);
Arjan van de Ven4a3e2f72006-03-20 22:33:17 -0800399 mutex_unlock(&ipcomp_resource_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700400 kfree(ipcd);
401}
402
Herbert Xu72cb6962005-06-20 13:18:08 -0700403static int ipcomp_init_state(struct xfrm_state *x)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700404{
405 int err;
406 struct ipcomp_data *ipcd;
407 struct xfrm_algo_desc *calg_desc;
408
409 err = -EINVAL;
410 if (!x->calg)
411 goto out;
412
413 if (x->encap)
414 goto out;
415
416 err = -ENOMEM;
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700417 ipcd = kzalloc(sizeof(*ipcd), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700418 if (!ipcd)
419 goto out;
420
Linus Torvalds1da177e2005-04-16 15:20:36 -0700421 x->props.header_len = 0;
Masahide NAKAMURA7e49e6d2006-09-22 15:05:15 -0700422 if (x->props.mode == XFRM_MODE_TUNNEL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700423 x->props.header_len += sizeof(struct iphdr);
424
Arjan van de Ven4a3e2f72006-03-20 22:33:17 -0800425 mutex_lock(&ipcomp_resource_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700426 if (!ipcomp_alloc_scratches())
427 goto error;
428
429 ipcd->tfms = ipcomp_alloc_tfms(x->calg->alg_name);
430 if (!ipcd->tfms)
431 goto error;
Arjan van de Ven4a3e2f72006-03-20 22:33:17 -0800432 mutex_unlock(&ipcomp_resource_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700433
Masahide NAKAMURA7e49e6d2006-09-22 15:05:15 -0700434 if (x->props.mode == XFRM_MODE_TUNNEL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435 err = ipcomp_tunnel_attach(x);
436 if (err)
437 goto error_tunnel;
438 }
439
440 calg_desc = xfrm_calg_get_byname(x->calg->alg_name, 0);
441 BUG_ON(!calg_desc);
442 ipcd->threshold = calg_desc->uinfo.comp.threshold;
443 x->data = ipcd;
444 err = 0;
445out:
446 return err;
447
448error_tunnel:
Arjan van de Ven4a3e2f72006-03-20 22:33:17 -0800449 mutex_lock(&ipcomp_resource_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700450error:
451 ipcomp_free_data(ipcd);
Arjan van de Ven4a3e2f72006-03-20 22:33:17 -0800452 mutex_unlock(&ipcomp_resource_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700453 kfree(ipcd);
454 goto out;
455}
456
457static struct xfrm_type ipcomp_type = {
458 .description = "IPCOMP4",
459 .owner = THIS_MODULE,
460 .proto = IPPROTO_COMP,
461 .init_state = ipcomp_init_state,
462 .destructor = ipcomp_destroy,
463 .input = ipcomp_input,
464 .output = ipcomp_output
465};
466
467static struct net_protocol ipcomp4_protocol = {
468 .handler = xfrm4_rcv,
469 .err_handler = ipcomp4_err,
470 .no_policy = 1,
471};
472
473static int __init ipcomp4_init(void)
474{
475 if (xfrm_register_type(&ipcomp_type, AF_INET) < 0) {
476 printk(KERN_INFO "ipcomp init: can't add xfrm type\n");
477 return -EAGAIN;
478 }
479 if (inet_add_protocol(&ipcomp4_protocol, IPPROTO_COMP) < 0) {
480 printk(KERN_INFO "ipcomp init: can't add protocol\n");
481 xfrm_unregister_type(&ipcomp_type, AF_INET);
482 return -EAGAIN;
483 }
484 return 0;
485}
486
487static void __exit ipcomp4_fini(void)
488{
489 if (inet_del_protocol(&ipcomp4_protocol, IPPROTO_COMP) < 0)
490 printk(KERN_INFO "ip ipcomp close: can't remove protocol\n");
491 if (xfrm_unregister_type(&ipcomp_type, AF_INET) < 0)
492 printk(KERN_INFO "ip ipcomp close: can't remove xfrm type\n");
493}
494
495module_init(ipcomp4_init);
496module_exit(ipcomp4_fini);
497
498MODULE_LICENSE("GPL");
499MODULE_DESCRIPTION("IP Payload Compression Protocol (IPComp) - RFC3173");
500MODULE_AUTHOR("James Morris <jmorris@intercode.com.au>");
501