blob: 1fb60aba1e6ce7e42ea9ebfd3e1726bc1c316ac1 [file] [log] [blame]
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +09001/* net/sched/sch_ingress.c - Ingress qdisc
Linus Torvalds1da177e2005-04-16 15:20:36 -07002 * This program is free software; you can redistribute it and/or
3 * modify it under the terms of the GNU General Public License
4 * as published by the Free Software Foundation; either version
5 * 2 of the License, or (at your option) any later version.
6 *
7 * Authors: Jamal Hadi Salim 1999
8 */
9
Linus Torvalds1da177e2005-04-16 15:20:36 -070010#include <linux/module.h>
11#include <linux/types.h>
12#include <linux/skbuff.h>
13#include <linux/netdevice.h>
14#include <linux/rtnetlink.h>
15#include <linux/netfilter_ipv4.h>
16#include <linux/netfilter_ipv6.h>
17#include <linux/netfilter.h>
18#include <linux/smp.h>
Arnaldo Carvalho de Melodc5fc572007-03-25 23:06:12 -070019#include <net/netlink.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <net/pkt_sched.h>
21#include <asm/byteorder.h>
22#include <asm/uaccess.h>
23#include <linux/kmod.h>
24#include <linux/stat.h>
25#include <linux/interrupt.h>
26#include <linux/list.h>
27
28
/*
 * Control-path tracing.  DEBUG_INGRESS is forced off here, so DPRINTK()
 * expands to nothing unless the #undef below is replaced by a #define.
 */
#undef DEBUG_INGRESS

#ifdef DEBUG_INGRESS
#define DPRINTK(format, args...) printk(KERN_DEBUG format, ##args)
#else
#define DPRINTK(format, args...)
#endif

/*
 * Data-path (per-packet) tracing.  Permanently compiled out; change the
 * "#if 0" to "#if 1" to enable it.
 */
#if 0
#define D2PRINTK(format, args...) printk(KERN_DEBUG format, ##args)
#else
#define D2PRINTK(format, args...)
#endif


/* Shorthand for fetching the qdisc's private data via qdisc_priv(). */
#define PRIV(sch) qdisc_priv(sch)
45
46
/*
 * Thanks to Doron Oz for this hack.
 *
 * Counts how many netfilter hooks this module has registered.  Only
 * present when the netfilter path is used, i.e. classifier actions are
 * not compiled in but netfilter is.
 */
#if !defined(CONFIG_NET_CLS_ACT) && defined(CONFIG_NETFILTER)
static int nf_registered;
#endif
54
/* Per-qdisc private state, sized via ingress_qdisc_ops.priv_size. */
struct ingress_qdisc_data {
	/* Inner qdisc; ingress_init() points it at noop_qdisc. */
	struct Qdisc		*q;
	/* Head of the classifier chain consulted by ingress_enqueue(). */
	struct tcf_proto	*filter_list;
};
59
60
61/* ------------------------- Class/flow operations ------------------------- */
62
63
64static int ingress_graft(struct Qdisc *sch,unsigned long arg,
65 struct Qdisc *new,struct Qdisc **old)
66{
67#ifdef DEBUG_INGRESS
68 struct ingress_qdisc_data *p = PRIV(sch);
69#endif
70
71 DPRINTK("ingress_graft(sch %p,[qdisc %p],new %p,old %p)\n",
72 sch, p, new, old);
73 DPRINTK("\n ingress_graft: You cannot add qdiscs to classes");
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +090074 return 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -070075}
76
77
78static struct Qdisc *ingress_leaf(struct Qdisc *sch, unsigned long arg)
79{
80 return NULL;
81}
82
83
84static unsigned long ingress_get(struct Qdisc *sch,u32 classid)
85{
86#ifdef DEBUG_INGRESS
87 struct ingress_qdisc_data *p = PRIV(sch);
88#endif
89 DPRINTK("ingress_get(sch %p,[qdisc %p],classid %x)\n", sch, p, classid);
90 return TC_H_MIN(classid) + 1;
91}
92
93
94static unsigned long ingress_bind_filter(struct Qdisc *sch,
95 unsigned long parent, u32 classid)
96{
97 return ingress_get(sch, classid);
98}
99
100
/*
 * Class op: put (also installed as unbind_tcf).  Intentionally empty:
 * ingress_get() takes no reference, so there is nothing to drop.
 */
static void ingress_put(struct Qdisc *sch, unsigned long cl)
{
	return;
}
104
105
106static int ingress_change(struct Qdisc *sch, u32 classid, u32 parent,
107 struct rtattr **tca, unsigned long *arg)
108{
109#ifdef DEBUG_INGRESS
110 struct ingress_qdisc_data *p = PRIV(sch);
111#endif
112 DPRINTK("ingress_change(sch %p,[qdisc %p],classid %x,parent %x),"
113 "arg 0x%lx\n", sch, p, classid, parent, *arg);
114 DPRINTK("No effect. sch_ingress doesn't maintain classes at the moment");
115 return 0;
116}
117
118
119
120static void ingress_walk(struct Qdisc *sch,struct qdisc_walker *walker)
121{
122#ifdef DEBUG_INGRESS
123 struct ingress_qdisc_data *p = PRIV(sch);
124#endif
125 DPRINTK("ingress_walk(sch %p,[qdisc %p],walker %p)\n", sch, p, walker);
126 DPRINTK("No effect. sch_ingress doesn't maintain classes at the moment");
127}
128
129
130static struct tcf_proto **ingress_find_tcf(struct Qdisc *sch,unsigned long cl)
131{
132 struct ingress_qdisc_data *p = PRIV(sch);
133
134 return &p->filter_list;
135}
136
137
138/* --------------------------- Qdisc operations ---------------------------- */
139
140
141static int ingress_enqueue(struct sk_buff *skb,struct Qdisc *sch)
142{
143 struct ingress_qdisc_data *p = PRIV(sch);
144 struct tcf_result res;
145 int result;
146
147 D2PRINTK("ingress_enqueue(skb %p,sch %p,[qdisc %p])\n", skb, sch, p);
148 result = tc_classify(skb, p->filter_list, &res);
149 D2PRINTK("result %d class 0x%04x\n", result, res.classid);
150 /*
151 * Unlike normal "enqueue" functions, ingress_enqueue returns a
152 * firewall FW_* code.
153 */
154#ifdef CONFIG_NET_CLS_ACT
155 sch->bstats.packets++;
156 sch->bstats.bytes += skb->len;
157 switch (result) {
158 case TC_ACT_SHOT:
159 result = TC_ACT_SHOT;
160 sch->qstats.drops++;
161 break;
162 case TC_ACT_STOLEN:
163 case TC_ACT_QUEUED:
164 result = TC_ACT_STOLEN;
165 break;
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900166 case TC_ACT_RECLASSIFY:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167 case TC_ACT_OK:
168 case TC_ACT_UNSPEC:
169 default:
170 skb->tc_index = TC_H_MIN(res.classid);
171 result = TC_ACT_OK;
172 break;
173 };
174/* backward compat */
175#else
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900176#ifdef CONFIG_NET_CLS_POLICE
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177 switch (result) {
178 case TC_POLICE_SHOT:
179 result = NF_DROP;
180 sch->qstats.drops++;
181 break;
182 case TC_POLICE_RECLASSIFY: /* DSCP remarking here ? */
183 case TC_POLICE_OK:
184 case TC_POLICE_UNSPEC:
185 default:
186 sch->bstats.packets++;
187 sch->bstats.bytes += skb->len;
188 result = NF_ACCEPT;
189 break;
190 };
191
192#else
193 D2PRINTK("Overriding result to ACCEPT\n");
194 result = NF_ACCEPT;
195 sch->bstats.packets++;
196 sch->bstats.bytes += skb->len;
197#endif
198#endif
199
200 return result;
201}
202
203
204static struct sk_buff *ingress_dequeue(struct Qdisc *sch)
205{
206/*
207 struct ingress_qdisc_data *p = PRIV(sch);
208 D2PRINTK("ingress_dequeue(sch %p,[qdisc %p])\n",sch,PRIV(p));
209*/
210 return NULL;
211}
212
213
/*
 * Qdisc op: requeue.  Does nothing with @skb and always reports 0.
 */
static int ingress_requeue(struct sk_buff *skb, struct Qdisc *sch)
{
	int status = 0;

	return status;
}
222
223static unsigned int ingress_drop(struct Qdisc *sch)
224{
225#ifdef DEBUG_INGRESS
226 struct ingress_qdisc_data *p = PRIV(sch);
227#endif
228 DPRINTK("ingress_drop(sch %p,[qdisc %p])\n", sch, p);
229 return 0;
230}
231
232#ifndef CONFIG_NET_CLS_ACT
233#ifdef CONFIG_NETFILTER
234static unsigned int
235ing_hook(unsigned int hook, struct sk_buff **pskb,
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900236 const struct net_device *indev,
237 const struct net_device *outdev,
238 int (*okfn)(struct sk_buff *))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239{
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900240
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241 struct Qdisc *q;
242 struct sk_buff *skb = *pskb;
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900243 struct net_device *dev = skb->dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700244 int fwres=NF_ACCEPT;
245
246 DPRINTK("ing_hook: skb %s dev=%s len=%u\n",
247 skb->sk ? "(owned)" : "(unowned)",
248 skb->dev ? (*pskb)->dev->name : "(no dev)",
249 skb->len);
250
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900251/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252revisit later: Use a private since lock dev->queue_lock is also
253used on the egress (might slow things for an iota)
254*/
255
256 if (dev->qdisc_ingress) {
257 spin_lock(&dev->queue_lock);
258 if ((q = dev->qdisc_ingress) != NULL)
259 fwres = q->enqueue(skb, q);
260 spin_unlock(&dev->queue_lock);
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900261 }
262
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263 return fwres;
264}
265
266/* after ipt_filter */
267static struct nf_hook_ops ing_ops = {
268 .hook = ing_hook,
269 .owner = THIS_MODULE,
270 .pf = PF_INET,
271 .hooknum = NF_IP_PRE_ROUTING,
272 .priority = NF_IP_PRI_FILTER + 1,
273};
274
275static struct nf_hook_ops ing6_ops = {
276 .hook = ing_hook,
277 .owner = THIS_MODULE,
278 .pf = PF_INET6,
279 .hooknum = NF_IP6_PRE_ROUTING,
280 .priority = NF_IP6_PRI_FILTER + 1,
281};
282
283#endif
284#endif
285
286static int ingress_init(struct Qdisc *sch,struct rtattr *opt)
287{
288 struct ingress_qdisc_data *p = PRIV(sch);
289
290/* Make sure either netfilter or preferably CLS_ACT is
291* compiled in */
292#ifndef CONFIG_NET_CLS_ACT
293#ifndef CONFIG_NETFILTER
294 printk("You MUST compile classifier actions into the kernel\n");
295 return -EINVAL;
296#else
297 printk("Ingress scheduler: Classifier actions prefered over netfilter\n");
298#endif
299#endif
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900300
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301#ifndef CONFIG_NET_CLS_ACT
302#ifdef CONFIG_NETFILTER
303 if (!nf_registered) {
304 if (nf_register_hook(&ing_ops) < 0) {
305 printk("ingress qdisc registration error \n");
306 return -EINVAL;
307 }
308 nf_registered++;
309
310 if (nf_register_hook(&ing6_ops) < 0) {
311 printk("IPv6 ingress qdisc registration error, " \
312 "disabling IPv6 support.\n");
313 } else
314 nf_registered++;
315 }
316#endif
317#endif
318
319 DPRINTK("ingress_init(sch %p,[qdisc %p],opt %p)\n",sch,p,opt);
320 p->q = &noop_qdisc;
321 return 0;
322}
323
324
325static void ingress_reset(struct Qdisc *sch)
326{
327 struct ingress_qdisc_data *p = PRIV(sch);
328
329 DPRINTK("ingress_reset(sch %p,[qdisc %p])\n", sch, p);
330
331/*
332#if 0
333*/
334/* for future use */
335 qdisc_reset(p->q);
336/*
337#endif
338*/
339}
340
341/* ------------------------------------------------------------- */
342
343
344/* ------------------------------------------------------------- */
345
346static void ingress_destroy(struct Qdisc *sch)
347{
348 struct ingress_qdisc_data *p = PRIV(sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349
350 DPRINTK("ingress_destroy(sch %p,[qdisc %p])\n", sch, p);
Patrick McHardya48b5a62007-03-23 11:29:43 -0700351 tcf_destroy_chain(p->filter_list);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700352#if 0
353/* for future use */
354 qdisc_destroy(p->q);
355#endif
356}
357
358
359static int ingress_dump(struct Qdisc *sch, struct sk_buff *skb)
360{
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700361 unsigned char *b = skb_tail_pointer(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700362 struct rtattr *rta;
363
364 rta = (struct rtattr *) b;
365 RTA_PUT(skb, TCA_OPTIONS, 0, NULL);
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700366 rta->rta_len = skb_tail_pointer(skb) - b;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367 return skb->len;
368
369rtattr_failure:
Arnaldo Carvalho de Melodc5fc572007-03-25 23:06:12 -0700370 nlmsg_trim(skb, b);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700371 return -1;
372}
373
374static struct Qdisc_class_ops ingress_class_ops = {
375 .graft = ingress_graft,
376 .leaf = ingress_leaf,
377 .get = ingress_get,
378 .put = ingress_put,
379 .change = ingress_change,
380 .delete = NULL,
381 .walk = ingress_walk,
382 .tcf_chain = ingress_find_tcf,
383 .bind_tcf = ingress_bind_filter,
384 .unbind_tcf = ingress_put,
385 .dump = NULL,
386};
387
388static struct Qdisc_ops ingress_qdisc_ops = {
389 .next = NULL,
390 .cl_ops = &ingress_class_ops,
391 .id = "ingress",
392 .priv_size = sizeof(struct ingress_qdisc_data),
393 .enqueue = ingress_enqueue,
394 .dequeue = ingress_dequeue,
395 .requeue = ingress_requeue,
396 .drop = ingress_drop,
397 .init = ingress_init,
398 .reset = ingress_reset,
399 .destroy = ingress_destroy,
400 .change = NULL,
401 .dump = ingress_dump,
402 .owner = THIS_MODULE,
403};
404
405static int __init ingress_module_init(void)
406{
407 int ret = 0;
408
409 if ((ret = register_qdisc(&ingress_qdisc_ops)) < 0) {
410 printk("Unable to register Ingress qdisc\n");
411 return ret;
412 }
413
414 return ret;
415}
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900416static void __exit ingress_module_exit(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417{
418 unregister_qdisc(&ingress_qdisc_ops);
419#ifndef CONFIG_NET_CLS_ACT
420#ifdef CONFIG_NETFILTER
421 if (nf_registered) {
422 nf_unregister_hook(&ing_ops);
423 if (nf_registered > 1)
424 nf_unregister_hook(&ing6_ops);
425 }
426#endif
427#endif
428}
429module_init(ingress_module_init)
430module_exit(ingress_module_exit)
431MODULE_LICENSE("GPL");