[NET_SCHED]: Convert packet schedulers from rtnetlink to new netlink API
net/sched/sch_red.c
/*
 * net/sched/sch_red.c	Random Early Detection queue.
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 *
 * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 * Changes:
 * J Hadi Salim 980914:	computation fixes
 * Alexey Makarenko <makar@phoenix.kharkov.ua> 990814: qave on idle link was calculated incorrectly.
 * J Hadi Salim 980816:  ECN support
 */

#include <linux/module.h>
#include <linux/types.h>
#include <linux/kernel.h>
#include <linux/skbuff.h>
#include <net/pkt_sched.h>
#include <net/inet_ecn.h>
#include <net/red.h>

/*	Parameters, settable by user:
	-----------------------------

	limit		- bytes (must be > qth_max + burst)

	Hard limit on queue length, should be chosen >qth_max
	to allow packet bursts. This parameter does not
	affect the algorithm's behaviour and can be chosen
	arbitrarily high (well, less than ram size).
	Really, this limit will never be reached
	if RED works correctly.
 */

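/*	Illustrative example (values chosen here for illustration only, not
 *	taken from this file): with the userspace tc tool, a configuration
 *	in this spirit would be
 *
 *		tc qdisc add dev eth0 root red limit 400000 min 30000 \
 *			max 90000 avpkt 1000 burst 55 probability 0.02 \
 *			bandwidth 10mbit ecn
 *
 *	tc turns these values into the TCA_RED_PARMS and TCA_RED_STAB
 *	attributes parsed by red_change() below; note that limit (400000)
 *	is well above max (90000) plus burst room, as required above.
 */
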
struct red_sched_data
{
	u32			limit;		/* HARD maximal queue length */
	unsigned char		flags;
	struct red_parms	parms;
	struct red_stats	stats;
	struct Qdisc		*qdisc;
};

static inline int red_use_ecn(struct red_sched_data *q)
{
	return q->flags & TC_RED_ECN;
}

static inline int red_use_harddrop(struct red_sched_data *q)
{
	return q->flags & TC_RED_HARDDROP;
}

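/*
 * Enqueue path: update the average queue length (computed from the child
 * queue's backlog in bytes), then let the generic RED code decide whether
 * to pass the packet, probabilistically mark it, or force-mark it. When
 * marking is requested, the packet is ECN-marked if TC_RED_ECN is set and
 * the packet is ECN-capable; otherwise (or with TC_RED_HARDDROP in the
 * forced case) it is dropped. Accepted packets go to the child qdisc.
 */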
static int red_enqueue(struct sk_buff *skb, struct Qdisc *sch)
{
	struct red_sched_data *q = qdisc_priv(sch);
	struct Qdisc *child = q->qdisc;
	int ret;

	q->parms.qavg = red_calc_qavg(&q->parms, child->qstats.backlog);

	if (red_is_idling(&q->parms))
		red_end_of_idle_period(&q->parms);

	switch (red_action(&q->parms, q->parms.qavg)) {
	case RED_DONT_MARK:
		break;

	case RED_PROB_MARK:
		sch->qstats.overlimits++;
		if (!red_use_ecn(q) || !INET_ECN_set_ce(skb)) {
			q->stats.prob_drop++;
			goto congestion_drop;
		}

		q->stats.prob_mark++;
		break;

	case RED_HARD_MARK:
		sch->qstats.overlimits++;
		if (red_use_harddrop(q) || !red_use_ecn(q) ||
		    !INET_ECN_set_ce(skb)) {
			q->stats.forced_drop++;
			goto congestion_drop;
		}

		q->stats.forced_mark++;
		break;
	}

	ret = child->enqueue(skb, child);
	if (likely(ret == NET_XMIT_SUCCESS)) {
		sch->bstats.bytes += skb->len;
		sch->bstats.packets++;
		sch->q.qlen++;
	} else {
		q->stats.pdrop++;
		sch->qstats.drops++;
	}
	return ret;

congestion_drop:
	qdisc_drop(skb, sch);
	return NET_XMIT_CN;
}

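/*
 * Requeue goes straight back to the child qdisc; the only RED-specific
 * work is ending an idle period, since the queue is non-empty again.
 */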
static int red_requeue(struct sk_buff *skb, struct Qdisc *sch)
{
	struct red_sched_data *q = qdisc_priv(sch);
	struct Qdisc *child = q->qdisc;
	int ret;

	if (red_is_idling(&q->parms))
		red_end_of_idle_period(&q->parms);

	ret = child->ops->requeue(skb, child);
	if (likely(ret == NET_XMIT_SUCCESS)) {
		sch->qstats.requeues++;
		sch->q.qlen++;
	}
	return ret;
}

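/*
 * Dequeue from the child qdisc. When the child runs empty, start an idle
 * period so the average queue length decays while the link is idle.
 */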
static struct sk_buff *red_dequeue(struct Qdisc *sch)
{
	struct sk_buff *skb;
	struct red_sched_data *q = qdisc_priv(sch);
	struct Qdisc *child = q->qdisc;

	skb = child->dequeue(child);
	if (skb)
		sch->q.qlen--;
	else if (!red_is_idling(&q->parms))
		red_start_of_idle_period(&q->parms);

	return skb;
}

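/*
 * Drop one packet on request (e.g. from a parent qdisc needing room):
 * delegate to the child's ->drop() and account it as an "other" drop.
 * If nothing could be dropped, an idle period may begin.
 */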
static unsigned int red_drop(struct Qdisc *sch)
{
	struct red_sched_data *q = qdisc_priv(sch);
	struct Qdisc *child = q->qdisc;
	unsigned int len;

	if (child->ops->drop && (len = child->ops->drop(child)) > 0) {
		q->stats.other++;
		sch->qstats.drops++;
		sch->q.qlen--;
		return len;
	}

	if (!red_is_idling(&q->parms))
		red_start_of_idle_period(&q->parms);

	return 0;
}

static void red_reset(struct Qdisc *sch)
{
	struct red_sched_data *q = qdisc_priv(sch);

	qdisc_reset(q->qdisc);
	sch->q.qlen = 0;
	red_restart(&q->parms);
}

static void red_destroy(struct Qdisc *sch)
{
	struct red_sched_data *q = qdisc_priv(sch);
	qdisc_destroy(q->qdisc);
}

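/*
 * Build the default child qdisc: a bfifo sized to RED's byte limit. The
 * fifo limit is set by hand-crafting a single netlink attribute holding
 * a struct tc_fifo_qopt and feeding it to the child's ->change() hook.
 */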
static struct Qdisc *red_create_dflt(struct Qdisc *sch, u32 limit)
{
	struct Qdisc *q;
	struct nlattr *nla;
	int ret;

	q = qdisc_create_dflt(sch->dev, &bfifo_qdisc_ops,
			      TC_H_MAKE(sch->handle, 1));
	if (q) {
		nla = kmalloc(nla_attr_size(sizeof(struct tc_fifo_qopt)),
			      GFP_KERNEL);
		if (nla) {
			nla->nla_type = RTM_NEWQDISC;
			nla->nla_len = nla_attr_size(sizeof(struct tc_fifo_qopt));
			((struct tc_fifo_qopt *)nla_data(nla))->limit = limit;

			ret = q->ops->change(q, nla);
			kfree(nla);

			if (ret == 0)
				return q;
		}
		qdisc_destroy(q);
	}
	return NULL;
}

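/*
 * Parse the nested TCA_OPTIONS payload: TCA_RED_PARMS carries a struct
 * tc_red_qopt (limit, thresholds, Wlog/Plog/Scell_log, flags) and
 * TCA_RED_STAB carries the 256-byte cell table used to age the average
 * across idle periods. A non-zero limit also replaces the child qdisc
 * with a fresh bfifo of that size.
 */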
static int red_change(struct Qdisc *sch, struct nlattr *opt)
{
	struct red_sched_data *q = qdisc_priv(sch);
	struct nlattr *tb[TCA_RED_MAX + 1];
	struct tc_red_qopt *ctl;
	struct Qdisc *child = NULL;

	if (opt == NULL || nla_parse_nested(tb, TCA_RED_MAX, opt, NULL))
		return -EINVAL;

	if (tb[TCA_RED_PARMS] == NULL ||
	    nla_len(tb[TCA_RED_PARMS]) < sizeof(*ctl) ||
	    tb[TCA_RED_STAB] == NULL ||
	    nla_len(tb[TCA_RED_STAB]) < RED_STAB_SIZE)
		return -EINVAL;

	ctl = nla_data(tb[TCA_RED_PARMS]);

	if (ctl->limit > 0) {
		child = red_create_dflt(sch, ctl->limit);
		if (child == NULL)
			return -ENOMEM;
	}

	sch_tree_lock(sch);
	q->flags = ctl->flags;
	q->limit = ctl->limit;
	if (child) {
		qdisc_tree_decrease_qlen(q->qdisc, q->qdisc->q.qlen);
		qdisc_destroy(xchg(&q->qdisc, child));
	}

	red_set_parms(&q->parms, ctl->qth_min, ctl->qth_max, ctl->Wlog,
		      ctl->Plog, ctl->Scell_log,
		      nla_data(tb[TCA_RED_STAB]));

	if (skb_queue_empty(&sch->q))
		red_end_of_idle_period(&q->parms);

	sch_tree_unlock(sch);
	return 0;
}

static int red_init(struct Qdisc *sch, struct nlattr *opt)
{
	struct red_sched_data *q = qdisc_priv(sch);

	q->qdisc = &noop_qdisc;
	return red_change(sch, opt);
}

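/*
 * Dump the current configuration back to userspace as a nested
 * TCA_OPTIONS/TCA_RED_PARMS attribute. The thresholds are kept scaled
 * by Wlog internally, so they are shifted back down before reporting.
 */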
static int red_dump(struct Qdisc *sch, struct sk_buff *skb)
{
	struct red_sched_data *q = qdisc_priv(sch);
	struct nlattr *opts = NULL;
	struct tc_red_qopt opt = {
		.limit		= q->limit,
		.flags		= q->flags,
		.qth_min	= q->parms.qth_min >> q->parms.Wlog,
		.qth_max	= q->parms.qth_max >> q->parms.Wlog,
		.Wlog		= q->parms.Wlog,
		.Plog		= q->parms.Plog,
		.Scell_log	= q->parms.Scell_log,
	};

	opts = nla_nest_start(skb, TCA_OPTIONS);
	if (opts == NULL)
		goto nla_put_failure;
	NLA_PUT(skb, TCA_RED_PARMS, sizeof(opt), &opt);
	return nla_nest_end(skb, opts);

nla_put_failure:
	return nla_nest_cancel(skb, opts);
}

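/*
 * Export RED-specific counters (early drops, drops due to a full child
 * queue, drops requested via ->drop, and ECN marks) as tc_red_xstats.
 */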
static int red_dump_stats(struct Qdisc *sch, struct gnet_dump *d)
{
	struct red_sched_data *q = qdisc_priv(sch);
	struct tc_red_xstats st = {
		.early	= q->stats.prob_drop + q->stats.forced_drop,
		.pdrop	= q->stats.pdrop,
		.other	= q->stats.other,
		.marked	= q->stats.prob_mark + q->stats.forced_mark,
	};

	return gnet_stats_copy_app(d, &st, sizeof(st));
}

static int red_dump_class(struct Qdisc *sch, unsigned long cl,
			  struct sk_buff *skb, struct tcmsg *tcm)
{
	struct red_sched_data *q = qdisc_priv(sch);

	if (cl != 1)
		return -ENOENT;
	tcm->tcm_handle |= TC_H_MIN(1);
	tcm->tcm_info = q->qdisc->handle;
	return 0;
}

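/*
 * Class operations: RED exposes its child as the single class with minor
 * number 1, so the inner qdisc can be replaced (grafted) at runtime
 * without tearing down the RED instance itself.
 */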
static int red_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
		     struct Qdisc **old)
{
	struct red_sched_data *q = qdisc_priv(sch);

	if (new == NULL)
		new = &noop_qdisc;

	sch_tree_lock(sch);
	*old = xchg(&q->qdisc, new);
	qdisc_tree_decrease_qlen(*old, (*old)->q.qlen);
	qdisc_reset(*old);
	sch_tree_unlock(sch);
	return 0;
}

static struct Qdisc *red_leaf(struct Qdisc *sch, unsigned long arg)
{
	struct red_sched_data *q = qdisc_priv(sch);
	return q->qdisc;
}

static unsigned long red_get(struct Qdisc *sch, u32 classid)
{
	return 1;
}

static void red_put(struct Qdisc *sch, unsigned long arg)
{
	return;
}

static int red_change_class(struct Qdisc *sch, u32 classid, u32 parentid,
			    struct nlattr **tca, unsigned long *arg)
{
	return -ENOSYS;
}

static int red_delete(struct Qdisc *sch, unsigned long cl)
{
	return -ENOSYS;
}

static void red_walk(struct Qdisc *sch, struct qdisc_walker *walker)
{
	if (!walker->stop) {
		if (walker->count >= walker->skip)
			if (walker->fn(sch, 1, walker) < 0) {
				walker->stop = 1;
				return;
			}
		walker->count++;
	}
}

static struct tcf_proto **red_find_tcf(struct Qdisc *sch, unsigned long cl)
{
	return NULL;
}

static const struct Qdisc_class_ops red_class_ops = {
	.graft		=	red_graft,
	.leaf		=	red_leaf,
	.get		=	red_get,
	.put		=	red_put,
	.change		=	red_change_class,
	.delete		=	red_delete,
	.walk		=	red_walk,
	.tcf_chain	=	red_find_tcf,
	.dump		=	red_dump_class,
};

static struct Qdisc_ops red_qdisc_ops __read_mostly = {
	.id		=	"red",
	.priv_size	=	sizeof(struct red_sched_data),
	.cl_ops		=	&red_class_ops,
	.enqueue	=	red_enqueue,
	.dequeue	=	red_dequeue,
	.requeue	=	red_requeue,
	.drop		=	red_drop,
	.init		=	red_init,
	.reset		=	red_reset,
	.destroy	=	red_destroy,
	.change		=	red_change,
	.dump		=	red_dump,
	.dump_stats	=	red_dump_stats,
	.owner		=	THIS_MODULE,
};

static int __init red_module_init(void)
{
	return register_qdisc(&red_qdisc_ops);
}

static void __exit red_module_exit(void)
{
	unregister_qdisc(&red_qdisc_ops);
}

module_init(red_module_init)
module_exit(red_module_exit)

MODULE_LICENSE("GPL");