Merge branch 'liquidio-next'
[linux-2.6-block.git] / net / sched / sch_red.c
CommitLineData
1da177e4
LT
1/*
2 * net/sched/sch_red.c Random Early Detection queue.
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
8 *
9 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 *
11 * Changes:
dba051f3 12 * J Hadi Salim 980914: computation fixes
1da177e4 13 * Alexey Makarenko <makar@phoenix.kharkov.ua> 990814: qave on idle link was calculated incorrectly.
dba051f3 14 * J Hadi Salim 980816: ECN support
1da177e4
LT
15 */
16
1da177e4 17#include <linux/module.h>
1da177e4
LT
18#include <linux/types.h>
19#include <linux/kernel.h>
1da177e4 20#include <linux/skbuff.h>
1da177e4
LT
21#include <net/pkt_sched.h>
22#include <net/inet_ecn.h>
6b31b28a 23#include <net/red.h>
1da177e4
LT
24
25
6b31b28a 26/* Parameters, settable by user:
1da177e4
LT
27 -----------------------------
28
29 limit - bytes (must be > qth_max + burst)
30
31 Hard limit on queue length, should be chosen >qth_max
32 to allow packet bursts. This parameter does not
33 affect the algorithm's behaviour and can be chosen
34 arbitrarily high (well, less than ram size)
35 Really, this limit will never be reached
36 if RED works correctly.
1da177e4
LT
37 */
38
cc7ec456 39struct red_sched_data {
6b31b28a
TG
40 u32 limit; /* HARD maximal queue length */
41 unsigned char flags;
8af2a218 42 struct timer_list adapt_timer;
6b31b28a 43 struct red_parms parms;
eeca6688 44 struct red_vars vars;
6b31b28a 45 struct red_stats stats;
f38c39d6 46 struct Qdisc *qdisc;
1da177e4
LT
47};
48
6b31b28a 49static inline int red_use_ecn(struct red_sched_data *q)
1da177e4 50{
6b31b28a 51 return q->flags & TC_RED_ECN;
1da177e4
LT
52}
53
bdc450a0
TG
54static inline int red_use_harddrop(struct red_sched_data *q)
55{
56 return q->flags & TC_RED_HARDDROP;
57}
58
cc7ec456 59static int red_enqueue(struct sk_buff *skb, struct Qdisc *sch)
1da177e4
LT
60{
61 struct red_sched_data *q = qdisc_priv(sch);
f38c39d6
PM
62 struct Qdisc *child = q->qdisc;
63 int ret;
1da177e4 64
eeca6688
ED
65 q->vars.qavg = red_calc_qavg(&q->parms,
66 &q->vars,
67 child->qstats.backlog);
1da177e4 68
eeca6688
ED
69 if (red_is_idling(&q->vars))
70 red_end_of_idle_period(&q->vars);
1da177e4 71
eeca6688 72 switch (red_action(&q->parms, &q->vars, q->vars.qavg)) {
cc7ec456
ED
73 case RED_DONT_MARK:
74 break;
75
76 case RED_PROB_MARK:
25331d6c 77 qdisc_qstats_overlimit(sch);
cc7ec456
ED
78 if (!red_use_ecn(q) || !INET_ECN_set_ce(skb)) {
79 q->stats.prob_drop++;
80 goto congestion_drop;
81 }
82
83 q->stats.prob_mark++;
84 break;
85
86 case RED_HARD_MARK:
25331d6c 87 qdisc_qstats_overlimit(sch);
cc7ec456
ED
88 if (red_use_harddrop(q) || !red_use_ecn(q) ||
89 !INET_ECN_set_ce(skb)) {
90 q->stats.forced_drop++;
91 goto congestion_drop;
92 }
93
94 q->stats.forced_mark++;
95 break;
1da177e4
LT
96 }
97
5f86173b 98 ret = qdisc_enqueue(skb, child);
f38c39d6 99 if (likely(ret == NET_XMIT_SUCCESS)) {
d7f4f332 100 qdisc_qstats_backlog_inc(sch, skb);
f38c39d6 101 sch->q.qlen++;
378a2f09 102 } else if (net_xmit_drop_count(ret)) {
f38c39d6 103 q->stats.pdrop++;
25331d6c 104 qdisc_qstats_drop(sch);
f38c39d6
PM
105 }
106 return ret;
6b31b28a
TG
107
108congestion_drop:
9e178ff2 109 qdisc_drop(skb, sch);
1da177e4
LT
110 return NET_XMIT_CN;
111}
112
cc7ec456 113static struct sk_buff *red_dequeue(struct Qdisc *sch)
1da177e4
LT
114{
115 struct sk_buff *skb;
116 struct red_sched_data *q = qdisc_priv(sch);
f38c39d6 117 struct Qdisc *child = q->qdisc;
1da177e4 118
f38c39d6 119 skb = child->dequeue(child);
9190b3b3
ED
120 if (skb) {
121 qdisc_bstats_update(sch, skb);
d7f4f332 122 qdisc_qstats_backlog_dec(sch, skb);
f38c39d6 123 sch->q.qlen--;
9190b3b3 124 } else {
eeca6688
ED
125 if (!red_is_idling(&q->vars))
126 red_start_of_idle_period(&q->vars);
9190b3b3 127 }
9e178ff2 128 return skb;
1da177e4
LT
129}
130
cc7ec456 131static struct sk_buff *red_peek(struct Qdisc *sch)
8e3af978
JP
132{
133 struct red_sched_data *q = qdisc_priv(sch);
134 struct Qdisc *child = q->qdisc;
135
136 return child->ops->peek(child);
137}
138
cc7ec456 139static void red_reset(struct Qdisc *sch)
1da177e4
LT
140{
141 struct red_sched_data *q = qdisc_priv(sch);
142
f38c39d6 143 qdisc_reset(q->qdisc);
d7f4f332 144 sch->qstats.backlog = 0;
f38c39d6 145 sch->q.qlen = 0;
eeca6688 146 red_restart(&q->vars);
1da177e4
LT
147}
148
f38c39d6
PM
149static void red_destroy(struct Qdisc *sch)
150{
151 struct red_sched_data *q = qdisc_priv(sch);
8af2a218
ED
152
153 del_timer_sync(&q->adapt_timer);
f38c39d6
PM
154 qdisc_destroy(q->qdisc);
155}
156
27a3421e
PM
157static const struct nla_policy red_policy[TCA_RED_MAX + 1] = {
158 [TCA_RED_PARMS] = { .len = sizeof(struct tc_red_qopt) },
159 [TCA_RED_STAB] = { .len = RED_STAB_SIZE },
a73ed26b 160 [TCA_RED_MAX_P] = { .type = NLA_U32 },
27a3421e
PM
161};
162
1e90474c 163static int red_change(struct Qdisc *sch, struct nlattr *opt)
1da177e4
LT
164{
165 struct red_sched_data *q = qdisc_priv(sch);
1e90474c 166 struct nlattr *tb[TCA_RED_MAX + 1];
1da177e4 167 struct tc_red_qopt *ctl;
f38c39d6 168 struct Qdisc *child = NULL;
cee63723 169 int err;
a73ed26b 170 u32 max_P;
1da177e4 171
cee63723 172 if (opt == NULL)
dba051f3
TG
173 return -EINVAL;
174
27a3421e 175 err = nla_parse_nested(tb, TCA_RED_MAX, opt, red_policy);
cee63723
PM
176 if (err < 0)
177 return err;
178
1e90474c 179 if (tb[TCA_RED_PARMS] == NULL ||
27a3421e 180 tb[TCA_RED_STAB] == NULL)
1da177e4
LT
181 return -EINVAL;
182
a73ed26b
ED
183 max_P = tb[TCA_RED_MAX_P] ? nla_get_u32(tb[TCA_RED_MAX_P]) : 0;
184
1e90474c 185 ctl = nla_data(tb[TCA_RED_PARMS]);
1da177e4 186
f38c39d6 187 if (ctl->limit > 0) {
fb0305ce
PM
188 child = fifo_create_dflt(sch, &bfifo_qdisc_ops, ctl->limit);
189 if (IS_ERR(child))
190 return PTR_ERR(child);
f38c39d6
PM
191 }
192
1da177e4
LT
193 sch_tree_lock(sch);
194 q->flags = ctl->flags;
1da177e4 195 q->limit = ctl->limit;
5e50da01 196 if (child) {
2ccccf5f
WC
197 qdisc_tree_reduce_backlog(q->qdisc, q->qdisc->q.qlen,
198 q->qdisc->qstats.backlog);
b94c8afc
PM
199 qdisc_destroy(q->qdisc);
200 q->qdisc = child;
5e50da01 201 }
1da177e4 202
eeca6688
ED
203 red_set_parms(&q->parms,
204 ctl->qth_min, ctl->qth_max, ctl->Wlog,
a73ed26b
ED
205 ctl->Plog, ctl->Scell_log,
206 nla_data(tb[TCA_RED_STAB]),
207 max_P);
eeca6688 208 red_set_vars(&q->vars);
6b31b28a 209
8af2a218
ED
210 del_timer(&q->adapt_timer);
211 if (ctl->flags & TC_RED_ADAPTATIVE)
212 mod_timer(&q->adapt_timer, jiffies + HZ/2);
213
1ee5fa1e 214 if (!q->qdisc->q.qlen)
eeca6688 215 red_start_of_idle_period(&q->vars);
dba051f3 216
1da177e4
LT
217 sch_tree_unlock(sch);
218 return 0;
219}
220
8af2a218
ED
221static inline void red_adaptative_timer(unsigned long arg)
222{
223 struct Qdisc *sch = (struct Qdisc *)arg;
224 struct red_sched_data *q = qdisc_priv(sch);
225 spinlock_t *root_lock = qdisc_lock(qdisc_root_sleeping(sch));
226
227 spin_lock(root_lock);
eeca6688 228 red_adaptative_algo(&q->parms, &q->vars);
8af2a218
ED
229 mod_timer(&q->adapt_timer, jiffies + HZ/2);
230 spin_unlock(root_lock);
231}
232
cc7ec456 233static int red_init(struct Qdisc *sch, struct nlattr *opt)
1da177e4 234{
f38c39d6
PM
235 struct red_sched_data *q = qdisc_priv(sch);
236
237 q->qdisc = &noop_qdisc;
8af2a218 238 setup_timer(&q->adapt_timer, red_adaptative_timer, (unsigned long)sch);
1da177e4
LT
239 return red_change(sch, opt);
240}
241
242static int red_dump(struct Qdisc *sch, struct sk_buff *skb)
243{
244 struct red_sched_data *q = qdisc_priv(sch);
1e90474c 245 struct nlattr *opts = NULL;
6b31b28a
TG
246 struct tc_red_qopt opt = {
247 .limit = q->limit,
248 .flags = q->flags,
249 .qth_min = q->parms.qth_min >> q->parms.Wlog,
250 .qth_max = q->parms.qth_max >> q->parms.Wlog,
251 .Wlog = q->parms.Wlog,
252 .Plog = q->parms.Plog,
253 .Scell_log = q->parms.Scell_log,
254 };
1da177e4 255
0dfb33a0 256 sch->qstats.backlog = q->qdisc->qstats.backlog;
1e90474c
PM
257 opts = nla_nest_start(skb, TCA_OPTIONS);
258 if (opts == NULL)
259 goto nla_put_failure;
1b34ec43
DM
260 if (nla_put(skb, TCA_RED_PARMS, sizeof(opt), &opt) ||
261 nla_put_u32(skb, TCA_RED_MAX_P, q->parms.max_P))
262 goto nla_put_failure;
1e90474c 263 return nla_nest_end(skb, opts);
1da177e4 264
1e90474c 265nla_put_failure:
bc3ed28c
TG
266 nla_nest_cancel(skb, opts);
267 return -EMSGSIZE;
1da177e4
LT
268}
269
270static int red_dump_stats(struct Qdisc *sch, struct gnet_dump *d)
271{
272 struct red_sched_data *q = qdisc_priv(sch);
6b31b28a
TG
273 struct tc_red_xstats st = {
274 .early = q->stats.prob_drop + q->stats.forced_drop,
275 .pdrop = q->stats.pdrop,
276 .other = q->stats.other,
277 .marked = q->stats.prob_mark + q->stats.forced_mark,
278 };
279
280 return gnet_stats_copy_app(d, &st, sizeof(st));
1da177e4
LT
281}
282
f38c39d6
PM
283static int red_dump_class(struct Qdisc *sch, unsigned long cl,
284 struct sk_buff *skb, struct tcmsg *tcm)
285{
286 struct red_sched_data *q = qdisc_priv(sch);
287
f38c39d6
PM
288 tcm->tcm_handle |= TC_H_MIN(1);
289 tcm->tcm_info = q->qdisc->handle;
290 return 0;
291}
292
293static int red_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
294 struct Qdisc **old)
295{
296 struct red_sched_data *q = qdisc_priv(sch);
297
298 if (new == NULL)
299 new = &noop_qdisc;
300
86a7996c 301 *old = qdisc_replace(sch, new, &q->qdisc);
f38c39d6
PM
302 return 0;
303}
304
305static struct Qdisc *red_leaf(struct Qdisc *sch, unsigned long arg)
306{
307 struct red_sched_data *q = qdisc_priv(sch);
308 return q->qdisc;
309}
310
311static unsigned long red_get(struct Qdisc *sch, u32 classid)
312{
313 return 1;
314}
315
316static void red_put(struct Qdisc *sch, unsigned long arg)
317{
f38c39d6
PM
318}
319
f38c39d6
PM
320static void red_walk(struct Qdisc *sch, struct qdisc_walker *walker)
321{
322 if (!walker->stop) {
323 if (walker->count >= walker->skip)
324 if (walker->fn(sch, 1, walker) < 0) {
325 walker->stop = 1;
326 return;
327 }
328 walker->count++;
329 }
330}
331
20fea08b 332static const struct Qdisc_class_ops red_class_ops = {
f38c39d6
PM
333 .graft = red_graft,
334 .leaf = red_leaf,
335 .get = red_get,
336 .put = red_put,
f38c39d6 337 .walk = red_walk,
f38c39d6
PM
338 .dump = red_dump_class,
339};
340
20fea08b 341static struct Qdisc_ops red_qdisc_ops __read_mostly = {
1da177e4
LT
342 .id = "red",
343 .priv_size = sizeof(struct red_sched_data),
f38c39d6 344 .cl_ops = &red_class_ops,
1da177e4
LT
345 .enqueue = red_enqueue,
346 .dequeue = red_dequeue,
8e3af978 347 .peek = red_peek,
1da177e4
LT
348 .init = red_init,
349 .reset = red_reset,
f38c39d6 350 .destroy = red_destroy,
1da177e4
LT
351 .change = red_change,
352 .dump = red_dump,
353 .dump_stats = red_dump_stats,
354 .owner = THIS_MODULE,
355};
356
357static int __init red_module_init(void)
358{
359 return register_qdisc(&red_qdisc_ops);
360}
dba051f3
TG
361
362static void __exit red_module_exit(void)
1da177e4
LT
363{
364 unregister_qdisc(&red_qdisc_ops);
365}
dba051f3 366
1da177e4
LT
367module_init(red_module_init)
368module_exit(red_module_exit)
dba051f3 369
1da177e4 370MODULE_LICENSE("GPL");