]> git.proxmox.com Git - mirror_ubuntu-bionic-kernel.git/blame - net/sched/sch_gred.c
[NET] RXRPC: Fix whitespace errors.
[mirror_ubuntu-bionic-kernel.git] / net / sched / sch_gred.c
CommitLineData
1da177e4
LT
1/*
2 * net/sched/sch_gred.c Generic Random Early Detection queue.
3 *
4 *
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License
7 * as published by the Free Software Foundation; either version
8 * 2 of the License, or (at your option) any later version.
9 *
10 * Authors: J Hadi Salim (hadi@cyberus.ca) 1998-2002
11 *
12 * 991129: - Bug fix with grio mode
13 * - a better sing. AvgQ mode with Grio(WRED)
14 * - A finer grained VQ dequeue based on suggestion
15 * from Ren Liu
16 * - More error checks
17 *
1e4dfaf9 18 * For all the glorious comments look at include/net/red.h
1da177e4
LT
19 */
20
1da177e4 21#include <linux/module.h>
1da177e4
LT
22#include <linux/types.h>
23#include <linux/kernel.h>
1da177e4 24#include <linux/netdevice.h>
1da177e4 25#include <linux/skbuff.h>
1da177e4 26#include <net/pkt_sched.h>
22b33429 27#include <net/red.h>
1da177e4 28
f62d6b93 29#define GRED_DEF_PRIO (MAX_DPs / 2)
716a1b40 30#define GRED_VQ_MASK (MAX_DPs - 1)
f62d6b93 31
1da177e4
LT
32struct gred_sched_data;
33struct gred_sched;
34
35struct gred_sched_data
36{
1da177e4 37 u32 limit; /* HARD maximal queue length */
1da177e4 38 u32 DP; /* the drop pramaters */
1da177e4
LT
39 u32 bytesin; /* bytes seen on virtualQ so far*/
40 u32 packetsin; /* packets seen on virtualQ so far*/
41 u32 backlog; /* bytes on the virtualQ */
1e4dfaf9 42 u8 prio; /* the prio of this vq */
1da177e4 43
22b33429
TG
44 struct red_parms parms;
45 struct red_stats stats;
1da177e4
LT
46};
47
dea3f628
TG
/* Bit numbers used with test_bit()/__set_bit() on gred_sched.flags. */
enum {
	GRED_WRED_MODE = 1,
	GRED_RIO_MODE = 2,
};
52
1da177e4
LT
53struct gred_sched
54{
55 struct gred_sched_data *tab[MAX_DPs];
dea3f628 56 unsigned long flags;
b38c7eef 57 u32 red_flags;
1e4dfaf9
TG
58 u32 DPs;
59 u32 def;
7051703b 60 struct red_parms wred_set;
1da177e4
LT
61};
62
dea3f628
TG
63static inline int gred_wred_mode(struct gred_sched *table)
64{
65 return test_bit(GRED_WRED_MODE, &table->flags);
66}
67
68static inline void gred_enable_wred_mode(struct gred_sched *table)
69{
70 __set_bit(GRED_WRED_MODE, &table->flags);
71}
72
73static inline void gred_disable_wred_mode(struct gred_sched *table)
74{
75 __clear_bit(GRED_WRED_MODE, &table->flags);
76}
77
d6fd4e96
TG
78static inline int gred_rio_mode(struct gred_sched *table)
79{
80 return test_bit(GRED_RIO_MODE, &table->flags);
81}
82
83static inline void gred_enable_rio_mode(struct gred_sched *table)
84{
85 __set_bit(GRED_RIO_MODE, &table->flags);
86}
87
88static inline void gred_disable_rio_mode(struct gred_sched *table)
89{
90 __clear_bit(GRED_RIO_MODE, &table->flags);
91}
92
dea3f628
TG
93static inline int gred_wred_mode_check(struct Qdisc *sch)
94{
95 struct gred_sched *table = qdisc_priv(sch);
96 int i;
97
98 /* Really ugly O(n^2) but shouldn't be necessary too frequent. */
99 for (i = 0; i < table->DPs; i++) {
100 struct gred_sched_data *q = table->tab[i];
101 int n;
102
103 if (q == NULL)
104 continue;
105
106 for (n = 0; n < table->DPs; n++)
107 if (table->tab[n] && table->tab[n] != q &&
108 table->tab[n]->prio == q->prio)
109 return 1;
110 }
111
112 return 0;
113}
114
22b33429
TG
115static inline unsigned int gred_backlog(struct gred_sched *table,
116 struct gred_sched_data *q,
117 struct Qdisc *sch)
118{
119 if (gred_wred_mode(table))
120 return sch->qstats.backlog;
121 else
122 return q->backlog;
123}
124
716a1b40
TG
125static inline u16 tc_index_to_dp(struct sk_buff *skb)
126{
127 return skb->tc_index & GRED_VQ_MASK;
128}
129
7051703b
TG
130static inline void gred_load_wred_set(struct gred_sched *table,
131 struct gred_sched_data *q)
132{
133 q->parms.qavg = table->wred_set.qavg;
134 q->parms.qidlestart = table->wred_set.qidlestart;
135}
136
137static inline void gred_store_wred_set(struct gred_sched *table,
138 struct gred_sched_data *q)
139{
140 table->wred_set.qavg = q->parms.qavg;
141}
142
b38c7eef
TG
143static inline int gred_use_ecn(struct gred_sched *t)
144{
145 return t->red_flags & TC_RED_ECN;
146}
147
bdc450a0
TG
148static inline int gred_use_harddrop(struct gred_sched *t)
149{
150 return t->red_flags & TC_RED_HARDDROP;
151}
152
1e4dfaf9 153static int gred_enqueue(struct sk_buff *skb, struct Qdisc* sch)
1da177e4 154{
1da177e4
LT
155 struct gred_sched_data *q=NULL;
156 struct gred_sched *t= qdisc_priv(sch);
22b33429 157 unsigned long qavg = 0;
4a591834 158 u16 dp = tc_index_to_dp(skb);
1da177e4 159
716a1b40 160 if (dp >= t->DPs || (q = t->tab[dp]) == NULL) {
18e3fb84
TG
161 dp = t->def;
162
163 if ((q = t->tab[dp]) == NULL) {
164 /* Pass through packets not assigned to a DP
165 * if no default DP has been configured. This
166 * allows for DP flows to be left untouched.
167 */
168 if (skb_queue_len(&sch->q) < sch->dev->tx_queue_len)
169 return qdisc_enqueue_tail(skb, sch);
170 else
171 goto drop;
1da177e4 172 }
18e3fb84 173
1da177e4
LT
174 /* fix tc_index? --could be controvesial but needed for
175 requeueing */
18e3fb84 176 skb->tc_index = (skb->tc_index & ~GRED_VQ_MASK) | dp;
1da177e4
LT
177 }
178
1e4dfaf9 179 /* sum up all the qaves of prios <= to ours to get the new qave */
d6fd4e96 180 if (!gred_wred_mode(t) && gred_rio_mode(t)) {
1e4dfaf9
TG
181 int i;
182
183 for (i = 0; i < t->DPs; i++) {
184 if (t->tab[i] && t->tab[i]->prio < q->prio &&
22b33429
TG
185 !red_is_idling(&t->tab[i]->parms))
186 qavg +=t->tab[i]->parms.qavg;
1da177e4 187 }
1e4dfaf9 188
1da177e4
LT
189 }
190
191 q->packetsin++;
1e4dfaf9 192 q->bytesin += skb->len;
1da177e4 193
1e4dfaf9 194 if (gred_wred_mode(t))
7051703b 195 gred_load_wred_set(t, q);
1da177e4 196
22b33429 197 q->parms.qavg = red_calc_qavg(&q->parms, gred_backlog(t, q, sch));
1da177e4 198
22b33429
TG
199 if (red_is_idling(&q->parms))
200 red_end_of_idle_period(&q->parms);
1da177e4 201
dea3f628 202 if (gred_wred_mode(t))
7051703b 203 gred_store_wred_set(t, q);
1da177e4 204
22b33429
TG
205 switch (red_action(&q->parms, q->parms.qavg + qavg)) {
206 case RED_DONT_MARK:
207 break;
1da177e4 208
22b33429
TG
209 case RED_PROB_MARK:
210 sch->qstats.overlimits++;
b38c7eef
TG
211 if (!gred_use_ecn(t) || !INET_ECN_set_ce(skb)) {
212 q->stats.prob_drop++;
213 goto congestion_drop;
214 }
215
216 q->stats.prob_mark++;
217 break;
22b33429
TG
218
219 case RED_HARD_MARK:
220 sch->qstats.overlimits++;
bdc450a0
TG
221 if (gred_use_harddrop(t) || !gred_use_ecn(t) ||
222 !INET_ECN_set_ce(skb)) {
b38c7eef
TG
223 q->stats.forced_drop++;
224 goto congestion_drop;
225 }
226 q->stats.forced_mark++;
227 break;
1da177e4 228 }
22b33429
TG
229
230 if (q->backlog + skb->len <= q->limit) {
231 q->backlog += skb->len;
edf7a7b1 232 return qdisc_enqueue_tail(skb, sch);
1da177e4 233 }
22b33429
TG
234
235 q->stats.pdrop++;
236drop:
edf7a7b1 237 return qdisc_drop(skb, sch);
c3b553cd
TG
238
239congestion_drop:
edf7a7b1 240 qdisc_drop(skb, sch);
c3b553cd 241 return NET_XMIT_CN;
1da177e4
LT
242}
243
1e4dfaf9 244static int gred_requeue(struct sk_buff *skb, struct Qdisc* sch)
1da177e4 245{
716a1b40 246 struct gred_sched *t = qdisc_priv(sch);
18e3fb84
TG
247 struct gred_sched_data *q;
248 u16 dp = tc_index_to_dp(skb);
249
250 if (dp >= t->DPs || (q = t->tab[dp]) == NULL) {
251 if (net_ratelimit())
252 printk(KERN_WARNING "GRED: Unable to relocate VQ 0x%x "
253 "for requeue, screwing up backlog.\n",
254 tc_index_to_dp(skb));
255 } else {
256 if (red_is_idling(&q->parms))
257 red_end_of_idle_period(&q->parms);
258 q->backlog += skb->len;
259 }
1da177e4 260
edf7a7b1 261 return qdisc_requeue(skb, sch);
1da177e4
LT
262}
263
1e4dfaf9 264static struct sk_buff *gred_dequeue(struct Qdisc* sch)
1da177e4
LT
265{
266 struct sk_buff *skb;
1e4dfaf9 267 struct gred_sched *t = qdisc_priv(sch);
1da177e4 268
edf7a7b1
TG
269 skb = qdisc_dequeue_head(sch);
270
1da177e4 271 if (skb) {
1e4dfaf9 272 struct gred_sched_data *q;
18e3fb84
TG
273 u16 dp = tc_index_to_dp(skb);
274
275 if (dp >= t->DPs || (q = t->tab[dp]) == NULL) {
276 if (net_ratelimit())
277 printk(KERN_WARNING "GRED: Unable to relocate "
278 "VQ 0x%x after dequeue, screwing up "
279 "backlog.\n", tc_index_to_dp(skb));
280 } else {
1da177e4 281 q->backlog -= skb->len;
18e3fb84 282
dea3f628 283 if (!q->backlog && !gred_wred_mode(t))
22b33429 284 red_start_of_idle_period(&q->parms);
1da177e4 285 }
18e3fb84 286
1da177e4
LT
287 return skb;
288 }
289
d8f64e19 290 if (gred_wred_mode(t) && !red_is_idling(&t->wred_set))
7051703b 291 red_start_of_idle_period(&t->wred_set);
1da177e4
LT
292
293 return NULL;
294}
295
296static unsigned int gred_drop(struct Qdisc* sch)
297{
298 struct sk_buff *skb;
1e4dfaf9 299 struct gred_sched *t = qdisc_priv(sch);
1da177e4 300
edf7a7b1 301 skb = qdisc_dequeue_tail(sch);
1da177e4
LT
302 if (skb) {
303 unsigned int len = skb->len;
1e4dfaf9 304 struct gred_sched_data *q;
18e3fb84
TG
305 u16 dp = tc_index_to_dp(skb);
306
307 if (dp >= t->DPs || (q = t->tab[dp]) == NULL) {
308 if (net_ratelimit())
309 printk(KERN_WARNING "GRED: Unable to relocate "
310 "VQ 0x%x while dropping, screwing up "
311 "backlog.\n", tc_index_to_dp(skb));
312 } else {
1da177e4 313 q->backlog -= len;
22b33429 314 q->stats.other++;
18e3fb84 315
dea3f628 316 if (!q->backlog && !gred_wred_mode(t))
22b33429 317 red_start_of_idle_period(&q->parms);
1da177e4
LT
318 }
319
edf7a7b1 320 qdisc_drop(skb, sch);
1da177e4
LT
321 return len;
322 }
323
d8f64e19 324 if (gred_wred_mode(t) && !red_is_idling(&t->wred_set))
7051703b 325 red_start_of_idle_period(&t->wred_set);
1da177e4 326
1da177e4
LT
327 return 0;
328
329}
330
331static void gred_reset(struct Qdisc* sch)
332{
333 int i;
1e4dfaf9 334 struct gred_sched *t = qdisc_priv(sch);
1da177e4 335
edf7a7b1 336 qdisc_reset_queue(sch);
1da177e4 337
1e4dfaf9
TG
338 for (i = 0; i < t->DPs; i++) {
339 struct gred_sched_data *q = t->tab[i];
340
341 if (!q)
342 continue;
343
22b33429 344 red_restart(&q->parms);
1da177e4 345 q->backlog = 0;
1da177e4
LT
346 }
347}
348
6639607e
TG
/* Release the memory of one VQ; the caller clears any table slot. */
static inline void gred_destroy_vq(struct gred_sched_data *q)
{
	kfree(q);
}
353
354static inline int gred_change_table_def(struct Qdisc *sch, struct rtattr *dps)
1da177e4
LT
355{
356 struct gred_sched *table = qdisc_priv(sch);
1da177e4 357 struct tc_gred_sopt *sopt;
6639607e 358 int i;
1da177e4 359
6639607e 360 if (dps == NULL || RTA_PAYLOAD(dps) < sizeof(*sopt))
1da177e4
LT
361 return -EINVAL;
362
6639607e 363 sopt = RTA_DATA(dps);
1da177e4 364
6639607e
TG
365 if (sopt->DPs > MAX_DPs || sopt->DPs == 0 || sopt->def_DP >= sopt->DPs)
366 return -EINVAL;
1da177e4 367
6639607e
TG
368 sch_tree_lock(sch);
369 table->DPs = sopt->DPs;
370 table->def = sopt->def_DP;
b38c7eef 371 table->red_flags = sopt->flags;
dea3f628 372
6639607e
TG
373 /*
374 * Every entry point to GRED is synchronized with the above code
375 * and the DP is checked against DPs, i.e. shadowed VQs can no
376 * longer be found so we can unlock right here.
377 */
378 sch_tree_unlock(sch);
dea3f628 379
6639607e
TG
380 if (sopt->grio) {
381 gred_enable_rio_mode(table);
382 gred_disable_wred_mode(table);
383 if (gred_wred_mode_check(sch))
384 gred_enable_wred_mode(table);
385 } else {
386 gred_disable_rio_mode(table);
387 gred_disable_wred_mode(table);
388 }
389
390 for (i = table->DPs; i < MAX_DPs; i++) {
391 if (table->tab[i]) {
392 printk(KERN_WARNING "GRED: Warning: Destroying "
393 "shadowed VQ 0x%x\n", i);
394 gred_destroy_vq(table->tab[i]);
395 table->tab[i] = NULL;
396 }
397 }
1da177e4 398
6639607e
TG
399 return 0;
400}
401
f62d6b93
TG
402static inline int gred_change_vq(struct Qdisc *sch, int dp,
403 struct tc_gred_qopt *ctl, int prio, u8 *stab)
6639607e
TG
404{
405 struct gred_sched *table = qdisc_priv(sch);
406 struct gred_sched_data *q;
f62d6b93
TG
407
408 if (table->tab[dp] == NULL) {
0da974f4 409 table->tab[dp] = kzalloc(sizeof(*q), GFP_KERNEL);
f62d6b93
TG
410 if (table->tab[dp] == NULL)
411 return -ENOMEM;
f62d6b93
TG
412 }
413
414 q = table->tab[dp];
415 q->DP = dp;
416 q->prio = prio;
f62d6b93 417 q->limit = ctl->limit;
22b33429
TG
418
419 if (q->backlog == 0)
420 red_end_of_idle_period(&q->parms);
421
422 red_set_parms(&q->parms,
423 ctl->qth_min, ctl->qth_max, ctl->Wlog, ctl->Plog,
424 ctl->Scell_log, stab);
425
f62d6b93
TG
426 return 0;
427}
428
429static int gred_change(struct Qdisc *sch, struct rtattr *opt)
430{
431 struct gred_sched *table = qdisc_priv(sch);
6639607e 432 struct tc_gred_qopt *ctl;
f62d6b93
TG
433 struct rtattr *tb[TCA_GRED_MAX];
434 int err = -EINVAL, prio = GRED_DEF_PRIO;
435 u8 *stab;
6639607e 436
f62d6b93 437 if (opt == NULL || rtattr_parse_nested(tb, TCA_GRED_MAX, opt))
6639607e
TG
438 return -EINVAL;
439
440 if (tb[TCA_GRED_PARMS-1] == NULL && tb[TCA_GRED_STAB-1] == NULL)
f62d6b93 441 return gred_change_table_def(sch, opt);
1da177e4 442
f62d6b93
TG
443 if (tb[TCA_GRED_PARMS-1] == NULL ||
444 RTA_PAYLOAD(tb[TCA_GRED_PARMS-1]) < sizeof(*ctl) ||
445 tb[TCA_GRED_STAB-1] == NULL ||
446 RTA_PAYLOAD(tb[TCA_GRED_STAB-1]) < 256)
447 return -EINVAL;
1da177e4
LT
448
449 ctl = RTA_DATA(tb[TCA_GRED_PARMS-1]);
f62d6b93 450 stab = RTA_DATA(tb[TCA_GRED_STAB-1]);
a8aaa995
TG
451
452 if (ctl->DP >= table->DPs)
f62d6b93 453 goto errout;
1da177e4 454
d6fd4e96 455 if (gred_rio_mode(table)) {
f62d6b93
TG
456 if (ctl->prio == 0) {
457 int def_prio = GRED_DEF_PRIO;
458
459 if (table->tab[table->def])
460 def_prio = table->tab[table->def]->prio;
461
462 printk(KERN_DEBUG "GRED: DP %u does not have a prio "
463 "setting default to %d\n", ctl->DP, def_prio);
464
465 prio = def_prio;
466 } else
467 prio = ctl->prio;
1da177e4
LT
468 }
469
f62d6b93 470 sch_tree_lock(sch);
1da177e4 471
f62d6b93
TG
472 err = gred_change_vq(sch, ctl->DP, ctl, prio, stab);
473 if (err < 0)
474 goto errout_locked;
1da177e4 475
d6fd4e96 476 if (gred_rio_mode(table)) {
dea3f628
TG
477 gred_disable_wred_mode(table);
478 if (gred_wred_mode_check(sch))
479 gred_enable_wred_mode(table);
1da177e4
LT
480 }
481
f62d6b93 482 err = 0;
1da177e4 483
f62d6b93
TG
484errout_locked:
485 sch_tree_unlock(sch);
486errout:
487 return err;
1da177e4
LT
488}
489
490static int gred_init(struct Qdisc *sch, struct rtattr *opt)
491{
6639607e 492 struct rtattr *tb[TCA_GRED_MAX];
1da177e4 493
6639607e 494 if (opt == NULL || rtattr_parse_nested(tb, TCA_GRED_MAX, opt))
1da177e4
LT
495 return -EINVAL;
496
6639607e
TG
497 if (tb[TCA_GRED_PARMS-1] || tb[TCA_GRED_STAB-1])
498 return -EINVAL;
1da177e4 499
6639607e 500 return gred_change_table_def(sch, tb[TCA_GRED_DPS-1]);
1da177e4
LT
501}
502
503static int gred_dump(struct Qdisc *sch, struct sk_buff *skb)
504{
1da177e4 505 struct gred_sched *table = qdisc_priv(sch);
05f1cc01 506 struct rtattr *parms, *opts = NULL;
1da177e4 507 int i;
e0636822
TG
508 struct tc_gred_sopt sopt = {
509 .DPs = table->DPs,
510 .def_DP = table->def,
511 .grio = gred_rio_mode(table),
b38c7eef 512 .flags = table->red_flags,
e0636822 513 };
1da177e4 514
05f1cc01 515 opts = RTA_NEST(skb, TCA_OPTIONS);
e0636822 516 RTA_PUT(skb, TCA_GRED_DPS, sizeof(sopt), &sopt);
05f1cc01 517 parms = RTA_NEST(skb, TCA_GRED_PARMS);
1da177e4 518
05f1cc01
TG
519 for (i = 0; i < MAX_DPs; i++) {
520 struct gred_sched_data *q = table->tab[i];
521 struct tc_gred_qopt opt;
1da177e4 522
05f1cc01 523 memset(&opt, 0, sizeof(opt));
1da177e4
LT
524
525 if (!q) {
526 /* hack -- fix at some point with proper message
527 This is how we indicate to tc that there is no VQ
528 at this DP */
529
05f1cc01
TG
530 opt.DP = MAX_DPs + i;
531 goto append_opt;
1da177e4
LT
532 }
533
05f1cc01
TG
534 opt.limit = q->limit;
535 opt.DP = q->DP;
536 opt.backlog = q->backlog;
537 opt.prio = q->prio;
22b33429
TG
538 opt.qth_min = q->parms.qth_min >> q->parms.Wlog;
539 opt.qth_max = q->parms.qth_max >> q->parms.Wlog;
540 opt.Wlog = q->parms.Wlog;
541 opt.Plog = q->parms.Plog;
542 opt.Scell_log = q->parms.Scell_log;
543 opt.other = q->stats.other;
544 opt.early = q->stats.prob_drop;
545 opt.forced = q->stats.forced_drop;
546 opt.pdrop = q->stats.pdrop;
05f1cc01
TG
547 opt.packets = q->packetsin;
548 opt.bytesin = q->bytesin;
549
22b33429
TG
550 if (gred_wred_mode(table)) {
551 q->parms.qidlestart =
552 table->tab[table->def]->parms.qidlestart;
553 q->parms.qavg = table->tab[table->def]->parms.qavg;
1da177e4 554 }
05f1cc01 555
22b33429
TG
556 opt.qave = red_calc_qavg(&q->parms, q->parms.qavg);
557
05f1cc01
TG
558append_opt:
559 RTA_APPEND(skb, sizeof(opt), &opt);
1da177e4
LT
560 }
561
05f1cc01 562 RTA_NEST_END(skb, parms);
1da177e4 563
05f1cc01 564 return RTA_NEST_END(skb, opts);
1da177e4
LT
565
566rtattr_failure:
05f1cc01 567 return RTA_NEST_CANCEL(skb, opts);
1da177e4
LT
568}
569
570static void gred_destroy(struct Qdisc *sch)
571{
572 struct gred_sched *table = qdisc_priv(sch);
573 int i;
574
1e4dfaf9 575 for (i = 0; i < table->DPs; i++) {
1da177e4 576 if (table->tab[i])
6639607e 577 gred_destroy_vq(table->tab[i]);
1da177e4
LT
578 }
579}
580
581static struct Qdisc_ops gred_qdisc_ops = {
1da177e4
LT
582 .id = "gred",
583 .priv_size = sizeof(struct gred_sched),
584 .enqueue = gred_enqueue,
585 .dequeue = gred_dequeue,
586 .requeue = gred_requeue,
587 .drop = gred_drop,
588 .init = gred_init,
589 .reset = gred_reset,
590 .destroy = gred_destroy,
591 .change = gred_change,
592 .dump = gred_dump,
593 .owner = THIS_MODULE,
594};
595
596static int __init gred_module_init(void)
597{
598 return register_qdisc(&gred_qdisc_ops);
599}
1e4dfaf9
TG
600
601static void __exit gred_module_exit(void)
1da177e4
LT
602{
603 unregister_qdisc(&gred_qdisc_ops);
604}
1e4dfaf9 605
1da177e4
LT
606module_init(gred_module_init)
607module_exit(gred_module_exit)
1e4dfaf9 608
1da177e4 609MODULE_LICENSE("GPL");