6b31b28a44
Simplifies code a lot by separating the red algorithm and the queueing logic. We now differentiate between probability marks and forced marks but sum them together again to not break backwards compatibility. Signed-off-by: Thomas Graf <tgraf@suug.ch> Signed-off-by: Arnaldo Carvalho de Melo <acme@mandriva.com>
287 lines
6.5 KiB
C
287 lines
6.5 KiB
C
/*
|
|
* net/sched/sch_red.c Random Early Detection queue.
|
|
*
|
|
* This program is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU General Public License
|
|
* as published by the Free Software Foundation; either version
|
|
* 2 of the License, or (at your option) any later version.
|
|
*
|
|
* Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
|
|
*
|
|
* Changes:
|
|
* J Hadi Salim <hadi@nortel.com> 980914: computation fixes
|
|
* Alexey Makarenko <makar@phoenix.kharkov.ua> 990814: qave on idle link was calculated incorrectly.
|
|
* J Hadi Salim <hadi@nortelnetworks.com> 980816: ECN support
|
|
*/
|
|
|
|
#include <linux/config.h>
|
|
#include <linux/module.h>
|
|
#include <asm/uaccess.h>
|
|
#include <asm/system.h>
|
|
#include <linux/bitops.h>
|
|
#include <linux/types.h>
|
|
#include <linux/kernel.h>
|
|
#include <linux/sched.h>
|
|
#include <linux/string.h>
|
|
#include <linux/mm.h>
|
|
#include <linux/socket.h>
|
|
#include <linux/sockios.h>
|
|
#include <linux/in.h>
|
|
#include <linux/errno.h>
|
|
#include <linux/interrupt.h>
|
|
#include <linux/if_ether.h>
|
|
#include <linux/inet.h>
|
|
#include <linux/netdevice.h>
|
|
#include <linux/etherdevice.h>
|
|
#include <linux/notifier.h>
|
|
#include <net/ip.h>
|
|
#include <net/route.h>
|
|
#include <linux/skbuff.h>
|
|
#include <net/sock.h>
|
|
#include <net/pkt_sched.h>
|
|
#include <net/inet_ecn.h>
|
|
#include <net/dsfield.h>
|
|
#include <net/red.h>
|
|
|
|
|
|
/* Parameters, settable by user:
|
|
-----------------------------
|
|
|
|
limit - bytes (must be > qth_max + burst)
|
|
|
|
Hard limit on queue length, should be chosen >qth_max
|
|
to allow packet bursts. This parameter does not
|
|
affect the algorithms behaviour and can be chosen
|
|
arbitrarily high (well, less than ram size)
|
|
Really, this limit will never be reached
|
|
if RED works correctly.
|
|
*/
|
|
|
|
struct red_sched_data
|
|
{
|
|
u32 limit; /* HARD maximal queue length */
|
|
unsigned char flags;
|
|
struct red_parms parms;
|
|
struct red_stats stats;
|
|
};
|
|
|
|
static inline int red_use_ecn(struct red_sched_data *q)
|
|
{
|
|
return q->flags & TC_RED_ECN;
|
|
}
|
|
|
|
static int
|
|
red_enqueue(struct sk_buff *skb, struct Qdisc* sch)
|
|
{
|
|
struct red_sched_data *q = qdisc_priv(sch);
|
|
|
|
q->parms.qavg = red_calc_qavg(&q->parms, sch->qstats.backlog);
|
|
|
|
if (red_is_idling(&q->parms))
|
|
red_end_of_idle_period(&q->parms);
|
|
|
|
switch (red_action(&q->parms, q->parms.qavg)) {
|
|
case RED_DONT_MARK:
|
|
break;
|
|
|
|
case RED_PROB_MARK:
|
|
sch->qstats.overlimits++;
|
|
if (!red_use_ecn(q) || !INET_ECN_set_ce(skb)) {
|
|
q->stats.prob_drop++;
|
|
goto congestion_drop;
|
|
}
|
|
|
|
q->stats.prob_mark++;
|
|
break;
|
|
|
|
case RED_HARD_MARK:
|
|
sch->qstats.overlimits++;
|
|
if (!red_use_ecn(q) || !INET_ECN_set_ce(skb)) {
|
|
q->stats.forced_drop++;
|
|
goto congestion_drop;
|
|
}
|
|
|
|
q->stats.forced_mark++;
|
|
break;
|
|
}
|
|
|
|
if (sch->qstats.backlog + skb->len <= q->limit) {
|
|
__skb_queue_tail(&sch->q, skb);
|
|
sch->qstats.backlog += skb->len;
|
|
sch->bstats.bytes += skb->len;
|
|
sch->bstats.packets++;
|
|
return NET_XMIT_SUCCESS;
|
|
}
|
|
|
|
q->stats.pdrop++;
|
|
kfree_skb(skb);
|
|
sch->qstats.drops++;
|
|
return NET_XMIT_DROP;
|
|
|
|
congestion_drop:
|
|
kfree_skb(skb);
|
|
sch->qstats.drops++;
|
|
return NET_XMIT_CN;
|
|
}
|
|
|
|
static int
|
|
red_requeue(struct sk_buff *skb, struct Qdisc* sch)
|
|
{
|
|
struct red_sched_data *q = qdisc_priv(sch);
|
|
|
|
if (red_is_idling(&q->parms))
|
|
red_end_of_idle_period(&q->parms);
|
|
|
|
__skb_queue_head(&sch->q, skb);
|
|
sch->qstats.backlog += skb->len;
|
|
sch->qstats.requeues++;
|
|
return 0;
|
|
}
|
|
|
|
static struct sk_buff *
|
|
red_dequeue(struct Qdisc* sch)
|
|
{
|
|
struct sk_buff *skb;
|
|
struct red_sched_data *q = qdisc_priv(sch);
|
|
|
|
skb = __skb_dequeue(&sch->q);
|
|
if (skb) {
|
|
sch->qstats.backlog -= skb->len;
|
|
return skb;
|
|
}
|
|
|
|
red_start_of_idle_period(&q->parms);
|
|
return NULL;
|
|
}
|
|
|
|
static unsigned int red_drop(struct Qdisc* sch)
|
|
{
|
|
struct sk_buff *skb;
|
|
struct red_sched_data *q = qdisc_priv(sch);
|
|
|
|
skb = __skb_dequeue_tail(&sch->q);
|
|
if (skb) {
|
|
unsigned int len = skb->len;
|
|
sch->qstats.backlog -= len;
|
|
sch->qstats.drops++;
|
|
q->stats.other++;
|
|
kfree_skb(skb);
|
|
return len;
|
|
}
|
|
|
|
red_start_of_idle_period(&q->parms);
|
|
return 0;
|
|
}
|
|
|
|
static void red_reset(struct Qdisc* sch)
|
|
{
|
|
struct red_sched_data *q = qdisc_priv(sch);
|
|
|
|
__skb_queue_purge(&sch->q);
|
|
sch->qstats.backlog = 0;
|
|
red_restart(&q->parms);
|
|
}
|
|
|
|
static int red_change(struct Qdisc *sch, struct rtattr *opt)
|
|
{
|
|
struct red_sched_data *q = qdisc_priv(sch);
|
|
struct rtattr *tb[TCA_RED_STAB];
|
|
struct tc_red_qopt *ctl;
|
|
|
|
if (opt == NULL ||
|
|
rtattr_parse_nested(tb, TCA_RED_STAB, opt) ||
|
|
tb[TCA_RED_PARMS-1] == 0 || tb[TCA_RED_STAB-1] == 0 ||
|
|
RTA_PAYLOAD(tb[TCA_RED_PARMS-1]) < sizeof(*ctl) ||
|
|
RTA_PAYLOAD(tb[TCA_RED_STAB-1]) < 256)
|
|
return -EINVAL;
|
|
|
|
ctl = RTA_DATA(tb[TCA_RED_PARMS-1]);
|
|
|
|
sch_tree_lock(sch);
|
|
q->flags = ctl->flags;
|
|
q->limit = ctl->limit;
|
|
|
|
red_set_parms(&q->parms, ctl->qth_min, ctl->qth_max, ctl->Wlog,
|
|
ctl->Plog, ctl->Scell_log,
|
|
RTA_DATA(tb[TCA_RED_STAB-1]));
|
|
|
|
if (skb_queue_empty(&sch->q))
|
|
red_end_of_idle_period(&q->parms);
|
|
sch_tree_unlock(sch);
|
|
return 0;
|
|
}
|
|
|
|
static int red_init(struct Qdisc* sch, struct rtattr *opt)
|
|
{
|
|
return red_change(sch, opt);
|
|
}
|
|
|
|
static int red_dump(struct Qdisc *sch, struct sk_buff *skb)
|
|
{
|
|
struct red_sched_data *q = qdisc_priv(sch);
|
|
unsigned char *b = skb->tail;
|
|
struct rtattr *rta;
|
|
struct tc_red_qopt opt = {
|
|
.limit = q->limit,
|
|
.flags = q->flags,
|
|
.qth_min = q->parms.qth_min >> q->parms.Wlog,
|
|
.qth_max = q->parms.qth_max >> q->parms.Wlog,
|
|
.Wlog = q->parms.Wlog,
|
|
.Plog = q->parms.Plog,
|
|
.Scell_log = q->parms.Scell_log,
|
|
};
|
|
|
|
rta = (struct rtattr*)b;
|
|
RTA_PUT(skb, TCA_OPTIONS, 0, NULL);
|
|
RTA_PUT(skb, TCA_RED_PARMS, sizeof(opt), &opt);
|
|
rta->rta_len = skb->tail - b;
|
|
|
|
return skb->len;
|
|
|
|
rtattr_failure:
|
|
skb_trim(skb, b - skb->data);
|
|
return -1;
|
|
}
|
|
|
|
static int red_dump_stats(struct Qdisc *sch, struct gnet_dump *d)
|
|
{
|
|
struct red_sched_data *q = qdisc_priv(sch);
|
|
struct tc_red_xstats st = {
|
|
.early = q->stats.prob_drop + q->stats.forced_drop,
|
|
.pdrop = q->stats.pdrop,
|
|
.other = q->stats.other,
|
|
.marked = q->stats.prob_mark + q->stats.forced_mark,
|
|
};
|
|
|
|
return gnet_stats_copy_app(d, &st, sizeof(st));
|
|
}
|
|
|
|
static struct Qdisc_ops red_qdisc_ops = {
|
|
.next = NULL,
|
|
.cl_ops = NULL,
|
|
.id = "red",
|
|
.priv_size = sizeof(struct red_sched_data),
|
|
.enqueue = red_enqueue,
|
|
.dequeue = red_dequeue,
|
|
.requeue = red_requeue,
|
|
.drop = red_drop,
|
|
.init = red_init,
|
|
.reset = red_reset,
|
|
.change = red_change,
|
|
.dump = red_dump,
|
|
.dump_stats = red_dump_stats,
|
|
.owner = THIS_MODULE,
|
|
};
|
|
|
|
static int __init red_module_init(void)
|
|
{
|
|
return register_qdisc(&red_qdisc_ops);
|
|
}
|
|
static void __exit red_module_exit(void)
|
|
{
|
|
unregister_qdisc(&red_qdisc_ops);
|
|
}
|
|
module_init(red_module_init)
|
|
module_exit(red_module_exit)
|
|
MODULE_LICENSE("GPL");
|