mirror of
				git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
				synced 2025-09-04 20:19:47 +08:00 
			
		
		
		
	 1b34ec43c9
			
		
	
	
		1b34ec43c9
		
	
	
	
	
		
			
			These macros contain a hidden goto, and are thus extremely error prone and make code hard to audit. Signed-off-by: David S. Miller <davem@davemloft.net>
		
			
				
	
	
		
			392 lines
		
	
	
		
			8.7 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			392 lines
		
	
	
		
			8.7 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * net/sched/sch_red.c	Random Early Detection queue.
 | |
|  *
 | |
|  *		This program is free software; you can redistribute it and/or
 | |
|  *		modify it under the terms of the GNU General Public License
 | |
|  *		as published by the Free Software Foundation; either version
 | |
|  *		2 of the License, or (at your option) any later version.
 | |
|  *
 | |
|  * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 | |
|  *
 | |
|  * Changes:
 | |
|  * J Hadi Salim 980914:	computation fixes
 | |
|  * Alexey Makarenko <makar@phoenix.kharkov.ua> 990814: qave on idle link was calculated incorrectly.
 | |
|  * J Hadi Salim 980816:  ECN support
 | |
|  */
 | |
| 
 | |
| #include <linux/module.h>
 | |
| #include <linux/types.h>
 | |
| #include <linux/kernel.h>
 | |
| #include <linux/skbuff.h>
 | |
| #include <net/pkt_sched.h>
 | |
| #include <net/inet_ecn.h>
 | |
| #include <net/red.h>
 | |
| 
 | |
| 
 | |
| /*	Parameters, settable by user:
 | |
| 	-----------------------------
 | |
| 
 | |
| 	limit		- bytes (must be > qth_max + burst)
 | |
| 
 | |
| 	Hard limit on queue length, should be chosen >qth_max
 | |
| 	to allow packet bursts. This parameter does not
 | |
| 	affect the algorithm's behaviour and can be chosen
 | |
| 	arbitrarily high (well, less than ram size)
 | |
| 	Really, this limit will never be reached
 | |
| 	if RED works correctly.
 | |
|  */
 | |
| 
 | |
| struct red_sched_data {
 | |
| 	u32			limit;		/* HARD maximal queue length */
 | |
| 	unsigned char		flags;
 | |
| 	struct timer_list	adapt_timer;
 | |
| 	struct red_parms	parms;
 | |
| 	struct red_vars		vars;
 | |
| 	struct red_stats	stats;
 | |
| 	struct Qdisc		*qdisc;
 | |
| };
 | |
| 
 | |
| static inline int red_use_ecn(struct red_sched_data *q)
 | |
| {
 | |
| 	return q->flags & TC_RED_ECN;
 | |
| }
 | |
| 
 | |
| static inline int red_use_harddrop(struct red_sched_data *q)
 | |
| {
 | |
| 	return q->flags & TC_RED_HARDDROP;
 | |
| }
 | |
| 
 | |
| static int red_enqueue(struct sk_buff *skb, struct Qdisc *sch)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 	struct Qdisc *child = q->qdisc;
 | |
| 	int ret;
 | |
| 
 | |
| 	q->vars.qavg = red_calc_qavg(&q->parms,
 | |
| 				     &q->vars,
 | |
| 				     child->qstats.backlog);
 | |
| 
 | |
| 	if (red_is_idling(&q->vars))
 | |
| 		red_end_of_idle_period(&q->vars);
 | |
| 
 | |
| 	switch (red_action(&q->parms, &q->vars, q->vars.qavg)) {
 | |
| 	case RED_DONT_MARK:
 | |
| 		break;
 | |
| 
 | |
| 	case RED_PROB_MARK:
 | |
| 		sch->qstats.overlimits++;
 | |
| 		if (!red_use_ecn(q) || !INET_ECN_set_ce(skb)) {
 | |
| 			q->stats.prob_drop++;
 | |
| 			goto congestion_drop;
 | |
| 		}
 | |
| 
 | |
| 		q->stats.prob_mark++;
 | |
| 		break;
 | |
| 
 | |
| 	case RED_HARD_MARK:
 | |
| 		sch->qstats.overlimits++;
 | |
| 		if (red_use_harddrop(q) || !red_use_ecn(q) ||
 | |
| 		    !INET_ECN_set_ce(skb)) {
 | |
| 			q->stats.forced_drop++;
 | |
| 			goto congestion_drop;
 | |
| 		}
 | |
| 
 | |
| 		q->stats.forced_mark++;
 | |
| 		break;
 | |
| 	}
 | |
| 
 | |
| 	ret = qdisc_enqueue(skb, child);
 | |
| 	if (likely(ret == NET_XMIT_SUCCESS)) {
 | |
| 		sch->q.qlen++;
 | |
| 	} else if (net_xmit_drop_count(ret)) {
 | |
| 		q->stats.pdrop++;
 | |
| 		sch->qstats.drops++;
 | |
| 	}
 | |
| 	return ret;
 | |
| 
 | |
| congestion_drop:
 | |
| 	qdisc_drop(skb, sch);
 | |
| 	return NET_XMIT_CN;
 | |
| }
 | |
| 
 | |
| static struct sk_buff *red_dequeue(struct Qdisc *sch)
 | |
| {
 | |
| 	struct sk_buff *skb;
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 	struct Qdisc *child = q->qdisc;
 | |
| 
 | |
| 	skb = child->dequeue(child);
 | |
| 	if (skb) {
 | |
| 		qdisc_bstats_update(sch, skb);
 | |
| 		sch->q.qlen--;
 | |
| 	} else {
 | |
| 		if (!red_is_idling(&q->vars))
 | |
| 			red_start_of_idle_period(&q->vars);
 | |
| 	}
 | |
| 	return skb;
 | |
| }
 | |
| 
 | |
| static struct sk_buff *red_peek(struct Qdisc *sch)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 	struct Qdisc *child = q->qdisc;
 | |
| 
 | |
| 	return child->ops->peek(child);
 | |
| }
 | |
| 
 | |
| static unsigned int red_drop(struct Qdisc *sch)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 	struct Qdisc *child = q->qdisc;
 | |
| 	unsigned int len;
 | |
| 
 | |
| 	if (child->ops->drop && (len = child->ops->drop(child)) > 0) {
 | |
| 		q->stats.other++;
 | |
| 		sch->qstats.drops++;
 | |
| 		sch->q.qlen--;
 | |
| 		return len;
 | |
| 	}
 | |
| 
 | |
| 	if (!red_is_idling(&q->vars))
 | |
| 		red_start_of_idle_period(&q->vars);
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static void red_reset(struct Qdisc *sch)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 
 | |
| 	qdisc_reset(q->qdisc);
 | |
| 	sch->q.qlen = 0;
 | |
| 	red_restart(&q->vars);
 | |
| }
 | |
| 
 | |
| static void red_destroy(struct Qdisc *sch)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 
 | |
| 	del_timer_sync(&q->adapt_timer);
 | |
| 	qdisc_destroy(q->qdisc);
 | |
| }
 | |
| 
 | |
| static const struct nla_policy red_policy[TCA_RED_MAX + 1] = {
 | |
| 	[TCA_RED_PARMS]	= { .len = sizeof(struct tc_red_qopt) },
 | |
| 	[TCA_RED_STAB]	= { .len = RED_STAB_SIZE },
 | |
| 	[TCA_RED_MAX_P] = { .type = NLA_U32 },
 | |
| };
 | |
| 
 | |
| static int red_change(struct Qdisc *sch, struct nlattr *opt)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 	struct nlattr *tb[TCA_RED_MAX + 1];
 | |
| 	struct tc_red_qopt *ctl;
 | |
| 	struct Qdisc *child = NULL;
 | |
| 	int err;
 | |
| 	u32 max_P;
 | |
| 
 | |
| 	if (opt == NULL)
 | |
| 		return -EINVAL;
 | |
| 
 | |
| 	err = nla_parse_nested(tb, TCA_RED_MAX, opt, red_policy);
 | |
| 	if (err < 0)
 | |
| 		return err;
 | |
| 
 | |
| 	if (tb[TCA_RED_PARMS] == NULL ||
 | |
| 	    tb[TCA_RED_STAB] == NULL)
 | |
| 		return -EINVAL;
 | |
| 
 | |
| 	max_P = tb[TCA_RED_MAX_P] ? nla_get_u32(tb[TCA_RED_MAX_P]) : 0;
 | |
| 
 | |
| 	ctl = nla_data(tb[TCA_RED_PARMS]);
 | |
| 
 | |
| 	if (ctl->limit > 0) {
 | |
| 		child = fifo_create_dflt(sch, &bfifo_qdisc_ops, ctl->limit);
 | |
| 		if (IS_ERR(child))
 | |
| 			return PTR_ERR(child);
 | |
| 	}
 | |
| 
 | |
| 	sch_tree_lock(sch);
 | |
| 	q->flags = ctl->flags;
 | |
| 	q->limit = ctl->limit;
 | |
| 	if (child) {
 | |
| 		qdisc_tree_decrease_qlen(q->qdisc, q->qdisc->q.qlen);
 | |
| 		qdisc_destroy(q->qdisc);
 | |
| 		q->qdisc = child;
 | |
| 	}
 | |
| 
 | |
| 	red_set_parms(&q->parms,
 | |
| 		      ctl->qth_min, ctl->qth_max, ctl->Wlog,
 | |
| 		      ctl->Plog, ctl->Scell_log,
 | |
| 		      nla_data(tb[TCA_RED_STAB]),
 | |
| 		      max_P);
 | |
| 	red_set_vars(&q->vars);
 | |
| 
 | |
| 	del_timer(&q->adapt_timer);
 | |
| 	if (ctl->flags & TC_RED_ADAPTATIVE)
 | |
| 		mod_timer(&q->adapt_timer, jiffies + HZ/2);
 | |
| 
 | |
| 	if (!q->qdisc->q.qlen)
 | |
| 		red_start_of_idle_period(&q->vars);
 | |
| 
 | |
| 	sch_tree_unlock(sch);
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static inline void red_adaptative_timer(unsigned long arg)
 | |
| {
 | |
| 	struct Qdisc *sch = (struct Qdisc *)arg;
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 	spinlock_t *root_lock = qdisc_lock(qdisc_root_sleeping(sch));
 | |
| 
 | |
| 	spin_lock(root_lock);
 | |
| 	red_adaptative_algo(&q->parms, &q->vars);
 | |
| 	mod_timer(&q->adapt_timer, jiffies + HZ/2);
 | |
| 	spin_unlock(root_lock);
 | |
| }
 | |
| 
 | |
| static int red_init(struct Qdisc *sch, struct nlattr *opt)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 
 | |
| 	q->qdisc = &noop_qdisc;
 | |
| 	setup_timer(&q->adapt_timer, red_adaptative_timer, (unsigned long)sch);
 | |
| 	return red_change(sch, opt);
 | |
| }
 | |
| 
 | |
| static int red_dump(struct Qdisc *sch, struct sk_buff *skb)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 	struct nlattr *opts = NULL;
 | |
| 	struct tc_red_qopt opt = {
 | |
| 		.limit		= q->limit,
 | |
| 		.flags		= q->flags,
 | |
| 		.qth_min	= q->parms.qth_min >> q->parms.Wlog,
 | |
| 		.qth_max	= q->parms.qth_max >> q->parms.Wlog,
 | |
| 		.Wlog		= q->parms.Wlog,
 | |
| 		.Plog		= q->parms.Plog,
 | |
| 		.Scell_log	= q->parms.Scell_log,
 | |
| 	};
 | |
| 
 | |
| 	sch->qstats.backlog = q->qdisc->qstats.backlog;
 | |
| 	opts = nla_nest_start(skb, TCA_OPTIONS);
 | |
| 	if (opts == NULL)
 | |
| 		goto nla_put_failure;
 | |
| 	if (nla_put(skb, TCA_RED_PARMS, sizeof(opt), &opt) ||
 | |
| 	    nla_put_u32(skb, TCA_RED_MAX_P, q->parms.max_P))
 | |
| 		goto nla_put_failure;
 | |
| 	return nla_nest_end(skb, opts);
 | |
| 
 | |
| nla_put_failure:
 | |
| 	nla_nest_cancel(skb, opts);
 | |
| 	return -EMSGSIZE;
 | |
| }
 | |
| 
 | |
| static int red_dump_stats(struct Qdisc *sch, struct gnet_dump *d)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 	struct tc_red_xstats st = {
 | |
| 		.early	= q->stats.prob_drop + q->stats.forced_drop,
 | |
| 		.pdrop	= q->stats.pdrop,
 | |
| 		.other	= q->stats.other,
 | |
| 		.marked	= q->stats.prob_mark + q->stats.forced_mark,
 | |
| 	};
 | |
| 
 | |
| 	return gnet_stats_copy_app(d, &st, sizeof(st));
 | |
| }
 | |
| 
 | |
| static int red_dump_class(struct Qdisc *sch, unsigned long cl,
 | |
| 			  struct sk_buff *skb, struct tcmsg *tcm)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 
 | |
| 	tcm->tcm_handle |= TC_H_MIN(1);
 | |
| 	tcm->tcm_info = q->qdisc->handle;
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int red_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
 | |
| 		     struct Qdisc **old)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 
 | |
| 	if (new == NULL)
 | |
| 		new = &noop_qdisc;
 | |
| 
 | |
| 	sch_tree_lock(sch);
 | |
| 	*old = q->qdisc;
 | |
| 	q->qdisc = new;
 | |
| 	qdisc_tree_decrease_qlen(*old, (*old)->q.qlen);
 | |
| 	qdisc_reset(*old);
 | |
| 	sch_tree_unlock(sch);
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static struct Qdisc *red_leaf(struct Qdisc *sch, unsigned long arg)
 | |
| {
 | |
| 	struct red_sched_data *q = qdisc_priv(sch);
 | |
| 	return q->qdisc;
 | |
| }
 | |
| 
 | |
| static unsigned long red_get(struct Qdisc *sch, u32 classid)
 | |
| {
 | |
| 	return 1;
 | |
| }
 | |
| 
 | |
/* Counterpart of red_get(); intentionally does nothing. */
static void red_put(struct Qdisc *sch, unsigned long arg)
{
	/* nothing to release */
}
 | |
| 
 | |
| static void red_walk(struct Qdisc *sch, struct qdisc_walker *walker)
 | |
| {
 | |
| 	if (!walker->stop) {
 | |
| 		if (walker->count >= walker->skip)
 | |
| 			if (walker->fn(sch, 1, walker) < 0) {
 | |
| 				walker->stop = 1;
 | |
| 				return;
 | |
| 			}
 | |
| 		walker->count++;
 | |
| 	}
 | |
| }
 | |
| 
 | |
| static const struct Qdisc_class_ops red_class_ops = {
 | |
| 	.graft		=	red_graft,
 | |
| 	.leaf		=	red_leaf,
 | |
| 	.get		=	red_get,
 | |
| 	.put		=	red_put,
 | |
| 	.walk		=	red_walk,
 | |
| 	.dump		=	red_dump_class,
 | |
| };
 | |
| 
 | |
| static struct Qdisc_ops red_qdisc_ops __read_mostly = {
 | |
| 	.id		=	"red",
 | |
| 	.priv_size	=	sizeof(struct red_sched_data),
 | |
| 	.cl_ops		=	&red_class_ops,
 | |
| 	.enqueue	=	red_enqueue,
 | |
| 	.dequeue	=	red_dequeue,
 | |
| 	.peek		=	red_peek,
 | |
| 	.drop		=	red_drop,
 | |
| 	.init		=	red_init,
 | |
| 	.reset		=	red_reset,
 | |
| 	.destroy	=	red_destroy,
 | |
| 	.change		=	red_change,
 | |
| 	.dump		=	red_dump,
 | |
| 	.dump_stats	=	red_dump_stats,
 | |
| 	.owner		=	THIS_MODULE,
 | |
| };
 | |
| 
 | |
| static int __init red_module_init(void)
 | |
| {
 | |
| 	return register_qdisc(&red_qdisc_ops);
 | |
| }
 | |
| 
 | |
| static void __exit red_module_exit(void)
 | |
| {
 | |
| 	unregister_qdisc(&red_qdisc_ops);
 | |
| }
 | |
| 
 | |
| module_init(red_module_init)
 | |
| module_exit(red_module_exit)
 | |
| 
 | |
| MODULE_LICENSE("GPL");
 |