| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484 | /* * net/sched/sch_prio.c	Simple 3-band priority "scheduler". * *		This program is free software; you can redistribute it and/or *		modify it under the terms of the GNU General Public License *		as published by the Free Software Foundation; either version *		2 of the License, or (at your option) any later version. * * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru> * Fixes:       19990609: J Hadi Salim <hadi@nortelnetworks.com>: *              Init --  EINVAL when opt undefined */#include <linux/module.h>#include <linux/slab.h>#include <linux/types.h>#include <linux/kernel.h>#include <linux/string.h>#include <linux/errno.h>#include <linux/skbuff.h>#include <net/netlink.h>#include <net/pkt_sched.h>#include <net/pkt_cls.h>struct prio_sched_data {	int bands;	struct tcf_proto __rcu *filter_list;	struct tcf_block *block;	u8  prio2band[TC_PRIO_MAX+1];	struct Qdisc *queues[TCQ_PRIO_BANDS];};static struct Qdisc *prio_classify(struct sk_buff *skb, struct Qdisc *sch, int *qerr){	struct prio_sched_data *q = qdisc_priv(sch);	u32 band = skb->priority;	struct tcf_result res;	struct tcf_proto *fl;	int err;	*qerr = NET_XMIT_SUCCESS | __NET_XMIT_BYPASS;	if (TC_H_MAJ(skb->priority) != sch->handle) {		fl = rcu_dereference_bh(q->filter_list);		err = tcf_classify(skb, fl, &res, false);#ifdef CONFIG_NET_CLS_ACT		switch (err) {		case TC_ACT_STOLEN:		case TC_ACT_QUEUED:		case TC_ACT_TRAP:			*qerr = NET_XMIT_SUCCESS | __NET_XMIT_STOLEN;			/* fall through */		case TC_ACT_SHOT:			return NULL;		}#endif		if (!fl || err < 0) {			if (TC_H_MAJ(band))				band = 0;			return q->queues[q->prio2band[band & TC_PRIO_MAX]];		}		band = res.classid;	}	band = TC_H_MIN(band) - 1;	if (band >= q->bands)		return q->queues[q->prio2band[0]];	return q->queues[band];}static intprio_enqueue(struct sk_buff *skb, struct Qdisc *sch, struct sk_buff **to_free){	struct Qdisc *qdisc;	int ret;	qdisc = prio_classify(skb, sch, &ret);#ifdef CONFIG_NET_CLS_ACT	if (qdisc == NULL) {		if (ret & __NET_XMIT_BYPASS)			qdisc_qstats_drop(sch);		__qdisc_drop(skb, to_free);		return ret;	}#endif	ret = qdisc_enqueue(skb, qdisc, to_free);	if (ret == NET_XMIT_SUCCESS) {		qdisc_qstats_backlog_inc(sch, skb);		sch->q.qlen++;		return NET_XMIT_SUCCESS;	}	if (net_xmit_drop_count(ret))		qdisc_qstats_drop(sch);	return ret;}static struct sk_buff *prio_peek(struct Qdisc *sch){	struct prio_sched_data *q = qdisc_priv(sch);	int prio;	for (prio = 0; prio < q->bands; prio++) {		struct Qdisc *qdisc = q->queues[prio];		struct sk_buff *skb = qdisc->ops->peek(qdisc);		if (skb)			return skb;	}	return NULL;}static struct sk_buff *prio_dequeue(struct Qdisc *sch){	struct prio_sched_data *q = qdisc_priv(sch);	int prio;	for (prio = 0; prio < q->bands; prio++) {		struct Qdisc *qdisc = q->queues[prio];		struct sk_buff *skb = qdisc_dequeue_peeked(qdisc);		if (skb) {			qdisc_bstats_update(sch, skb);			qdisc_qstats_backlog_dec(sch, skb);			sch->q.qlen--;			return skb;		}	}	return NULL;}static voidprio_reset(struct Qdisc *sch){	int prio;	struct prio_sched_data *q = qdisc_priv(sch);	for (prio = 0; prio < q->bands; prio++)		qdisc_reset(q->queues[prio]);	sch->qstats.backlog = 0;	sch->q.qlen = 0;}static int prio_offload(struct Qdisc *sch, struct tc_prio_qopt *qopt){	struct net_device *dev = qdisc_dev(sch);	struct tc_prio_qopt_offload opt = {		.handle = sch->handle,		.parent = sch->parent,	};	if (!tc_can_offload(dev) || !dev->netdev_ops->ndo_setup_tc)		return -EOPNOTSUPP;	if (qopt) {		opt.command = TC_PRIO_REPLACE;		opt.replace_params.bands = qopt->bands;		memcpy(&opt.replace_params.priomap, qopt->priomap,		       TC_PRIO_MAX + 1);		opt.replace_params.qstats = &sch->qstats;	} else {		opt.command = TC_PRIO_DESTROY;	}	return dev->netdev_ops->ndo_setup_tc(dev, TC_SETUP_QDISC_PRIO, &opt);}static voidprio_destroy(struct Qdisc *sch){	int prio;	struct prio_sched_data *q = qdisc_priv(sch);	tcf_block_put(q->block);	prio_offload(sch, NULL);	for (prio = 0; prio < q->bands; prio++)		qdisc_destroy(q->queues[prio]);}static int prio_tune(struct Qdisc *sch, struct nlattr *opt,		     struct netlink_ext_ack *extack){	struct prio_sched_data *q = qdisc_priv(sch);	struct Qdisc *queues[TCQ_PRIO_BANDS];	int oldbands = q->bands, i;	struct tc_prio_qopt *qopt;	if (nla_len(opt) < sizeof(*qopt))		return -EINVAL;	qopt = nla_data(opt);	if (qopt->bands > TCQ_PRIO_BANDS || qopt->bands < 2)		return -EINVAL;	for (i = 0; i <= TC_PRIO_MAX; i++) {		if (qopt->priomap[i] >= qopt->bands)			return -EINVAL;	}	/* Before commit, make sure we can allocate all new qdiscs */	for (i = oldbands; i < qopt->bands; i++) {		queues[i] = qdisc_create_dflt(sch->dev_queue, &pfifo_qdisc_ops,					      TC_H_MAKE(sch->handle, i + 1),					      extack);		if (!queues[i]) {			while (i > oldbands)				qdisc_destroy(queues[--i]);			return -ENOMEM;		}	}	prio_offload(sch, qopt);	sch_tree_lock(sch);	q->bands = qopt->bands;	memcpy(q->prio2band, qopt->priomap, TC_PRIO_MAX+1);	for (i = q->bands; i < oldbands; i++) {		struct Qdisc *child = q->queues[i];		qdisc_tree_reduce_backlog(child, child->q.qlen,					  child->qstats.backlog);		qdisc_destroy(child);	}	for (i = oldbands; i < q->bands; i++) {		q->queues[i] = queues[i];		if (q->queues[i] != &noop_qdisc)			qdisc_hash_add(q->queues[i], true);	}	sch_tree_unlock(sch);	return 0;}static int prio_init(struct Qdisc *sch, struct nlattr *opt,		     struct netlink_ext_ack *extack){	struct prio_sched_data *q = qdisc_priv(sch);	int err;	if (!opt)		return -EINVAL;	err = tcf_block_get(&q->block, &q->filter_list, sch, extack);	if (err)		return err;	return prio_tune(sch, opt, extack);}static int prio_dump_offload(struct Qdisc *sch){	struct net_device *dev = qdisc_dev(sch);	struct tc_prio_qopt_offload hw_stats = {		.command = TC_PRIO_STATS,		.handle = sch->handle,		.parent = sch->parent,		{			.stats = {				.bstats = &sch->bstats,				.qstats = &sch->qstats,			},		},	};	int err;	sch->flags &= ~TCQ_F_OFFLOADED;	if (!tc_can_offload(dev) || !dev->netdev_ops->ndo_setup_tc)		return 0;	err = dev->netdev_ops->ndo_setup_tc(dev, TC_SETUP_QDISC_PRIO,					    &hw_stats);	if (err == -EOPNOTSUPP)		return 0;	if (!err)		sch->flags |= TCQ_F_OFFLOADED;	return err;}static int prio_dump(struct Qdisc *sch, struct sk_buff *skb){	struct prio_sched_data *q = qdisc_priv(sch);	unsigned char *b = skb_tail_pointer(skb);	struct tc_prio_qopt opt;	int err;	opt.bands = q->bands;	memcpy(&opt.priomap, q->prio2band, TC_PRIO_MAX + 1);	err = prio_dump_offload(sch);	if (err)		goto nla_put_failure;	if (nla_put(skb, TCA_OPTIONS, sizeof(opt), &opt))		goto nla_put_failure;	return skb->len;nla_put_failure:	nlmsg_trim(skb, b);	return -1;}static int prio_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,		      struct Qdisc **old, struct netlink_ext_ack *extack){	struct prio_sched_data *q = qdisc_priv(sch);	struct tc_prio_qopt_offload graft_offload;	struct net_device *dev = qdisc_dev(sch);	unsigned long band = arg - 1;	bool any_qdisc_is_offloaded;	int err;	if (!new) {		new = qdisc_create_dflt(sch->dev_queue, &pfifo_qdisc_ops,					TC_H_MAKE(sch->handle, arg), extack);		if (!new)			new = &noop_qdisc;		else			qdisc_hash_add(new, true);	}	*old = qdisc_replace(sch, new, &q->queues[band]);	if (!tc_can_offload(dev))		return 0;	graft_offload.handle = sch->handle;	graft_offload.parent = sch->parent;	graft_offload.graft_params.band = band;	graft_offload.graft_params.child_handle = new->handle;	graft_offload.command = TC_PRIO_GRAFT;	err = dev->netdev_ops->ndo_setup_tc(dev, TC_SETUP_QDISC_PRIO,					    &graft_offload);	/* Don't report error if the graft is part of destroy operation. */	if (err && new != &noop_qdisc) {		/* Don't report error if the parent, the old child and the new		 * one are not offloaded.		 */		any_qdisc_is_offloaded = sch->flags & TCQ_F_OFFLOADED;		any_qdisc_is_offloaded |= new->flags & TCQ_F_OFFLOADED;		if (*old)			any_qdisc_is_offloaded |= (*old)->flags &						   TCQ_F_OFFLOADED;		if (any_qdisc_is_offloaded)			NL_SET_ERR_MSG(extack, "Offloading graft operation failed.");	}	return 0;}static struct Qdisc *prio_leaf(struct Qdisc *sch, unsigned long arg){	struct prio_sched_data *q = qdisc_priv(sch);	unsigned long band = arg - 1;	return q->queues[band];}static unsigned long prio_find(struct Qdisc *sch, u32 classid){	struct prio_sched_data *q = qdisc_priv(sch);	unsigned long band = TC_H_MIN(classid);	if (band - 1 >= q->bands)		return 0;	return band;}static unsigned long prio_bind(struct Qdisc *sch, unsigned long parent, u32 classid){	return prio_find(sch, classid);}static void prio_unbind(struct Qdisc *q, unsigned long cl){}static int prio_dump_class(struct Qdisc *sch, unsigned long cl, struct sk_buff *skb,			   struct tcmsg *tcm){	struct prio_sched_data *q = qdisc_priv(sch);	tcm->tcm_handle |= TC_H_MIN(cl);	tcm->tcm_info = q->queues[cl-1]->handle;	return 0;}static int prio_dump_class_stats(struct Qdisc *sch, unsigned long cl,				 struct gnet_dump *d){	struct prio_sched_data *q = qdisc_priv(sch);	struct Qdisc *cl_q;	cl_q = q->queues[cl - 1];	if (gnet_stats_copy_basic(qdisc_root_sleeping_running(sch),				  d, cl_q->cpu_bstats, &cl_q->bstats) < 0 ||	    gnet_stats_copy_queue(d, NULL, &cl_q->qstats, cl_q->q.qlen) < 0)		return -1;	return 0;}static void prio_walk(struct Qdisc *sch, struct qdisc_walker *arg){	struct prio_sched_data *q = qdisc_priv(sch);	int prio;	if (arg->stop)		return;	for (prio = 0; prio < q->bands; prio++) {		if (arg->count < arg->skip) {			arg->count++;			continue;		}		if (arg->fn(sch, prio + 1, arg) < 0) {			arg->stop = 1;			break;		}		arg->count++;	}}static struct tcf_block *prio_tcf_block(struct Qdisc *sch, unsigned long cl,					struct netlink_ext_ack *extack){	struct prio_sched_data *q = qdisc_priv(sch);	if (cl)		return NULL;	return q->block;}static const struct Qdisc_class_ops prio_class_ops = {	.graft		=	prio_graft,	.leaf		=	prio_leaf,	.find		=	prio_find,	.walk		=	prio_walk,	.tcf_block	=	prio_tcf_block,	.bind_tcf	=	prio_bind,	.unbind_tcf	=	prio_unbind,	.dump		=	prio_dump_class,	.dump_stats	=	prio_dump_class_stats,};static struct Qdisc_ops prio_qdisc_ops __read_mostly = {	.next		=	NULL,	.cl_ops		=	&prio_class_ops,	.id		=	"prio",	.priv_size	=	sizeof(struct prio_sched_data),	.enqueue	=	prio_enqueue,	.dequeue	=	prio_dequeue,	.peek		=	prio_peek,	.init		=	prio_init,	.reset		=	prio_reset,	.destroy	=	prio_destroy,	.change		=	prio_tune,	.dump		=	prio_dump,	.owner		=	THIS_MODULE,};static int __init prio_module_init(void){	return register_qdisc(&prio_qdisc_ops);}static void __exit prio_module_exit(void){	unregister_qdisc(&prio_qdisc_ops);}module_init(prio_module_init)module_exit(prio_module_exit)MODULE_LICENSE("GPL");
 |