pkt_sched: Fix qdisc list locking

Since some qdiscs call qdisc_tree_decrease_qlen() (and therefore
qdisc_lookup()) without holding rtnl_lock(), adding to and deleting from
a qdisc list needs additional locking. This patch adds a global spinlock,
qdisc_list_lock, and wrapper functions for modifying the list. It is
considered a temporary solution until hfsc_dequeue(), netem_dequeue() and
tbf_dequeue() (or qdisc_tree_decrease_qlen()) are redone.

With feedback from Herbert Xu and David S. Miller.

Signed-off-by: Jarek Poplawski <jarkao2@gmail.com>
Acked-by: Herbert Xu <herbert@gondor.apana.org.au>
Signed-off-by: David S. Miller <davem@davemloft.net>

authored by Jarek Poplawski and committed by David S. Miller f6e0b239 2540e051

+42 -8
+1
include/net/pkt_sched.h
··· 78 79 extern int register_qdisc(struct Qdisc_ops *qops); 80 extern int unregister_qdisc(struct Qdisc_ops *qops); 81 extern struct Qdisc *qdisc_lookup(struct net_device *dev, u32 handle); 82 extern struct Qdisc *qdisc_lookup_class(struct net_device *dev, u32 handle); 83 extern struct qdisc_rate_table *qdisc_get_rtab(struct tc_ratespec *r,
··· 78 79 extern int register_qdisc(struct Qdisc_ops *qops); 80 extern int unregister_qdisc(struct Qdisc_ops *qops); 81 + extern void qdisc_list_del(struct Qdisc *q); 82 extern struct Qdisc *qdisc_lookup(struct net_device *dev, u32 handle); 83 extern struct Qdisc *qdisc_lookup_class(struct net_device *dev, u32 handle); 84 extern struct qdisc_rate_table *qdisc_get_rtab(struct tc_ratespec *r,
+39 -5
net/sched/sch_api.c
··· 199 return NULL; 200 } 201 202 struct Qdisc *qdisc_lookup(struct net_device *dev, u32 handle) 203 { 204 unsigned int i; 205 206 for (i = 0; i < dev->num_tx_queues; i++) { 207 struct netdev_queue *txq = netdev_get_tx_queue(dev, i); 208 - struct Qdisc *q, *txq_root = txq->qdisc_sleeping; 209 210 q = qdisc_match_from_root(txq_root, handle); 211 if (q) 212 - return q; 213 } 214 - return qdisc_match_from_root(dev->rx_queue.qdisc_sleeping, handle); 215 } 216 217 static struct Qdisc *qdisc_leaf(struct Qdisc *p, u32 classid) ··· 844 goto err_out3; 845 } 846 } 847 - if ((parent != TC_H_ROOT) && !(sch->flags & TCQ_F_INGRESS)) 848 - list_add_tail(&sch->list, &dev_queue->qdisc_sleeping->list); 849 850 return sch; 851 }
··· 199 return NULL; 200 } 201 202 + /* 203 + * This lock is needed until some qdiscs stop calling qdisc_tree_decrease_qlen() 204 + * without rtnl_lock(); currently hfsc_dequeue(), netem_dequeue(), tbf_dequeue() 205 + */ 206 + static DEFINE_SPINLOCK(qdisc_list_lock); 207 + 208 + static void qdisc_list_add(struct Qdisc *q) 209 + { 210 + if ((q->parent != TC_H_ROOT) && !(q->flags & TCQ_F_INGRESS)) { 211 + spin_lock_bh(&qdisc_list_lock); 212 + list_add_tail(&q->list, &qdisc_root_sleeping(q)->list); 213 + spin_unlock_bh(&qdisc_list_lock); 214 + } 215 + } 216 + 217 + void qdisc_list_del(struct Qdisc *q) 218 + { 219 + if ((q->parent != TC_H_ROOT) && !(q->flags & TCQ_F_INGRESS)) { 220 + spin_lock_bh(&qdisc_list_lock); 221 + list_del(&q->list); 222 + spin_unlock_bh(&qdisc_list_lock); 223 + } 224 + } 225 + EXPORT_SYMBOL(qdisc_list_del); 226 + 227 struct Qdisc *qdisc_lookup(struct net_device *dev, u32 handle) 228 { 229 unsigned int i; 230 + struct Qdisc *q; 231 + 232 + spin_lock_bh(&qdisc_list_lock); 233 234 for (i = 0; i < dev->num_tx_queues; i++) { 235 struct netdev_queue *txq = netdev_get_tx_queue(dev, i); 236 + struct Qdisc *txq_root = txq->qdisc_sleeping; 237 238 q = qdisc_match_from_root(txq_root, handle); 239 if (q) 240 + goto unlock; 241 } 242 + 243 + q = qdisc_match_from_root(dev->rx_queue.qdisc_sleeping, handle); 244 + 245 + unlock: 246 + spin_unlock_bh(&qdisc_list_lock); 247 + 248 + return q; 249 } 250 251 static struct Qdisc *qdisc_leaf(struct Qdisc *p, u32 classid) ··· 810 goto err_out3; 811 } 812 } 813 + 814 + qdisc_list_add(sch); 815 816 return sch; 817 }
+2 -3
net/sched/sch_generic.c
··· 526 !atomic_dec_and_test(&qdisc->refcnt)) 527 return; 528 529 - if (qdisc->parent) 530 - list_del(&qdisc->list); 531 - 532 #ifdef CONFIG_NET_SCHED 533 qdisc_put_stab(qdisc->stab); 534 #endif 535 gen_kill_estimator(&qdisc->bstats, &qdisc->rate_est);
··· 526 !atomic_dec_and_test(&qdisc->refcnt)) 527 return; 528 529 #ifdef CONFIG_NET_SCHED 530 + qdisc_list_del(qdisc); 531 + 532 qdisc_put_stab(qdisc->stab); 533 #endif 534 gen_kill_estimator(&qdisc->bstats, &qdisc->rate_est);