net: sched: avoid unnecessary seqcount operation for lockless qdisc
[linux-block.git] / include / net / sch_generic.h
/* SPDX-License-Identifier: GPL-2.0 */
#ifndef __NET_SCHED_GENERIC_H
#define __NET_SCHED_GENERIC_H

#include <linux/netdevice.h>
#include <linux/types.h>
#include <linux/rcupdate.h>
#include <linux/pkt_sched.h>
#include <linux/pkt_cls.h>
#include <linux/percpu.h>
#include <linux/dynamic_queue_limits.h>
#include <linux/list.h>
#include <linux/refcount.h>
#include <linux/workqueue.h>
#include <linux/mutex.h>
#include <linux/rwsem.h>
#include <linux/atomic.h>
#include <linux/hashtable.h>
#include <net/gen_stats.h>
#include <net/rtnetlink.h>
#include <net/flow_offload.h>

struct Qdisc_ops;
struct qdisc_walker;
struct tcf_walker;
struct module;
struct bpf_flow_keys;

struct qdisc_rate_table {
	struct tc_ratespec	rate;
	u32			data[256];
	struct qdisc_rate_table *next;
	int			refcnt;
};

enum qdisc_state_t {
	__QDISC_STATE_SCHED,
	__QDISC_STATE_DEACTIVATED,
	__QDISC_STATE_MISSED,
};

struct qdisc_size_table {
	struct rcu_head		rcu;
	struct list_head	list;
	struct tc_sizespec	szopts;
	int			refcnt;
	u16			data[];
};

/* similar to sk_buff_head, but skb->prev pointer is undefined. */
struct qdisc_skb_head {
	struct sk_buff	*head;
	struct sk_buff	*tail;
	__u32		qlen;
	spinlock_t	lock;
};

struct Qdisc {
	int 			(*enqueue)(struct sk_buff *skb,
					   struct Qdisc *sch,
					   struct sk_buff **to_free);
	struct sk_buff *	(*dequeue)(struct Qdisc *sch);
	unsigned int		flags;
#define TCQ_F_BUILTIN		1
#define TCQ_F_INGRESS		2
#define TCQ_F_CAN_BYPASS	4
#define TCQ_F_MQROOT		8
#define TCQ_F_ONETXQUEUE	0x10 /* dequeue_skb() can assume all skbs are for
				      * q->dev_queue : It can test
				      * netif_xmit_frozen_or_stopped() before
				      * dequeueing the next packet.
				      * It's true for MQ/MQPRIO slaves, or a
				      * non-multiqueue device.
				      */
#define TCQ_F_WARN_NONWC	(1 << 16)
#define TCQ_F_CPUSTATS		0x20 /* run using percpu statistics */
#define TCQ_F_NOPARENT		0x40 /* root of its hierarchy :
				      * qdisc_tree_decrease_qlen() should stop.
				      */
#define TCQ_F_INVISIBLE		0x80 /* invisible by default in dump */
#define TCQ_F_NOLOCK		0x100 /* qdisc does not require locking */
#define TCQ_F_OFFLOADED		0x200 /* qdisc is offloaded to HW */
	u32			limit;
	const struct Qdisc_ops	*ops;
	struct qdisc_size_table	__rcu *stab;
	struct hlist_node	hash;
	u32			handle;
	u32			parent;

	struct netdev_queue	*dev_queue;

	struct net_rate_estimator __rcu *rate_est;
	struct gnet_stats_basic_cpu __percpu *cpu_bstats;
	struct gnet_stats_queue	__percpu *cpu_qstats;
	int			pad;
	refcount_t		refcnt;

	/*
	 * For performance's sake on SMP, we put highly modified fields at the end
	 */
	struct sk_buff_head	gso_skb ____cacheline_aligned_in_smp;
	struct qdisc_skb_head	q;
	struct gnet_stats_basic_packed bstats;
	seqcount_t		running;
	struct gnet_stats_queue	qstats;
	unsigned long		state;
	struct Qdisc		*next_sched;
	struct sk_buff_head	skb_bad_txq;

	spinlock_t		busylock ____cacheline_aligned_in_smp;
	spinlock_t		seqlock;

	/* for NOLOCK qdisc, true if there are no enqueued skbs */
	bool			empty;
	struct rcu_head		rcu;

	/* private data */
	long privdata[] ____cacheline_aligned;
};


static inline void qdisc_refcount_inc(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_BUILTIN)
		return;
	refcount_inc(&qdisc->refcnt);
}

/* Intended to be used by unlocked users, when concurrent qdisc release is
 * possible.
 */

static inline struct Qdisc *qdisc_refcount_inc_nz(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_BUILTIN)
		return qdisc;
	if (refcount_inc_not_zero(&qdisc->refcnt))
		return qdisc;
	return NULL;
}
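
/* Illustrative sketch only: a typical unlocked user bumps the refcount
 * under rcu_read_lock() so the qdisc cannot be freed between lookup and
 * the refcount increment. lookup_qdisc_rcu() is a hypothetical helper
 * standing in for whatever RCU-safe lookup the caller uses:
 *
 *	rcu_read_lock();
 *	q = lookup_qdisc_rcu(dev, handle);
 *	if (q)
 *		q = qdisc_refcount_inc_nz(q);
 *	rcu_read_unlock();
 *	if (q) {
 *		... use q ...
 *		qdisc_put(q);
 *	}
 */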

static inline bool qdisc_is_running(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_NOLOCK)
		return spin_is_locked(&qdisc->seqlock);
	return (raw_read_seqcount(&qdisc->running) & 1) ? true : false;
}

static inline bool qdisc_is_percpu_stats(const struct Qdisc *q)
{
	return q->flags & TCQ_F_CPUSTATS;
}

static inline bool qdisc_is_empty(const struct Qdisc *qdisc)
{
	if (qdisc_is_percpu_stats(qdisc))
		return READ_ONCE(qdisc->empty);
	return !READ_ONCE(qdisc->q.qlen);
}

static inline bool qdisc_run_begin(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_NOLOCK) {
		if (spin_trylock(&qdisc->seqlock))
			goto nolock_empty;

		/* If the MISSED flag is set, it means another thread has
		 * set the MISSED flag before the second spin_trylock(), so
		 * we can return false here to avoid multiple cpus doing
		 * the set_bit() and second spin_trylock() concurrently.
		 */
		if (test_bit(__QDISC_STATE_MISSED, &qdisc->state))
			return false;

		/* Set the MISSED flag before the second spin_trylock();
		 * if the second spin_trylock() returns false, it means
		 * another cpu holding the lock will do the dequeuing for us,
		 * or it will see the MISSED flag set after releasing the
		 * lock and reschedule the net_tx_action() to do the
		 * dequeuing.
		 */
		set_bit(__QDISC_STATE_MISSED, &qdisc->state);

		/* Retry again in case the other CPU may not see the new flag
		 * after it releases the lock at the end of qdisc_run_end().
		 */
		if (!spin_trylock(&qdisc->seqlock))
			return false;

nolock_empty:
		WRITE_ONCE(qdisc->empty, false);
		return true;
	} else if (qdisc_is_running(qdisc)) {
		return false;
	}
	/* Variant of write_seqcount_begin() telling lockdep a trylock
	 * was attempted.
	 */
	raw_write_seqcount_begin(&qdisc->running);
	seqcount_acquire(&qdisc->running.dep_map, 0, 1, _RET_IP_);
	return true;
}

static inline void qdisc_run_end(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_NOLOCK) {
		spin_unlock(&qdisc->seqlock);

		if (unlikely(test_bit(__QDISC_STATE_MISSED,
				      &qdisc->state))) {
			clear_bit(__QDISC_STATE_MISSED, &qdisc->state);
			__netif_schedule(qdisc);
		}
	} else {
		write_seqcount_end(&qdisc->running);
	}
}
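
/* Outline of the begin/end pairing on the caller side (the real helper
 * lives in include/net/pkt_sched.h; this is only a sketch):
 *
 *	if (qdisc_run_begin(q)) {
 *		__qdisc_run(q);		// dequeue and transmit packets
 *		qdisc_run_end(q);
 *	}
 *
 * Whoever wins qdisc_run_begin() owns the dequeue path; losers either rely
 * on the winner or set __QDISC_STATE_MISSED so the qdisc gets rescheduled.
 */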

static inline bool qdisc_may_bulk(const struct Qdisc *qdisc)
{
	return qdisc->flags & TCQ_F_ONETXQUEUE;
}

static inline int qdisc_avail_bulklimit(const struct netdev_queue *txq)
{
#ifdef CONFIG_BQL
	/* Non-BQL migrated drivers will return 0, too. */
	return dql_avail(&txq->dql);
#else
	return 0;
#endif
}
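
/* Illustrative only: the dequeue path in net/sched/sch_generic.c combines
 * these two helpers roughly as follows (names and details simplified):
 *
 *	if (qdisc_may_bulk(q))
 *		bulk_dequeue(q, skb, txq);
 *
 * where the bulk loop keeps chaining skbs while qdisc_avail_bulklimit(txq)
 * reports spare BQL budget, so one driver TX call can send several packets
 * without retaking the qdisc.
 */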

struct Qdisc_class_ops {
	unsigned int		flags;
	/* Child qdisc manipulation */
	struct netdev_queue *	(*select_queue)(struct Qdisc *, struct tcmsg *);
	int			(*graft)(struct Qdisc *, unsigned long cl,
					 struct Qdisc *, struct Qdisc **,
					 struct netlink_ext_ack *extack);
	struct Qdisc *		(*leaf)(struct Qdisc *, unsigned long cl);
	void			(*qlen_notify)(struct Qdisc *, unsigned long);

	/* Class manipulation routines */
	unsigned long		(*find)(struct Qdisc *, u32 classid);
	int			(*change)(struct Qdisc *, u32, u32,
					  struct nlattr **, unsigned long *,
					  struct netlink_ext_ack *);
	int			(*delete)(struct Qdisc *, unsigned long,
					  struct netlink_ext_ack *);
	void			(*walk)(struct Qdisc *, struct qdisc_walker *arg);

	/* Filter manipulation */
	struct tcf_block *	(*tcf_block)(struct Qdisc *sch,
					     unsigned long arg,
					     struct netlink_ext_ack *extack);
	unsigned long		(*bind_tcf)(struct Qdisc *, unsigned long,
					    u32 classid);
	void			(*unbind_tcf)(struct Qdisc *, unsigned long);

	/* rtnetlink specific */
	int			(*dump)(struct Qdisc *, unsigned long,
					struct sk_buff *skb, struct tcmsg *);
	int			(*dump_stats)(struct Qdisc *, unsigned long,
					      struct gnet_dump *);
};

/* Qdisc_class_ops flag values */

/* Implements API that doesn't require rtnl lock */
enum qdisc_class_ops_flags {
	QDISC_CLASS_OPS_DOIT_UNLOCKED = 1,
};

struct Qdisc_ops {
	struct Qdisc_ops	*next;
	const struct Qdisc_class_ops	*cl_ops;
	char			id[IFNAMSIZ];
	int			priv_size;
	unsigned int		static_flags;

	int 			(*enqueue)(struct sk_buff *skb,
					   struct Qdisc *sch,
					   struct sk_buff **to_free);
	struct sk_buff *	(*dequeue)(struct Qdisc *);
	struct sk_buff *	(*peek)(struct Qdisc *);

	int			(*init)(struct Qdisc *sch, struct nlattr *arg,
					struct netlink_ext_ack *extack);
	void			(*reset)(struct Qdisc *);
	void			(*destroy)(struct Qdisc *);
	int			(*change)(struct Qdisc *sch,
					  struct nlattr *arg,
					  struct netlink_ext_ack *extack);
	void			(*attach)(struct Qdisc *sch);
	int			(*change_tx_queue_len)(struct Qdisc *, unsigned int);

	int			(*dump)(struct Qdisc *, struct sk_buff *);
	int			(*dump_stats)(struct Qdisc *, struct gnet_dump *);

	void			(*ingress_block_set)(struct Qdisc *sch,
						     u32 block_index);
	void			(*egress_block_set)(struct Qdisc *sch,
						    u32 block_index);
	u32			(*ingress_block_get)(struct Qdisc *sch);
	u32			(*egress_block_get)(struct Qdisc *sch);

	struct module		*owner;
};


struct tcf_result {
	union {
		struct {
			unsigned long	class;
			u32		classid;
		};
		const struct tcf_proto *goto_tp;

		/* used in the skb_tc_reinsert function */
		struct {
			bool		ingress;
			struct gnet_stats_queue *qstats;
		};
	};
};

struct tcf_chain;

struct tcf_proto_ops {
	struct list_head	head;
	char			kind[IFNAMSIZ];

	int			(*classify)(struct sk_buff *,
					    const struct tcf_proto *,
					    struct tcf_result *);
	int			(*init)(struct tcf_proto *);
	void			(*destroy)(struct tcf_proto *tp, bool rtnl_held,
					   struct netlink_ext_ack *extack);

	void *			(*get)(struct tcf_proto *, u32 handle);
	void			(*put)(struct tcf_proto *tp, void *f);
	int			(*change)(struct net *net, struct sk_buff *,
					  struct tcf_proto *, unsigned long,
					  u32 handle, struct nlattr **,
					  void **, bool, bool,
					  struct netlink_ext_ack *);
	int			(*delete)(struct tcf_proto *tp, void *arg,
					  bool *last, bool rtnl_held,
					  struct netlink_ext_ack *);
	bool			(*delete_empty)(struct tcf_proto *tp);
	void			(*walk)(struct tcf_proto *tp,
					struct tcf_walker *arg, bool rtnl_held);
	int			(*reoffload)(struct tcf_proto *tp, bool add,
					     flow_setup_cb_t *cb, void *cb_priv,
					     struct netlink_ext_ack *extack);
	void			(*hw_add)(struct tcf_proto *tp,
					  void *type_data);
	void			(*hw_del)(struct tcf_proto *tp,
					  void *type_data);
	void			(*bind_class)(void *, u32, unsigned long,
					      void *, unsigned long);
	void *			(*tmplt_create)(struct net *net,
						struct tcf_chain *chain,
						struct nlattr **tca,
						struct netlink_ext_ack *extack);
	void			(*tmplt_destroy)(void *tmplt_priv);

	/* rtnetlink specific */
	int			(*dump)(struct net *, struct tcf_proto *, void *,
					struct sk_buff *skb, struct tcmsg *,
					bool);
	int			(*terse_dump)(struct net *net,
					      struct tcf_proto *tp, void *fh,
					      struct sk_buff *skb,
					      struct tcmsg *t, bool rtnl_held);
	int			(*tmplt_dump)(struct sk_buff *skb,
					      struct net *net,
					      void *tmplt_priv);

	struct module		*owner;
	int			flags;
};

/* Classifiers setting TCF_PROTO_OPS_DOIT_UNLOCKED in tcf_proto_ops->flags
 * are expected to implement tcf_proto_ops->delete_empty(), otherwise race
 * conditions can occur when filters are inserted/deleted simultaneously.
 */
enum tcf_proto_ops_flags {
	TCF_PROTO_OPS_DOIT_UNLOCKED = 1,
};

struct tcf_proto {
	/* Fast access part */
	struct tcf_proto __rcu	*next;
	void __rcu		*root;

	/* called under RCU BH lock */
	int			(*classify)(struct sk_buff *,
					    const struct tcf_proto *,
					    struct tcf_result *);
	__be16			protocol;

	/* All the rest */
	u32			prio;
	void			*data;
	const struct tcf_proto_ops	*ops;
	struct tcf_chain	*chain;
	/* Lock protects tcf_proto shared state and can be used by unlocked
	 * classifiers to protect their private data.
	 */
	spinlock_t		lock;
	bool			deleting;
	refcount_t		refcnt;
	struct rcu_head		rcu;
	struct hlist_node	destroy_ht_node;
};

struct qdisc_skb_cb {
	struct {
		unsigned int		pkt_len;
		u16			slave_dev_queue_mapping;
		u16			tc_classid;
	};
#define QDISC_CB_PRIV_LEN 20
	unsigned char		data[QDISC_CB_PRIV_LEN];
	u16			mru;
	bool			post_ct;
};

typedef void tcf_chain_head_change_t(struct tcf_proto *tp_head, void *priv);

struct tcf_chain {
	/* Protects filter_chain. */
	struct mutex filter_chain_lock;
	struct tcf_proto __rcu *filter_chain;
	struct list_head list;
	struct tcf_block *block;
	u32 index; /* chain index */
	unsigned int refcnt;
	unsigned int action_refcnt;
	bool explicitly_created;
	bool flushing;
	const struct tcf_proto_ops *tmplt_ops;
	void *tmplt_priv;
	struct rcu_head rcu;
};

struct tcf_block {
	/* Lock protects tcf_block and lifetime-management data of chains
	 * attached to the block (refcnt, action_refcnt, explicitly_created).
	 */
	struct mutex lock;
	struct list_head chain_list;
	u32 index; /* block index for shared blocks */
	u32 classid; /* which class this block belongs to */
	refcount_t refcnt;
	struct net *net;
	struct Qdisc *q;
	struct rw_semaphore cb_lock; /* protects cb_list and offload counters */
	struct flow_block flow_block;
	struct list_head owner_list;
	bool keep_dst;
	atomic_t offloadcnt; /* Number of offloaded filters */
	unsigned int nooffloaddevcnt; /* Number of devs unable to do offload */
	unsigned int lockeddevcnt; /* Number of devs that require rtnl lock. */
	struct {
		struct tcf_chain *chain;
		struct list_head filter_chain_list;
	} chain0;
	struct rcu_head rcu;
	DECLARE_HASHTABLE(proto_destroy_ht, 7);
	struct mutex proto_destroy_lock; /* Lock for proto_destroy hashtable. */
};

static inline bool lockdep_tcf_chain_is_locked(struct tcf_chain *chain)
{
	return lockdep_is_held(&chain->filter_chain_lock);
}

static inline bool lockdep_tcf_proto_is_locked(struct tcf_proto *tp)
{
	return lockdep_is_held(&tp->lock);
}

#define tcf_chain_dereference(p, chain) \
	rcu_dereference_protected(p, lockdep_tcf_chain_is_locked(chain))

#define tcf_proto_dereference(p, tp) \
	rcu_dereference_protected(p, lockdep_tcf_proto_is_locked(tp))

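/* Illustrative sketch: walking the filter chain with the chain mutex held,
 * so tcf_chain_dereference() can legitimately vouch for the access:
 *
 *	mutex_lock(&chain->filter_chain_lock);
 *	for (tp = tcf_chain_dereference(chain->filter_chain, chain);
 *	     tp; tp = tcf_chain_dereference(tp->next, chain))
 *		... inspect tp ...
 *	mutex_unlock(&chain->filter_chain_lock);
 */
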
static inline void qdisc_cb_private_validate(const struct sk_buff *skb, int sz)
{
	struct qdisc_skb_cb *qcb;

	BUILD_BUG_ON(sizeof(skb->cb) < sizeof(*qcb));
	BUILD_BUG_ON(sizeof(qcb->data) < sz);
}
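
/* Illustrative sketch: how a qdisc typically carves its private per-skb
 * state out of qdisc_skb_cb::data. The struct and helper names below are
 * hypothetical (netem uses this exact pattern with its own names):
 *
 *	struct example_skb_cb {
 *		u64 time_to_send;
 *	};
 *
 *	static inline struct example_skb_cb *example_skb_cb(struct sk_buff *skb)
 *	{
 *		qdisc_cb_private_validate(skb, sizeof(struct example_skb_cb));
 *		return (struct example_skb_cb *)qdisc_skb_cb(skb)->data;
 *	}
 *
 * The BUILD_BUG_ONs fire at compile time if the private state outgrows the
 * QDISC_CB_PRIV_LEN bytes reserved in the cb.
 */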

static inline int qdisc_qlen_cpu(const struct Qdisc *q)
{
	return this_cpu_ptr(q->cpu_qstats)->qlen;
}

static inline int qdisc_qlen(const struct Qdisc *q)
{
	return q->q.qlen;
}

static inline int qdisc_qlen_sum(const struct Qdisc *q)
{
	__u32 qlen = q->qstats.qlen;
	int i;

	if (qdisc_is_percpu_stats(q)) {
		for_each_possible_cpu(i)
			qlen += per_cpu_ptr(q->cpu_qstats, i)->qlen;
	} else {
		qlen += q->q.qlen;
	}

	return qlen;
}

static inline struct qdisc_skb_cb *qdisc_skb_cb(const struct sk_buff *skb)
{
	return (struct qdisc_skb_cb *)skb->cb;
}

static inline spinlock_t *qdisc_lock(struct Qdisc *qdisc)
{
	return &qdisc->q.lock;
}

static inline struct Qdisc *qdisc_root(const struct Qdisc *qdisc)
{
	struct Qdisc *q = rcu_dereference_rtnl(qdisc->dev_queue->qdisc);

	return q;
}

static inline struct Qdisc *qdisc_root_bh(const struct Qdisc *qdisc)
{
	return rcu_dereference_bh(qdisc->dev_queue->qdisc);
}

static inline struct Qdisc *qdisc_root_sleeping(const struct Qdisc *qdisc)
{
	return qdisc->dev_queue->qdisc_sleeping;
}

/* The qdisc root lock is a mechanism by which the top level
 * of a qdisc tree can be locked from any qdisc node in the
 * forest. This allows changing the configuration of some
 * aspect of the qdisc tree while blocking out asynchronous
 * qdisc access in the packet processing paths.
 *
 * It is only legal to do this when the root will not change
 * on us. Otherwise we'll potentially lock the wrong qdisc
 * root. This is enforced by holding the RTNL semaphore, which
 * all users of this lock accessor must do.
 */
static inline spinlock_t *qdisc_root_lock(const struct Qdisc *qdisc)
{
	struct Qdisc *root = qdisc_root(qdisc);

	ASSERT_RTNL();
	return qdisc_lock(root);
}

static inline spinlock_t *qdisc_root_sleeping_lock(const struct Qdisc *qdisc)
{
	struct Qdisc *root = qdisc_root_sleeping(qdisc);

	ASSERT_RTNL();
	return qdisc_lock(root);
}

static inline seqcount_t *qdisc_root_sleeping_running(const struct Qdisc *qdisc)
{
	struct Qdisc *root = qdisc_root_sleeping(qdisc);

	ASSERT_RTNL();
	return &root->running;
}

static inline struct net_device *qdisc_dev(const struct Qdisc *qdisc)
{
	return qdisc->dev_queue->dev;
}

static inline void sch_tree_lock(struct Qdisc *q)
{
	if (q->flags & TCQ_F_MQROOT)
		spin_lock_bh(qdisc_lock(q));
	else
		spin_lock_bh(qdisc_root_sleeping_lock(q));
}

static inline void sch_tree_unlock(struct Qdisc *q)
{
	if (q->flags & TCQ_F_MQROOT)
		spin_unlock_bh(qdisc_lock(q));
	else
		spin_unlock_bh(qdisc_root_sleeping_lock(q));
}

extern struct Qdisc noop_qdisc;
extern struct Qdisc_ops noop_qdisc_ops;
extern struct Qdisc_ops pfifo_fast_ops;
extern struct Qdisc_ops mq_qdisc_ops;
extern struct Qdisc_ops noqueue_qdisc_ops;
extern const struct Qdisc_ops *default_qdisc_ops;
static inline const struct Qdisc_ops *
get_default_qdisc_ops(const struct net_device *dev, int ntx)
{
	return ntx < dev->real_num_tx_queues ?
		default_qdisc_ops : &pfifo_fast_ops;
}

struct Qdisc_class_common {
	u32			classid;
	struct hlist_node	hnode;
};

struct Qdisc_class_hash {
	struct hlist_head	*hash;
	unsigned int		hashsize;
	unsigned int		hashmask;
	unsigned int		hashelems;
};

static inline unsigned int qdisc_class_hash(u32 id, u32 mask)
{
	id ^= id >> 8;
	id ^= id >> 4;
	return id & mask;
}

static inline struct Qdisc_class_common *
qdisc_class_find(const struct Qdisc_class_hash *hash, u32 id)
{
	struct Qdisc_class_common *cl;
	unsigned int h;

	if (!id)
		return NULL;

	h = qdisc_class_hash(id, hash->hashmask);
	hlist_for_each_entry(cl, &hash->hash[h], hnode) {
		if (cl->classid == id)
			return cl;
	}
	return NULL;
}
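
/* Illustrative sketch: classful qdiscs usually embed Qdisc_class_common at
 * the start of their class struct, so the ->find() op reduces to a hash
 * lookup plus container_of(). Names here are hypothetical; qdisc_priv() is
 * assumed from sch_generic.h:
 *
 *	struct example_class {
 *		struct Qdisc_class_common common;
 *		...
 *	};
 *
 *	static unsigned long example_find(struct Qdisc *sch, u32 classid)
 *	{
 *		struct example_sched *q = qdisc_priv(sch);
 *		struct Qdisc_class_common *clc;
 *
 *		clc = qdisc_class_find(&q->clhash, classid);
 *		if (!clc)
 *			return 0;
 *		return (unsigned long)container_of(clc, struct example_class,
 *						   common);
 *	}
 */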

static inline int tc_classid_to_hwtc(struct net_device *dev, u32 classid)
{
	u32 hwtc = TC_H_MIN(classid) - TC_H_MIN_PRIORITY;

	return (hwtc < netdev_get_num_tc(dev)) ? hwtc : -EINVAL;
}

int qdisc_class_hash_init(struct Qdisc_class_hash *);
void qdisc_class_hash_insert(struct Qdisc_class_hash *,
			     struct Qdisc_class_common *);
void qdisc_class_hash_remove(struct Qdisc_class_hash *,
			     struct Qdisc_class_common *);
void qdisc_class_hash_grow(struct Qdisc *, struct Qdisc_class_hash *);
void qdisc_class_hash_destroy(struct Qdisc_class_hash *);

int dev_qdisc_change_tx_queue_len(struct net_device *dev);
void dev_init_scheduler(struct net_device *dev);
void dev_shutdown(struct net_device *dev);
void dev_activate(struct net_device *dev);
void dev_deactivate(struct net_device *dev);
void dev_deactivate_many(struct list_head *head);
struct Qdisc *dev_graft_qdisc(struct netdev_queue *dev_queue,
			      struct Qdisc *qdisc);
void qdisc_reset(struct Qdisc *qdisc);
void qdisc_put(struct Qdisc *qdisc);
void qdisc_put_unlocked(struct Qdisc *qdisc);
void qdisc_tree_reduce_backlog(struct Qdisc *qdisc, int n, int len);
#ifdef CONFIG_NET_SCHED
int qdisc_offload_dump_helper(struct Qdisc *q, enum tc_setup_type type,
			      void *type_data);
void qdisc_offload_graft_helper(struct net_device *dev, struct Qdisc *sch,
				struct Qdisc *new, struct Qdisc *old,
				enum tc_setup_type type, void *type_data,
				struct netlink_ext_ack *extack);
#else
static inline int
qdisc_offload_dump_helper(struct Qdisc *q, enum tc_setup_type type,
			  void *type_data)
{
	q->flags &= ~TCQ_F_OFFLOADED;
	return 0;
}

static inline void
qdisc_offload_graft_helper(struct net_device *dev, struct Qdisc *sch,
			   struct Qdisc *new, struct Qdisc *old,
			   enum tc_setup_type type, void *type_data,
			   struct netlink_ext_ack *extack)
{
}
#endif
struct Qdisc *qdisc_alloc(struct netdev_queue *dev_queue,
			  const struct Qdisc_ops *ops,
			  struct netlink_ext_ack *extack);
void qdisc_free(struct Qdisc *qdisc);
struct Qdisc *qdisc_create_dflt(struct netdev_queue *dev_queue,
				const struct Qdisc_ops *ops, u32 parentid,
				struct netlink_ext_ack *extack);
void __qdisc_calculate_pkt_len(struct sk_buff *skb,
			       const struct qdisc_size_table *stab);
int skb_do_redirect(struct sk_buff *);

static inline bool skb_at_tc_ingress(const struct sk_buff *skb)
{
#ifdef CONFIG_NET_CLS_ACT
	return skb->tc_at_ingress;
#else
	return false;
#endif
}

static inline bool skb_skip_tc_classify(struct sk_buff *skb)
{
#ifdef CONFIG_NET_CLS_ACT
	if (skb->tc_skip_classify) {
		skb->tc_skip_classify = 0;
		return true;
	}
#endif
	return false;
}

/* Reset all TX qdiscs of a device whose queue index is greater than or
 * equal to i.
 */
static inline void qdisc_reset_all_tx_gt(struct net_device *dev, unsigned int i)
{
	struct Qdisc *qdisc;

	for (; i < dev->num_tx_queues; i++) {
		qdisc = rtnl_dereference(netdev_get_tx_queue(dev, i)->qdisc);
		if (qdisc) {
			spin_lock_bh(qdisc_lock(qdisc));
			qdisc_reset(qdisc);
			spin_unlock_bh(qdisc_lock(qdisc));
		}
	}
}

/* Are all TX queues of the device empty? */
static inline bool qdisc_all_tx_empty(const struct net_device *dev)
{
	unsigned int i;

	rcu_read_lock();
	for (i = 0; i < dev->num_tx_queues; i++) {
		struct netdev_queue *txq = netdev_get_tx_queue(dev, i);
		const struct Qdisc *q = rcu_dereference(txq->qdisc);

		if (!qdisc_is_empty(q)) {
			rcu_read_unlock();
			return false;
		}
	}
	rcu_read_unlock();
	return true;
}

/* Are any of the TX qdiscs changing? */
static inline bool qdisc_tx_changing(const struct net_device *dev)
{
	unsigned int i;

	for (i = 0; i < dev->num_tx_queues; i++) {
		struct netdev_queue *txq = netdev_get_tx_queue(dev, i);

		if (rcu_access_pointer(txq->qdisc) != txq->qdisc_sleeping)
			return true;
	}
	return false;
}

/* Is the device using the noop qdisc on all queues? */
static inline bool qdisc_tx_is_noop(const struct net_device *dev)
{
	unsigned int i;

	for (i = 0; i < dev->num_tx_queues; i++) {
		struct netdev_queue *txq = netdev_get_tx_queue(dev, i);

		if (rcu_access_pointer(txq->qdisc) != &noop_qdisc)
			return false;
	}
	return true;
}

static inline unsigned int qdisc_pkt_len(const struct sk_buff *skb)
{
	return qdisc_skb_cb(skb)->pkt_len;
}

/* additional qdisc xmit flags (NET_XMIT_MASK in linux/netdevice.h) */
enum net_xmit_qdisc_t {
	__NET_XMIT_STOLEN = 0x00010000,
	__NET_XMIT_BYPASS = 0x00020000,
};

#ifdef CONFIG_NET_CLS_ACT
#define net_xmit_drop_count(e)	((e) & __NET_XMIT_STOLEN ? 0 : 1)
#else
#define net_xmit_drop_count(e)	(1)
#endif

static inline void qdisc_calculate_pkt_len(struct sk_buff *skb,
					   const struct Qdisc *sch)
{
#ifdef CONFIG_NET_SCHED
	struct qdisc_size_table *stab = rcu_dereference_bh(sch->stab);

	if (stab)
		__qdisc_calculate_pkt_len(skb, stab);
#endif
}

static inline int qdisc_enqueue(struct sk_buff *skb, struct Qdisc *sch,
				struct sk_buff **to_free)
{
	qdisc_calculate_pkt_len(skb, sch);
	return sch->enqueue(skb, sch, to_free);
}

static inline void _bstats_update(struct gnet_stats_basic_packed *bstats,
				  __u64 bytes, __u32 packets)
{
	bstats->bytes += bytes;
	bstats->packets += packets;
}

static inline void bstats_update(struct gnet_stats_basic_packed *bstats,
				 const struct sk_buff *skb)
{
	_bstats_update(bstats,
		       qdisc_pkt_len(skb),
		       skb_is_gso(skb) ? skb_shinfo(skb)->gso_segs : 1);
}

static inline void _bstats_cpu_update(struct gnet_stats_basic_cpu *bstats,
				      __u64 bytes, __u32 packets)
{
	u64_stats_update_begin(&bstats->syncp);
	_bstats_update(&bstats->bstats, bytes, packets);
	u64_stats_update_end(&bstats->syncp);
}

static inline void bstats_cpu_update(struct gnet_stats_basic_cpu *bstats,
				     const struct sk_buff *skb)
{
	u64_stats_update_begin(&bstats->syncp);
	bstats_update(&bstats->bstats, skb);
	u64_stats_update_end(&bstats->syncp);
}

static inline void qdisc_bstats_cpu_update(struct Qdisc *sch,
					   const struct sk_buff *skb)
{
	bstats_cpu_update(this_cpu_ptr(sch->cpu_bstats), skb);
}

static inline void qdisc_bstats_update(struct Qdisc *sch,
				       const struct sk_buff *skb)
{
	bstats_update(&sch->bstats, skb);
}

static inline void qdisc_qstats_backlog_dec(struct Qdisc *sch,
					    const struct sk_buff *skb)
{
	sch->qstats.backlog -= qdisc_pkt_len(skb);
}

static inline void qdisc_qstats_cpu_backlog_dec(struct Qdisc *sch,
						const struct sk_buff *skb)
{
	this_cpu_sub(sch->cpu_qstats->backlog, qdisc_pkt_len(skb));
}

static inline void qdisc_qstats_backlog_inc(struct Qdisc *sch,
					    const struct sk_buff *skb)
{
	sch->qstats.backlog += qdisc_pkt_len(skb);
}

static inline void qdisc_qstats_cpu_backlog_inc(struct Qdisc *sch,
						const struct sk_buff *skb)
{
	this_cpu_add(sch->cpu_qstats->backlog, qdisc_pkt_len(skb));
}

static inline void qdisc_qstats_cpu_qlen_inc(struct Qdisc *sch)
{
	this_cpu_inc(sch->cpu_qstats->qlen);
}

static inline void qdisc_qstats_cpu_qlen_dec(struct Qdisc *sch)
{
	this_cpu_dec(sch->cpu_qstats->qlen);
}

static inline void qdisc_qstats_cpu_requeues_inc(struct Qdisc *sch)
{
	this_cpu_inc(sch->cpu_qstats->requeues);
}

static inline void __qdisc_qstats_drop(struct Qdisc *sch, int count)
{
	sch->qstats.drops += count;
}

static inline void qstats_drop_inc(struct gnet_stats_queue *qstats)
{
	qstats->drops++;
}

static inline void qstats_overlimit_inc(struct gnet_stats_queue *qstats)
{
	qstats->overlimits++;
}

static inline void qdisc_qstats_drop(struct Qdisc *sch)
{
	qstats_drop_inc(&sch->qstats);
}

static inline void qdisc_qstats_cpu_drop(struct Qdisc *sch)
{
	this_cpu_inc(sch->cpu_qstats->drops);
}

static inline void qdisc_qstats_overlimit(struct Qdisc *sch)
{
	sch->qstats.overlimits++;
}

static inline int qdisc_qstats_copy(struct gnet_dump *d, struct Qdisc *sch)
{
	__u32 qlen = qdisc_qlen_sum(sch);

	return gnet_stats_copy_queue(d, sch->cpu_qstats, &sch->qstats, qlen);
}

static inline void qdisc_qstats_qlen_backlog(struct Qdisc *sch, __u32 *qlen,
					     __u32 *backlog)
{
	struct gnet_stats_queue qstats = { 0 };
	__u32 len = qdisc_qlen_sum(sch);

	__gnet_stats_copy_queue(&qstats, sch->cpu_qstats, &sch->qstats, len);
	*qlen = qstats.qlen;
	*backlog = qstats.backlog;
}

static inline void qdisc_tree_flush_backlog(struct Qdisc *sch)
{
	__u32 qlen, backlog;

	qdisc_qstats_qlen_backlog(sch, &qlen, &backlog);
	qdisc_tree_reduce_backlog(sch, qlen, backlog);
}

static inline void qdisc_purge_queue(struct Qdisc *sch)
{
	__u32 qlen, backlog;

	qdisc_qstats_qlen_backlog(sch, &qlen, &backlog);
	qdisc_reset(sch);
	qdisc_tree_reduce_backlog(sch, qlen, backlog);
}

static inline void qdisc_skb_head_init(struct qdisc_skb_head *qh)
{
	qh->head = NULL;
	qh->tail = NULL;
	qh->qlen = 0;
}

static inline void __qdisc_enqueue_tail(struct sk_buff *skb,
					struct qdisc_skb_head *qh)
{
	struct sk_buff *last = qh->tail;

	if (last) {
		skb->next = NULL;
		last->next = skb;
		qh->tail = skb;
	} else {
		qh->tail = skb;
		qh->head = skb;
	}
	qh->qlen++;
}

static inline int qdisc_enqueue_tail(struct sk_buff *skb, struct Qdisc *sch)
{
	__qdisc_enqueue_tail(skb, &sch->q);
	qdisc_qstats_backlog_inc(sch, skb);
	return NET_XMIT_SUCCESS;
}

static inline void __qdisc_enqueue_head(struct sk_buff *skb,
					struct qdisc_skb_head *qh)
{
	skb->next = qh->head;

	if (!qh->head)
		qh->tail = skb;
	qh->head = skb;
	qh->qlen++;
}

static inline struct sk_buff *__qdisc_dequeue_head(struct qdisc_skb_head *qh)
{
	struct sk_buff *skb = qh->head;

	if (likely(skb != NULL)) {
		qh->head = skb->next;
		qh->qlen--;
		if (qh->head == NULL)
			qh->tail = NULL;
		skb->next = NULL;
	}

	return skb;
}

static inline struct sk_buff *qdisc_dequeue_head(struct Qdisc *sch)
{
	struct sk_buff *skb = __qdisc_dequeue_head(&sch->q);

	if (likely(skb != NULL)) {
		qdisc_qstats_backlog_dec(sch, skb);
		qdisc_bstats_update(sch, skb);
	}

	return skb;
}

/* Instead of calling kfree_skb() while root qdisc lock is held,
 * queue the skb for future freeing at end of __dev_xmit_skb()
 */
static inline void __qdisc_drop(struct sk_buff *skb, struct sk_buff **to_free)
{
	skb->next = *to_free;
	*to_free = skb;
}

static inline void __qdisc_drop_all(struct sk_buff *skb,
				    struct sk_buff **to_free)
{
	if (skb->prev)
		skb->prev->next = *to_free;
	else
		skb->next = *to_free;
	*to_free = skb;
}

static inline unsigned int __qdisc_queue_drop_head(struct Qdisc *sch,
						   struct qdisc_skb_head *qh,
						   struct sk_buff **to_free)
{
	struct sk_buff *skb = __qdisc_dequeue_head(qh);

	if (likely(skb != NULL)) {
		unsigned int len = qdisc_pkt_len(skb);

		qdisc_qstats_backlog_dec(sch, skb);
		__qdisc_drop(skb, to_free);
		return len;
	}

	return 0;
}

static inline struct sk_buff *qdisc_peek_head(struct Qdisc *sch)
{
	const struct qdisc_skb_head *qh = &sch->q;

	return qh->head;
}

/* generic pseudo peek method for non-work-conserving qdisc */
static inline struct sk_buff *qdisc_peek_dequeued(struct Qdisc *sch)
{
	struct sk_buff *skb = skb_peek(&sch->gso_skb);

	/* we can reuse ->gso_skb because peek isn't called for root qdiscs */
	if (!skb) {
		skb = sch->dequeue(sch);

		if (skb) {
			__skb_queue_head(&sch->gso_skb, skb);
			/* it's still part of the queue */
			qdisc_qstats_backlog_inc(sch, skb);
			sch->q.qlen++;
		}
	}

	return skb;
}

static inline void qdisc_update_stats_at_dequeue(struct Qdisc *sch,
						 struct sk_buff *skb)
{
	if (qdisc_is_percpu_stats(sch)) {
		qdisc_qstats_cpu_backlog_dec(sch, skb);
		qdisc_bstats_cpu_update(sch, skb);
		qdisc_qstats_cpu_qlen_dec(sch);
	} else {
		qdisc_qstats_backlog_dec(sch, skb);
		qdisc_bstats_update(sch, skb);
		sch->q.qlen--;
	}
}

static inline void qdisc_update_stats_at_enqueue(struct Qdisc *sch,
						 unsigned int pkt_len)
{
	if (qdisc_is_percpu_stats(sch)) {
		qdisc_qstats_cpu_qlen_inc(sch);
		this_cpu_add(sch->cpu_qstats->backlog, pkt_len);
	} else {
		sch->qstats.backlog += pkt_len;
		sch->q.qlen++;
	}
}

/* use instead of qdisc->dequeue() for all qdiscs queried with ->peek() */
static inline struct sk_buff *qdisc_dequeue_peeked(struct Qdisc *sch)
{
	struct sk_buff *skb = skb_peek(&sch->gso_skb);

	if (skb) {
		skb = __skb_dequeue(&sch->gso_skb);
		if (qdisc_is_percpu_stats(sch)) {
			qdisc_qstats_cpu_backlog_dec(sch, skb);
			qdisc_qstats_cpu_qlen_dec(sch);
		} else {
			qdisc_qstats_backlog_dec(sch, skb);
			sch->q.qlen--;
		}
	} else {
		skb = sch->dequeue(sch);
	}

	return skb;
}
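
/* Illustrative sketch: a shaping qdisc typically pairs these helpers on
 * its child qdisc; peek to see what sending would cost, and dequeue only
 * once the packet may actually go out (token-bucket details elided;
 * tokens_available() is a hypothetical predicate standing in for the
 * shaper's own accounting):
 *
 *	skb = q->child->ops->peek(q->child);
 *	if (skb && tokens_available(q, qdisc_pkt_len(skb)))
 *		skb = qdisc_dequeue_peeked(q->child);
 */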

static inline void __qdisc_reset_queue(struct qdisc_skb_head *qh)
{
	/*
	 * We do not know the backlog in bytes of this list, it
	 * is up to the caller to correct it
	 */
	ASSERT_RTNL();
	if (qh->qlen) {
		rtnl_kfree_skbs(qh->head, qh->tail);

		qh->head = NULL;
		qh->tail = NULL;
		qh->qlen = 0;
	}
}

static inline void qdisc_reset_queue(struct Qdisc *sch)
{
	__qdisc_reset_queue(&sch->q);
	sch->qstats.backlog = 0;
}

static inline struct Qdisc *qdisc_replace(struct Qdisc *sch, struct Qdisc *new,
					  struct Qdisc **pold)
{
	struct Qdisc *old;

	sch_tree_lock(sch);
	old = *pold;
	*pold = new;
	if (old != NULL)
		qdisc_purge_queue(old);
	sch_tree_unlock(sch);

	return old;
}
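
/* Illustrative sketch: the usual ->graft() implementation is little more
 * than a qdisc_replace() call (struct and field names hypothetical):
 *
 *	static int example_graft(struct Qdisc *sch, unsigned long arg,
 *				 struct Qdisc *new, struct Qdisc **old,
 *				 struct netlink_ext_ack *extack)
 *	{
 *		struct example_sched *q = qdisc_priv(sch);
 *
 *		if (!new)
 *			new = &noop_qdisc;
 *		*old = qdisc_replace(sch, new, &q->child);
 *		return 0;
 *	}
 */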

static inline void rtnl_qdisc_drop(struct sk_buff *skb, struct Qdisc *sch)
{
	rtnl_kfree_skbs(skb, skb);
	qdisc_qstats_drop(sch);
}

static inline int qdisc_drop_cpu(struct sk_buff *skb, struct Qdisc *sch,
				 struct sk_buff **to_free)
{
	__qdisc_drop(skb, to_free);
	qdisc_qstats_cpu_drop(sch);

	return NET_XMIT_DROP;
}

static inline int qdisc_drop(struct sk_buff *skb, struct Qdisc *sch,
			     struct sk_buff **to_free)
{
	__qdisc_drop(skb, to_free);
	qdisc_qstats_drop(sch);

	return NET_XMIT_DROP;
}

static inline int qdisc_drop_all(struct sk_buff *skb, struct Qdisc *sch,
				 struct sk_buff **to_free)
{
	__qdisc_drop_all(skb, to_free);
	qdisc_qstats_drop(sch);

	return NET_XMIT_DROP;
}

/* Length to Time (L2T) lookup in a qdisc_rate_table, to determine how
 * long it will take to send a packet given its size.
 */
static inline u32 qdisc_l2t(struct qdisc_rate_table *rtab, unsigned int pktlen)
{
	int slot = pktlen + rtab->rate.cell_align + rtab->rate.overhead;

	if (slot < 0)
		slot = 0;
	slot >>= rtab->rate.cell_log;
	if (slot > 255)
		return rtab->data[255] * (slot >> 8) + rtab->data[slot & 0xFF];
	return rtab->data[slot];
}
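
/* Worked example (numbers made up for illustration): with cell_log = 3 and
 * no align/overhead, a 1000-byte packet maps to slot 1000 >> 3 = 125, so
 * the transmit time is simply rtab->data[125]. Packets whose slot exceeds
 * 255 are costed as (slot >> 8) copies of the largest table entry
 * (rtab->data[255]) plus the entry for the remainder (slot & 0xFF), which
 * is exactly what the final expression computes.
 */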

struct psched_ratecfg {
	u64	rate_bytes_ps; /* bytes per second */
	u32	mult;
	u16	overhead;
	u8	linklayer;
	u8	shift;
};

static inline u64 psched_l2t_ns(const struct psched_ratecfg *r,
				unsigned int len)
{
	len += r->overhead;

	if (unlikely(r->linklayer == TC_LINKLAYER_ATM))
		return ((u64)(DIV_ROUND_UP(len, 48) * 53) * r->mult) >> r->shift;

	return ((u64)len * r->mult) >> r->shift;
}
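
/* The mult/shift pair is a precomputed fixed-point reciprocal of the rate:
 * psched_ratecfg_precompute() chooses them so that
 *
 *	(len * mult) >> shift  ~=  len * NSEC_PER_SEC / rate_bytes_ps
 *
 * turning a per-packet division into a multiply and a shift. The ATM
 * branch first rounds the length up to whole 53-byte cells (48 bytes of
 * payload each) before applying the same conversion.
 */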

void psched_ratecfg_precompute(struct psched_ratecfg *r,
			       const struct tc_ratespec *conf,
			       u64 rate64);

static inline void psched_ratecfg_getrate(struct tc_ratespec *res,
					  const struct psched_ratecfg *r)
{
	memset(res, 0, sizeof(*res));

	/* legacy struct tc_ratespec has a 32bit @rate field
	 * Qdisc using 64bit rate should add new attributes
	 * in order to maintain compatibility.
	 */
	res->rate = min_t(u64, r->rate_bytes_ps, ~0U);

	res->overhead = r->overhead;
	res->linklayer = (r->linklayer & TC_LINKLAYER_MASK);
}

struct psched_pktrate {
	u64	rate_pkts_ps; /* packets per second */
	u32	mult;
	u8	shift;
};

static inline u64 psched_pkt2t_ns(const struct psched_pktrate *r,
				  unsigned int pkt_num)
{
	return ((u64)pkt_num * r->mult) >> r->shift;
}

void psched_ppscfg_precompute(struct psched_pktrate *r, u64 pktrate64);

/* Mini Qdisc serves the specific needs of the ingress/clsact Qdisc.
 * The fast path only needs to access the filter list and to update stats.
 */
struct mini_Qdisc {
	struct tcf_proto *filter_list;
	struct tcf_block *block;
	struct gnet_stats_basic_cpu __percpu *cpu_bstats;
	struct gnet_stats_queue __percpu *cpu_qstats;
	struct rcu_head rcu;
};

static inline void mini_qdisc_bstats_cpu_update(struct mini_Qdisc *miniq,
						const struct sk_buff *skb)
{
	bstats_cpu_update(this_cpu_ptr(miniq->cpu_bstats), skb);
}

static inline void mini_qdisc_qstats_cpu_drop(struct mini_Qdisc *miniq)
{
	this_cpu_inc(miniq->cpu_qstats->drops);
}

struct mini_Qdisc_pair {
	struct mini_Qdisc miniq1;
	struct mini_Qdisc miniq2;
	struct mini_Qdisc __rcu **p_miniq;
};

void mini_qdisc_pair_swap(struct mini_Qdisc_pair *miniqp,
			  struct tcf_proto *tp_head);
void mini_qdisc_pair_init(struct mini_Qdisc_pair *miniqp, struct Qdisc *qdisc,
			  struct mini_Qdisc __rcu **p_miniq);
void mini_qdisc_pair_block_init(struct mini_Qdisc_pair *miniqp,
				struct tcf_block *block);

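/* The pair of mini_Qdiscs implements a simple double buffer: updates are
 * prepared in the inactive copy, and mini_qdisc_pair_swap() publishes it
 * by flipping the RCU pointer *p_miniq, so fast-path readers never see a
 * half-updated filter list.
 */
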
int sch_frag_xmit_hook(struct sk_buff *skb, int (*xmit)(struct sk_buff *skb));

#endif