/* SPDX-License-Identifier: GPL-2.0 */
#ifndef __NET_SCHED_GENERIC_H
#define __NET_SCHED_GENERIC_H

#include <linux/netdevice.h>
#include <linux/types.h>
#include <linux/rcupdate.h>
#include <linux/pkt_sched.h>
#include <linux/pkt_cls.h>
#include <linux/percpu.h>
#include <linux/dynamic_queue_limits.h>
#include <linux/list.h>
#include <linux/refcount.h>
#include <linux/workqueue.h>
#include <linux/mutex.h>
#include <linux/rwsem.h>
#include <linux/atomic.h>
#include <linux/hashtable.h>
#include <net/gen_stats.h>
#include <net/rtnetlink.h>
#include <net/flow_offload.h>

struct Qdisc_ops;
struct qdisc_walker;
struct tcf_walker;
struct module;
struct bpf_flow_keys;

struct qdisc_rate_table {
	struct tc_ratespec rate;
	u32 data[256];
	struct qdisc_rate_table *next;
	int refcnt;
};

enum qdisc_state_t {
	__QDISC_STATE_SCHED,
	__QDISC_STATE_DEACTIVATED,
	__QDISC_STATE_MISSED,
	__QDISC_STATE_DRAINING,
};

enum qdisc_state2_t {
	/* Only for !TCQ_F_NOLOCK qdisc. Never access it directly.
	 * Use qdisc_run_begin/end() or qdisc_is_running() instead.
	 */
	__QDISC_STATE2_RUNNING,
};

#define QDISC_STATE_MISSED	BIT(__QDISC_STATE_MISSED)
#define QDISC_STATE_DRAINING	BIT(__QDISC_STATE_DRAINING)

#define QDISC_STATE_NON_EMPTY	(QDISC_STATE_MISSED | \
				 QDISC_STATE_DRAINING)

struct qdisc_size_table {
	struct rcu_head rcu;
	struct list_head list;
	struct tc_sizespec szopts;
	int refcnt;
	u16 data[];
};

/* similar to sk_buff_head, but skb->prev pointer is undefined. */
struct qdisc_skb_head {
	struct sk_buff *head;
	struct sk_buff *tail;
	__u32 qlen;
	spinlock_t lock;
};

struct Qdisc {
	int (*enqueue)(struct sk_buff *skb,
		       struct Qdisc *sch,
		       struct sk_buff **to_free);
	struct sk_buff *(*dequeue)(struct Qdisc *sch);
	unsigned int flags;
#define TCQ_F_BUILTIN		1
#define TCQ_F_INGRESS		2
#define TCQ_F_CAN_BYPASS	4
#define TCQ_F_MQROOT		8
#define TCQ_F_ONETXQUEUE	0x10 /* dequeue_skb() can assume all skbs are for
				      * q->dev_queue: it can test
				      * netif_xmit_frozen_or_stopped() before
				      * dequeueing the next packet.
				      * It's true for MQ/MQPRIO slaves, or
				      * non-multiqueue devices.
				      */
#define TCQ_F_WARN_NONWC	(1 << 16)
#define TCQ_F_CPUSTATS		0x20 /* run using percpu statistics */
#define TCQ_F_NOPARENT		0x40 /* root of its hierarchy:
				      * qdisc_tree_decrease_qlen() should stop.
				      */
#define TCQ_F_INVISIBLE		0x80 /* invisible by default in dump */
#define TCQ_F_NOLOCK		0x100 /* qdisc does not require locking */
#define TCQ_F_OFFLOADED		0x200 /* qdisc is offloaded to HW */
	u32 limit;
	const struct Qdisc_ops *ops;
	struct qdisc_size_table __rcu *stab;
	struct hlist_node hash;
	u32 handle;
	u32 parent;

	struct netdev_queue *dev_queue;

	struct net_rate_estimator __rcu *rate_est;
	struct gnet_stats_basic_sync __percpu *cpu_bstats;
	struct gnet_stats_queue __percpu *cpu_qstats;
	int pad;
	refcount_t refcnt;

	/*
	 * For performance's sake on SMP, we put the highly modified fields
	 * at the end.
	 */
	struct sk_buff_head gso_skb ____cacheline_aligned_in_smp;
	struct qdisc_skb_head q;
	struct gnet_stats_basic_sync bstats;
	struct gnet_stats_queue qstats;
	unsigned long state;
	unsigned long state2; /* must be written under qdisc spinlock */
	struct Qdisc *next_sched;
	struct sk_buff_head skb_bad_txq;

	spinlock_t busylock ____cacheline_aligned_in_smp;
	spinlock_t seqlock;

	struct rcu_head rcu;
	netdevice_tracker dev_tracker;
	/* private data */
	long privdata[] ____cacheline_aligned;
};

static inline void qdisc_refcount_inc(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_BUILTIN)
		return;
	refcount_inc(&qdisc->refcnt);
}

/* Intended to be used by unlocked users, when concurrent qdisc release is
 * possible.
 */
static inline struct Qdisc *qdisc_refcount_inc_nz(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_BUILTIN)
		return qdisc;
	if (refcount_inc_not_zero(&qdisc->refcnt))
		return qdisc;
	return NULL;
}

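/* Illustrative sketch (not part of the original header): a typical
 * unlocked caller takes a reference under RCU and backs off if the
 * qdisc is already being released:
 *
 *	rcu_read_lock();
 *	q = rcu_dereference(txq->qdisc);
 *	q = q ? qdisc_refcount_inc_nz(q) : NULL;
 *	rcu_read_unlock();
 *	if (!q)
 *		return;		(release already in progress)
 *	... use q ...
 *	qdisc_put(q);
 */
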
/* For !TCQ_F_NOLOCK qdisc: callers must either call this within a qdisc
 * root_lock section, or provide their own memory barriers -- ordering
 * against qdisc_run_begin/end() atomic bit operations.
 */
static inline bool qdisc_is_running(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_NOLOCK)
		return spin_is_locked(&qdisc->seqlock);
	return test_bit(__QDISC_STATE2_RUNNING, &qdisc->state2);
}

static inline bool nolock_qdisc_is_empty(const struct Qdisc *qdisc)
{
	return !(READ_ONCE(qdisc->state) & QDISC_STATE_NON_EMPTY);
}

static inline bool qdisc_is_percpu_stats(const struct Qdisc *q)
{
	return q->flags & TCQ_F_CPUSTATS;
}

static inline bool qdisc_is_empty(const struct Qdisc *qdisc)
{
	if (qdisc_is_percpu_stats(qdisc))
		return nolock_qdisc_is_empty(qdisc);
	return !READ_ONCE(qdisc->q.qlen);
}

/* For !TCQ_F_NOLOCK qdisc, qdisc_run_begin/end() must be invoked with
 * the qdisc root lock acquired.
 */
static inline bool qdisc_run_begin(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_NOLOCK) {
		if (spin_trylock(&qdisc->seqlock))
			return true;

		/* Paired with smp_mb__after_atomic() to make sure
		 * STATE_MISSED checking is synchronized with clearing
		 * in pfifo_fast_dequeue().
		 */
		smp_mb__before_atomic();

		/* If the MISSED flag is set, it means another thread has
		 * set the MISSED flag before the second spin_trylock(), so
		 * we can return false here to avoid multiple CPUs doing
		 * the set_bit() and second spin_trylock() concurrently.
		 */
		if (test_bit(__QDISC_STATE_MISSED, &qdisc->state))
			return false;

		/* Set the MISSED flag before the second spin_trylock();
		 * if the second spin_trylock() returns false, it means
		 * the CPU holding the lock will do the dequeuing for us,
		 * or it will see the MISSED flag set after releasing the
		 * lock and reschedule net_tx_action() to do the dequeuing.
		 */
		set_bit(__QDISC_STATE_MISSED, &qdisc->state);

		/* spin_trylock() only has load-acquire semantics, so use
		 * smp_mb__after_atomic() to ensure STATE_MISSED is set
		 * before doing the second spin_trylock().
		 */
		smp_mb__after_atomic();

		/* Retry again in case the other CPU may not see the new
		 * flag after it releases the lock at the end of
		 * qdisc_run_end().
		 */
		return spin_trylock(&qdisc->seqlock);
	}
	return !__test_and_set_bit(__QDISC_STATE2_RUNNING, &qdisc->state2);
}

static inline void qdisc_run_end(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_NOLOCK) {
		spin_unlock(&qdisc->seqlock);

		if (unlikely(test_bit(__QDISC_STATE_MISSED,
				      &qdisc->state)))
			__netif_schedule(qdisc);
	} else {
		__clear_bit(__QDISC_STATE2_RUNNING, &qdisc->state2);
	}
}

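/* Illustrative: callers bracket the dequeue loop with
 * qdisc_run_begin()/qdisc_run_end(), as qdisc_run() in
 * <net/pkt_sched.h> does:
 *
 *	if (qdisc_run_begin(q)) {
 *		__qdisc_run(q);
 *		qdisc_run_end(q);
 *	}
 *
 * For !TCQ_F_NOLOCK qdiscs the root lock must already be held around
 * this sequence.
 */
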
static inline bool qdisc_may_bulk(const struct Qdisc *qdisc)
{
	return qdisc->flags & TCQ_F_ONETXQUEUE;
}

static inline int qdisc_avail_bulklimit(const struct netdev_queue *txq)
{
#ifdef CONFIG_BQL
	/* Non-BQL migrated drivers will return 0, too. */
	return dql_avail(&txq->dql);
#else
	return 0;
#endif
}

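/* Illustrative sketch of how the bulk limit is consumed: after the
 * first packet has been dequeued, the remaining BQL budget bounds how
 * many more packets are chained onto one xmit batch (compare
 * try_bulk_dequeue_skb() in net/sched/sch_generic.c):
 *
 *	int bytelimit = qdisc_avail_bulklimit(txq) - skb->len;
 *
 *	while (bytelimit > 0) {
 *		struct sk_buff *nskb = q->dequeue(q);
 *
 *		if (!nskb)
 *			break;
 *		bytelimit -= nskb->len;
 *		skb->next = nskb;
 *		skb = nskb;
 *	}
 */
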
struct Qdisc_class_ops {
	unsigned int flags;
	/* Child qdisc manipulation */
	struct netdev_queue *(*select_queue)(struct Qdisc *, struct tcmsg *);
	int (*graft)(struct Qdisc *, unsigned long cl,
		     struct Qdisc *, struct Qdisc **,
		     struct netlink_ext_ack *extack);
	struct Qdisc *(*leaf)(struct Qdisc *, unsigned long cl);
	void (*qlen_notify)(struct Qdisc *, unsigned long);

	/* Class manipulation routines */
	unsigned long (*find)(struct Qdisc *, u32 classid);
	int (*change)(struct Qdisc *, u32, u32,
		      struct nlattr **, unsigned long *,
		      struct netlink_ext_ack *);
	int (*delete)(struct Qdisc *, unsigned long,
		      struct netlink_ext_ack *);
	void (*walk)(struct Qdisc *, struct qdisc_walker *arg);

	/* Filter manipulation */
	struct tcf_block *(*tcf_block)(struct Qdisc *sch,
				       unsigned long arg,
				       struct netlink_ext_ack *extack);
	unsigned long (*bind_tcf)(struct Qdisc *, unsigned long,
				  u32 classid);
	void (*unbind_tcf)(struct Qdisc *, unsigned long);

	/* rtnetlink specific */
	int (*dump)(struct Qdisc *, unsigned long,
		    struct sk_buff *skb, struct tcmsg *);
	int (*dump_stats)(struct Qdisc *, unsigned long,
			  struct gnet_dump *);
};

/* Qdisc_class_ops flag values */

/* Implements API that doesn't require rtnl lock */
enum qdisc_class_ops_flags {
	QDISC_CLASS_OPS_DOIT_UNLOCKED = 1,
};

struct Qdisc_ops {
	struct Qdisc_ops *next;
	const struct Qdisc_class_ops *cl_ops;
	char id[IFNAMSIZ];
	int priv_size;
	unsigned int static_flags;

	int (*enqueue)(struct sk_buff *skb,
		       struct Qdisc *sch,
		       struct sk_buff **to_free);
	struct sk_buff *(*dequeue)(struct Qdisc *);
	struct sk_buff *(*peek)(struct Qdisc *);

	int (*init)(struct Qdisc *sch, struct nlattr *arg,
		    struct netlink_ext_ack *extack);
	void (*reset)(struct Qdisc *);
	void (*destroy)(struct Qdisc *);
	int (*change)(struct Qdisc *sch,
		      struct nlattr *arg,
		      struct netlink_ext_ack *extack);
	void (*attach)(struct Qdisc *sch);
	int (*change_tx_queue_len)(struct Qdisc *, unsigned int);
	void (*change_real_num_tx)(struct Qdisc *sch,
				   unsigned int new_real_tx);

	int (*dump)(struct Qdisc *, struct sk_buff *);
	int (*dump_stats)(struct Qdisc *, struct gnet_dump *);

	void (*ingress_block_set)(struct Qdisc *sch,
				  u32 block_index);
	void (*egress_block_set)(struct Qdisc *sch,
				 u32 block_index);
	u32 (*ingress_block_get)(struct Qdisc *sch);
	u32 (*egress_block_get)(struct Qdisc *sch);

	struct module *owner;
};

struct tcf_result {
	union {
		struct {
			unsigned long class;
			u32 classid;
		};
		const struct tcf_proto *goto_tp;

		/* used in the skb_tc_reinsert function */
		struct {
			bool ingress;
			struct gnet_stats_queue *qstats;
		};
	};
};

struct tcf_chain;

struct tcf_proto_ops {
	struct list_head head;
	char kind[IFNAMSIZ];

	int (*classify)(struct sk_buff *,
			const struct tcf_proto *,
			struct tcf_result *);
	int (*init)(struct tcf_proto *);
	void (*destroy)(struct tcf_proto *tp, bool rtnl_held,
			struct netlink_ext_ack *extack);

	void *(*get)(struct tcf_proto *, u32 handle);
	void (*put)(struct tcf_proto *tp, void *f);
	int (*change)(struct net *net, struct sk_buff *,
		      struct tcf_proto *, unsigned long,
		      u32 handle, struct nlattr **,
		      void **, u32,
		      struct netlink_ext_ack *);
	int (*delete)(struct tcf_proto *tp, void *arg,
		      bool *last, bool rtnl_held,
		      struct netlink_ext_ack *);
	bool (*delete_empty)(struct tcf_proto *tp);
	void (*walk)(struct tcf_proto *tp,
		     struct tcf_walker *arg, bool rtnl_held);
	int (*reoffload)(struct tcf_proto *tp, bool add,
			 flow_setup_cb_t *cb, void *cb_priv,
			 struct netlink_ext_ack *extack);
	void (*hw_add)(struct tcf_proto *tp,
		       void *type_data);
	void (*hw_del)(struct tcf_proto *tp,
		       void *type_data);
	void (*bind_class)(void *, u32, unsigned long,
			   void *, unsigned long);
	void *(*tmplt_create)(struct net *net,
			      struct tcf_chain *chain,
			      struct nlattr **tca,
			      struct netlink_ext_ack *extack);
	void (*tmplt_destroy)(void *tmplt_priv);

	/* rtnetlink specific */
	int (*dump)(struct net *, struct tcf_proto *, void *,
		    struct sk_buff *skb, struct tcmsg *,
		    bool);
	int (*terse_dump)(struct net *net,
			  struct tcf_proto *tp, void *fh,
			  struct sk_buff *skb,
			  struct tcmsg *t, bool rtnl_held);
	int (*tmplt_dump)(struct sk_buff *skb,
			  struct net *net,
			  void *tmplt_priv);

	struct module *owner;
	int flags;
};

/* Classifiers setting TCF_PROTO_OPS_DOIT_UNLOCKED in tcf_proto_ops->flags
 * are expected to implement tcf_proto_ops->delete_empty(), otherwise race
 * conditions can occur when filters are inserted/deleted simultaneously.
 */
enum tcf_proto_ops_flags {
	TCF_PROTO_OPS_DOIT_UNLOCKED = 1,
};

struct tcf_proto {
	/* Fast access part */
	struct tcf_proto __rcu *next;
	void __rcu *root;

	/* called under RCU BH lock */
	int (*classify)(struct sk_buff *,
			const struct tcf_proto *,
			struct tcf_result *);
	__be16 protocol;

	/* All the rest */
	u32 prio;
	void *data;
	const struct tcf_proto_ops *ops;
	struct tcf_chain *chain;
	/* Lock protects tcf_proto shared state and can be used by unlocked
	 * classifiers to protect their private data.
	 */
	spinlock_t lock;
	bool deleting;
	refcount_t refcnt;
	struct rcu_head rcu;
	struct hlist_node destroy_ht_node;
};

struct qdisc_skb_cb {
	struct {
		unsigned int pkt_len;
		u16 slave_dev_queue_mapping;
		u16 tc_classid;
	};
#define QDISC_CB_PRIV_LEN 20
	unsigned char data[QDISC_CB_PRIV_LEN];
};

typedef void tcf_chain_head_change_t(struct tcf_proto *tp_head, void *priv);

struct tcf_chain {
	/* Protects filter_chain. */
	struct mutex filter_chain_lock;
	struct tcf_proto __rcu *filter_chain;
	struct list_head list;
	struct tcf_block *block;
	u32 index; /* chain index */
	unsigned int refcnt;
	unsigned int action_refcnt;
	bool explicitly_created;
	bool flushing;
	const struct tcf_proto_ops *tmplt_ops;
	void *tmplt_priv;
	struct rcu_head rcu;
};

struct tcf_block {
	/* Lock protects tcf_block and lifetime-management data of chains
	 * attached to the block (refcnt, action_refcnt, explicitly_created).
	 */
	struct mutex lock;
	struct list_head chain_list;
	u32 index; /* block index for shared blocks */
	u32 classid; /* which class this block belongs to */
	refcount_t refcnt;
	struct net *net;
	struct Qdisc *q;
	struct rw_semaphore cb_lock; /* protects cb_list and offload counters */
	struct flow_block flow_block;
	struct list_head owner_list;
	bool keep_dst;
	atomic_t offloadcnt; /* Number of offloaded filters */
	unsigned int nooffloaddevcnt; /* Number of devs unable to do offload */
	unsigned int lockeddevcnt; /* Number of devs that require rtnl lock. */
	struct {
		struct tcf_chain *chain;
		struct list_head filter_chain_list;
	} chain0;
	struct rcu_head rcu;
	DECLARE_HASHTABLE(proto_destroy_ht, 7);
	struct mutex proto_destroy_lock; /* Lock for proto_destroy hashtable. */
};

static inline bool lockdep_tcf_chain_is_locked(struct tcf_chain *chain)
{
	return lockdep_is_held(&chain->filter_chain_lock);
}

static inline bool lockdep_tcf_proto_is_locked(struct tcf_proto *tp)
{
	return lockdep_is_held(&tp->lock);
}

#define tcf_chain_dereference(p, chain) \
	rcu_dereference_protected(p, lockdep_tcf_chain_is_locked(chain))

#define tcf_proto_dereference(p, tp) \
	rcu_dereference_protected(p, lockdep_tcf_proto_is_locked(tp))

static inline void qdisc_cb_private_validate(const struct sk_buff *skb, int sz)
{
	struct qdisc_skb_cb *qcb;

	BUILD_BUG_ON(sizeof(skb->cb) < sizeof(*qcb));
	BUILD_BUG_ON(sizeof(qcb->data) < sz);
}

static inline int qdisc_qlen(const struct Qdisc *q)
{
	return q->q.qlen;
}

static inline int qdisc_qlen_sum(const struct Qdisc *q)
{
	__u32 qlen = q->qstats.qlen;
	int i;

	if (qdisc_is_percpu_stats(q)) {
		for_each_possible_cpu(i)
			qlen += per_cpu_ptr(q->cpu_qstats, i)->qlen;
	} else {
		qlen += q->q.qlen;
	}

	return qlen;
}

static inline struct qdisc_skb_cb *qdisc_skb_cb(const struct sk_buff *skb)
{
	return (struct qdisc_skb_cb *)skb->cb;
}

static inline spinlock_t *qdisc_lock(struct Qdisc *qdisc)
{
	return &qdisc->q.lock;
}

static inline struct Qdisc *qdisc_root(const struct Qdisc *qdisc)
{
	struct Qdisc *q = rcu_dereference_rtnl(qdisc->dev_queue->qdisc);

	return q;
}

static inline struct Qdisc *qdisc_root_bh(const struct Qdisc *qdisc)
{
	return rcu_dereference_bh(qdisc->dev_queue->qdisc);
}

static inline struct Qdisc *qdisc_root_sleeping(const struct Qdisc *qdisc)
{
	return qdisc->dev_queue->qdisc_sleeping;
}

/* The qdisc root lock is a mechanism by which the top level
 * of a qdisc tree can be locked from any qdisc node in the
 * forest. This allows changing the configuration of some
 * aspect of the qdisc tree while blocking out asynchronous
 * qdisc access in the packet processing paths.
 *
 * It is only legal to do this when the root will not change
 * on us. Otherwise we'll potentially lock the wrong qdisc
 * root. This is enforced by holding the RTNL semaphore, which
 * all users of this lock accessor must do.
 */
static inline spinlock_t *qdisc_root_lock(const struct Qdisc *qdisc)
{
	struct Qdisc *root = qdisc_root(qdisc);

	ASSERT_RTNL();
	return qdisc_lock(root);
}

static inline spinlock_t *qdisc_root_sleeping_lock(const struct Qdisc *qdisc)
{
	struct Qdisc *root = qdisc_root_sleeping(qdisc);

	ASSERT_RTNL();
	return qdisc_lock(root);
}

static inline struct net_device *qdisc_dev(const struct Qdisc *qdisc)
{
	return qdisc->dev_queue->dev;
}

static inline void sch_tree_lock(struct Qdisc *q)
{
	if (q->flags & TCQ_F_MQROOT)
		spin_lock_bh(qdisc_lock(q));
	else
		spin_lock_bh(qdisc_root_sleeping_lock(q));
}

static inline void sch_tree_unlock(struct Qdisc *q)
{
	if (q->flags & TCQ_F_MQROOT)
		spin_unlock_bh(qdisc_lock(q));
	else
		spin_unlock_bh(qdisc_root_sleeping_lock(q));
}

extern struct Qdisc noop_qdisc;
extern struct Qdisc_ops noop_qdisc_ops;
extern struct Qdisc_ops pfifo_fast_ops;
extern struct Qdisc_ops mq_qdisc_ops;
extern struct Qdisc_ops noqueue_qdisc_ops;
extern const struct Qdisc_ops *default_qdisc_ops;
static inline const struct Qdisc_ops *
get_default_qdisc_ops(const struct net_device *dev, int ntx)
{
	return ntx < dev->real_num_tx_queues ?
			default_qdisc_ops : &pfifo_fast_ops;
}

struct Qdisc_class_common {
	u32 classid;
	struct hlist_node hnode;
};

struct Qdisc_class_hash {
	struct hlist_head *hash;
	unsigned int hashsize;
	unsigned int hashmask;
	unsigned int hashelems;
};

static inline unsigned int qdisc_class_hash(u32 id, u32 mask)
{
	id ^= id >> 8;
	id ^= id >> 4;
	return id & mask;
}

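/* Worked example (illustrative): the two xors fold the high bits of the
 * classid into the low bits before masking. For id = 0x1234 and
 * mask = 0xf:
 *
 *	id ^= id >> 8;	id becomes 0x1234 ^ 0x12  = 0x1226
 *	id ^= id >> 4;	id becomes 0x1226 ^ 0x122 = 0x1304
 *	id & mask	yields     0x1304 & 0xf   = 0x4
 */
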
static inline struct Qdisc_class_common *
qdisc_class_find(const struct Qdisc_class_hash *hash, u32 id)
{
	struct Qdisc_class_common *cl;
	unsigned int h;

	if (!id)
		return NULL;

	h = qdisc_class_hash(id, hash->hashmask);
	hlist_for_each_entry(cl, &hash->hash[h], hnode) {
		if (cl->classid == id)
			return cl;
	}
	return NULL;
}

static inline int tc_classid_to_hwtc(struct net_device *dev, u32 classid)
{
	u32 hwtc = TC_H_MIN(classid) - TC_H_MIN_PRIORITY;

	return (hwtc < netdev_get_num_tc(dev)) ? hwtc : -EINVAL;
}

int qdisc_class_hash_init(struct Qdisc_class_hash *);
void qdisc_class_hash_insert(struct Qdisc_class_hash *,
			     struct Qdisc_class_common *);
void qdisc_class_hash_remove(struct Qdisc_class_hash *,
			     struct Qdisc_class_common *);
void qdisc_class_hash_grow(struct Qdisc *, struct Qdisc_class_hash *);
void qdisc_class_hash_destroy(struct Qdisc_class_hash *);

int dev_qdisc_change_tx_queue_len(struct net_device *dev);
void dev_qdisc_change_real_num_tx(struct net_device *dev,
				  unsigned int new_real_tx);
void dev_init_scheduler(struct net_device *dev);
void dev_shutdown(struct net_device *dev);
void dev_activate(struct net_device *dev);
void dev_deactivate(struct net_device *dev);
void dev_deactivate_many(struct list_head *head);
struct Qdisc *dev_graft_qdisc(struct netdev_queue *dev_queue,
			      struct Qdisc *qdisc);
void qdisc_reset(struct Qdisc *qdisc);
void qdisc_put(struct Qdisc *qdisc);
void qdisc_put_unlocked(struct Qdisc *qdisc);
void qdisc_tree_reduce_backlog(struct Qdisc *qdisc, int n, int len);
#ifdef CONFIG_NET_SCHED
int qdisc_offload_dump_helper(struct Qdisc *q, enum tc_setup_type type,
			      void *type_data);
void qdisc_offload_graft_helper(struct net_device *dev, struct Qdisc *sch,
				struct Qdisc *new, struct Qdisc *old,
				enum tc_setup_type type, void *type_data,
				struct netlink_ext_ack *extack);
#else
static inline int
qdisc_offload_dump_helper(struct Qdisc *q, enum tc_setup_type type,
			  void *type_data)
{
	q->flags &= ~TCQ_F_OFFLOADED;
	return 0;
}

static inline void
qdisc_offload_graft_helper(struct net_device *dev, struct Qdisc *sch,
			   struct Qdisc *new, struct Qdisc *old,
			   enum tc_setup_type type, void *type_data,
			   struct netlink_ext_ack *extack)
{
}
#endif
struct Qdisc *qdisc_alloc(struct netdev_queue *dev_queue,
			  const struct Qdisc_ops *ops,
			  struct netlink_ext_ack *extack);
void qdisc_free(struct Qdisc *qdisc);
struct Qdisc *qdisc_create_dflt(struct netdev_queue *dev_queue,
				const struct Qdisc_ops *ops, u32 parentid,
				struct netlink_ext_ack *extack);
void __qdisc_calculate_pkt_len(struct sk_buff *skb,
			       const struct qdisc_size_table *stab);
int skb_do_redirect(struct sk_buff *);

static inline bool skb_at_tc_ingress(const struct sk_buff *skb)
{
#ifdef CONFIG_NET_CLS_ACT
	return skb->tc_at_ingress;
#else
	return false;
#endif
}

static inline bool skb_skip_tc_classify(struct sk_buff *skb)
{
#ifdef CONFIG_NET_CLS_ACT
	if (skb->tc_skip_classify) {
		skb->tc_skip_classify = 0;
		return true;
	}
#endif
	return false;
}

/* Reset all TX qdiscs of a device, from queue index i upwards. */
static inline void qdisc_reset_all_tx_gt(struct net_device *dev, unsigned int i)
{
	struct Qdisc *qdisc;

	for (; i < dev->num_tx_queues; i++) {
		qdisc = rtnl_dereference(netdev_get_tx_queue(dev, i)->qdisc);
		if (qdisc) {
			spin_lock_bh(qdisc_lock(qdisc));
			qdisc_reset(qdisc);
			spin_unlock_bh(qdisc_lock(qdisc));
		}
	}
}

/* Are all TX queues of the device empty? */
static inline bool qdisc_all_tx_empty(const struct net_device *dev)
{
	unsigned int i;

	rcu_read_lock();
	for (i = 0; i < dev->num_tx_queues; i++) {
		struct netdev_queue *txq = netdev_get_tx_queue(dev, i);
		const struct Qdisc *q = rcu_dereference(txq->qdisc);

		if (!qdisc_is_empty(q)) {
			rcu_read_unlock();
			return false;
		}
	}
	rcu_read_unlock();
	return true;
}

/* Are any of the TX qdiscs changing? */
static inline bool qdisc_tx_changing(const struct net_device *dev)
{
	unsigned int i;

	for (i = 0; i < dev->num_tx_queues; i++) {
		struct netdev_queue *txq = netdev_get_tx_queue(dev, i);

		if (rcu_access_pointer(txq->qdisc) != txq->qdisc_sleeping)
			return true;
	}
	return false;
}

/* Is the device using the noop qdisc on all queues? */
static inline bool qdisc_tx_is_noop(const struct net_device *dev)
{
	unsigned int i;

	for (i = 0; i < dev->num_tx_queues; i++) {
		struct netdev_queue *txq = netdev_get_tx_queue(dev, i);

		if (rcu_access_pointer(txq->qdisc) != &noop_qdisc)
			return false;
	}
	return true;
}

static inline unsigned int qdisc_pkt_len(const struct sk_buff *skb)
{
	return qdisc_skb_cb(skb)->pkt_len;
}

/* additional qdisc xmit flags (NET_XMIT_MASK in linux/netdevice.h) */
enum net_xmit_qdisc_t {
	__NET_XMIT_STOLEN = 0x00010000,
	__NET_XMIT_BYPASS = 0x00020000,
};

#ifdef CONFIG_NET_CLS_ACT
#define net_xmit_drop_count(e)	((e) & __NET_XMIT_STOLEN ? 0 : 1)
#else
#define net_xmit_drop_count(e)	(1)
#endif

static inline void qdisc_calculate_pkt_len(struct sk_buff *skb,
					   const struct Qdisc *sch)
{
#ifdef CONFIG_NET_SCHED
	struct qdisc_size_table *stab = rcu_dereference_bh(sch->stab);

	if (stab)
		__qdisc_calculate_pkt_len(skb, stab);
#endif
}

static inline int qdisc_enqueue(struct sk_buff *skb, struct Qdisc *sch,
				struct sk_buff **to_free)
{
	qdisc_calculate_pkt_len(skb, sch);
	return sch->enqueue(skb, sch, to_free);
}

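/* Illustrative: the caller owns the to_free list and frees it outside
 * the qdisc root lock, e.g. (compare __dev_xmit_skb() in
 * net/core/dev.c):
 *
 *	struct sk_buff *to_free = NULL;
 *	int rc;
 *
 *	rc = qdisc_enqueue(skb, q, &to_free) & NET_XMIT_MASK;
 *	...
 *	if (unlikely(to_free))
 *		kfree_skb_list(to_free);
 */
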
static inline void _bstats_update(struct gnet_stats_basic_sync *bstats,
				  __u64 bytes, __u32 packets)
{
	u64_stats_update_begin(&bstats->syncp);
	u64_stats_add(&bstats->bytes, bytes);
	u64_stats_add(&bstats->packets, packets);
	u64_stats_update_end(&bstats->syncp);
}

static inline void bstats_update(struct gnet_stats_basic_sync *bstats,
				 const struct sk_buff *skb)
{
	_bstats_update(bstats,
		       qdisc_pkt_len(skb),
		       skb_is_gso(skb) ? skb_shinfo(skb)->gso_segs : 1);
}

static inline void qdisc_bstats_cpu_update(struct Qdisc *sch,
					   const struct sk_buff *skb)
{
	bstats_update(this_cpu_ptr(sch->cpu_bstats), skb);
}

static inline void qdisc_bstats_update(struct Qdisc *sch,
				       const struct sk_buff *skb)
{
	bstats_update(&sch->bstats, skb);
}

static inline void qdisc_qstats_backlog_dec(struct Qdisc *sch,
					    const struct sk_buff *skb)
{
	sch->qstats.backlog -= qdisc_pkt_len(skb);
}

static inline void qdisc_qstats_cpu_backlog_dec(struct Qdisc *sch,
						const struct sk_buff *skb)
{
	this_cpu_sub(sch->cpu_qstats->backlog, qdisc_pkt_len(skb));
}

static inline void qdisc_qstats_backlog_inc(struct Qdisc *sch,
					    const struct sk_buff *skb)
{
	sch->qstats.backlog += qdisc_pkt_len(skb);
}

static inline void qdisc_qstats_cpu_backlog_inc(struct Qdisc *sch,
						const struct sk_buff *skb)
{
	this_cpu_add(sch->cpu_qstats->backlog, qdisc_pkt_len(skb));
}

static inline void qdisc_qstats_cpu_qlen_inc(struct Qdisc *sch)
{
	this_cpu_inc(sch->cpu_qstats->qlen);
}

static inline void qdisc_qstats_cpu_qlen_dec(struct Qdisc *sch)
{
	this_cpu_dec(sch->cpu_qstats->qlen);
}

static inline void qdisc_qstats_cpu_requeues_inc(struct Qdisc *sch)
{
	this_cpu_inc(sch->cpu_qstats->requeues);
}

static inline void __qdisc_qstats_drop(struct Qdisc *sch, int count)
{
	sch->qstats.drops += count;
}

static inline void qstats_drop_inc(struct gnet_stats_queue *qstats)
{
	qstats->drops++;
}

static inline void qstats_overlimit_inc(struct gnet_stats_queue *qstats)
{
	qstats->overlimits++;
}

static inline void qdisc_qstats_drop(struct Qdisc *sch)
{
	qstats_drop_inc(&sch->qstats);
}

static inline void qdisc_qstats_cpu_drop(struct Qdisc *sch)
{
	this_cpu_inc(sch->cpu_qstats->drops);
}

static inline void qdisc_qstats_overlimit(struct Qdisc *sch)
{
	sch->qstats.overlimits++;
}

static inline int qdisc_qstats_copy(struct gnet_dump *d, struct Qdisc *sch)
{
	__u32 qlen = qdisc_qlen_sum(sch);

	return gnet_stats_copy_queue(d, sch->cpu_qstats, &sch->qstats, qlen);
}

static inline void qdisc_qstats_qlen_backlog(struct Qdisc *sch, __u32 *qlen,
					     __u32 *backlog)
{
	struct gnet_stats_queue qstats = { 0 };

	gnet_stats_add_queue(&qstats, sch->cpu_qstats, &sch->qstats);
	*qlen = qstats.qlen + qdisc_qlen(sch);
	*backlog = qstats.backlog;
}

static inline void qdisc_tree_flush_backlog(struct Qdisc *sch)
{
	__u32 qlen, backlog;

	qdisc_qstats_qlen_backlog(sch, &qlen, &backlog);
	qdisc_tree_reduce_backlog(sch, qlen, backlog);
}

static inline void qdisc_purge_queue(struct Qdisc *sch)
{
	__u32 qlen, backlog;

	qdisc_qstats_qlen_backlog(sch, &qlen, &backlog);
	qdisc_reset(sch);
	qdisc_tree_reduce_backlog(sch, qlen, backlog);
}

static inline void qdisc_skb_head_init(struct qdisc_skb_head *qh)
{
	qh->head = NULL;
	qh->tail = NULL;
	qh->qlen = 0;
}

static inline void __qdisc_enqueue_tail(struct sk_buff *skb,
					struct qdisc_skb_head *qh)
{
	struct sk_buff *last = qh->tail;

	if (last) {
		skb->next = NULL;
		last->next = skb;
		qh->tail = skb;
	} else {
		qh->tail = skb;
		qh->head = skb;
	}
	qh->qlen++;
}

static inline int qdisc_enqueue_tail(struct sk_buff *skb, struct Qdisc *sch)
{
	__qdisc_enqueue_tail(skb, &sch->q);
	qdisc_qstats_backlog_inc(sch, skb);
	return NET_XMIT_SUCCESS;
}

static inline void __qdisc_enqueue_head(struct sk_buff *skb,
					struct qdisc_skb_head *qh)
{
	skb->next = qh->head;

	if (!qh->head)
		qh->tail = skb;
	qh->head = skb;
	qh->qlen++;
}

static inline struct sk_buff *__qdisc_dequeue_head(struct qdisc_skb_head *qh)
{
	struct sk_buff *skb = qh->head;

	if (likely(skb != NULL)) {
		qh->head = skb->next;
		qh->qlen--;
		if (qh->head == NULL)
			qh->tail = NULL;
		skb->next = NULL;
	}

	return skb;
}

static inline struct sk_buff *qdisc_dequeue_head(struct Qdisc *sch)
{
	struct sk_buff *skb = __qdisc_dequeue_head(&sch->q);

	if (likely(skb != NULL)) {
		qdisc_qstats_backlog_dec(sch, skb);
		qdisc_bstats_update(sch, skb);
	}

	return skb;
}

/* Instead of calling kfree_skb() while the root qdisc lock is held,
 * queue the skb for future freeing at the end of __dev_xmit_skb().
 */
static inline void __qdisc_drop(struct sk_buff *skb, struct sk_buff **to_free)
{
	skb->next = *to_free;
	*to_free = skb;
}

static inline void __qdisc_drop_all(struct sk_buff *skb,
				    struct sk_buff **to_free)
{
	if (skb->prev)
		skb->prev->next = *to_free;
	else
		skb->next = *to_free;
	*to_free = skb;
}

static inline unsigned int __qdisc_queue_drop_head(struct Qdisc *sch,
						   struct qdisc_skb_head *qh,
						   struct sk_buff **to_free)
{
	struct sk_buff *skb = __qdisc_dequeue_head(qh);

	if (likely(skb != NULL)) {
		unsigned int len = qdisc_pkt_len(skb);

		qdisc_qstats_backlog_dec(sch, skb);
		__qdisc_drop(skb, to_free);
		return len;
	}

	return 0;
}

static inline struct sk_buff *qdisc_peek_head(struct Qdisc *sch)
{
	const struct qdisc_skb_head *qh = &sch->q;

	return qh->head;
}

/* generic pseudo peek method for non-work-conserving qdisc */
static inline struct sk_buff *qdisc_peek_dequeued(struct Qdisc *sch)
{
	struct sk_buff *skb = skb_peek(&sch->gso_skb);

	/* we can reuse ->gso_skb because peek isn't called for root qdiscs */
	if (!skb) {
		skb = sch->dequeue(sch);

		if (skb) {
			__skb_queue_head(&sch->gso_skb, skb);
			/* it's still part of the queue */
			qdisc_qstats_backlog_inc(sch, skb);
			sch->q.qlen++;
		}
	}

	return skb;
}

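/* Illustrative: a shaping qdisc typically pairs the pseudo peek with
 * qdisc_dequeue_peeked() below, so a packet inspected too early is not
 * dequeued twice (can_send_now() is a hypothetical policy check):
 *
 *	skb = qdisc_peek_dequeued(sch);	  packet stays accounted in sch
 *	if (skb && can_send_now(skb))
 *		skb = qdisc_dequeue_peeked(sch);
 */
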
static inline void qdisc_update_stats_at_dequeue(struct Qdisc *sch,
						 struct sk_buff *skb)
{
	if (qdisc_is_percpu_stats(sch)) {
		qdisc_qstats_cpu_backlog_dec(sch, skb);
		qdisc_bstats_cpu_update(sch, skb);
		qdisc_qstats_cpu_qlen_dec(sch);
	} else {
		qdisc_qstats_backlog_dec(sch, skb);
		qdisc_bstats_update(sch, skb);
		sch->q.qlen--;
	}
}

static inline void qdisc_update_stats_at_enqueue(struct Qdisc *sch,
						 unsigned int pkt_len)
{
	if (qdisc_is_percpu_stats(sch)) {
		qdisc_qstats_cpu_qlen_inc(sch);
		this_cpu_add(sch->cpu_qstats->backlog, pkt_len);
	} else {
		sch->qstats.backlog += pkt_len;
		sch->q.qlen++;
	}
}

/* use instead of qdisc->dequeue() for all qdiscs queried with ->peek() */
static inline struct sk_buff *qdisc_dequeue_peeked(struct Qdisc *sch)
{
	struct sk_buff *skb = skb_peek(&sch->gso_skb);

	if (skb) {
		skb = __skb_dequeue(&sch->gso_skb);
		if (qdisc_is_percpu_stats(sch)) {
			qdisc_qstats_cpu_backlog_dec(sch, skb);
			qdisc_qstats_cpu_qlen_dec(sch);
		} else {
			qdisc_qstats_backlog_dec(sch, skb);
			sch->q.qlen--;
		}
	} else {
		skb = sch->dequeue(sch);
	}

	return skb;
}

static inline void __qdisc_reset_queue(struct qdisc_skb_head *qh)
{
	/*
	 * We do not know the backlog in bytes of this list; it
	 * is up to the caller to correct it.
	 */
	ASSERT_RTNL();
	if (qh->qlen) {
		rtnl_kfree_skbs(qh->head, qh->tail);

		qh->head = NULL;
		qh->tail = NULL;
		qh->qlen = 0;
	}
}

static inline void qdisc_reset_queue(struct Qdisc *sch)
{
	__qdisc_reset_queue(&sch->q);
	sch->qstats.backlog = 0;
}

static inline struct Qdisc *qdisc_replace(struct Qdisc *sch, struct Qdisc *new,
					  struct Qdisc **pold)
{
	struct Qdisc *old;

	sch_tree_lock(sch);
	old = *pold;
	*pold = new;
	if (old != NULL)
		qdisc_purge_queue(old);
	sch_tree_unlock(sch);

	return old;
}

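/* Illustrative: a classful qdisc's ->graft() callback often reduces to
 * (cl->qdisc being a hypothetical per-class child pointer):
 *
 *	*old = qdisc_replace(sch, new, &cl->qdisc);
 *	return 0;
 *
 * The displaced child comes back purged and unlinked, typically to be
 * released with qdisc_put() by the caller.
 */
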
static inline void rtnl_qdisc_drop(struct sk_buff *skb, struct Qdisc *sch)
{
	rtnl_kfree_skbs(skb, skb);
	qdisc_qstats_drop(sch);
}

static inline int qdisc_drop_cpu(struct sk_buff *skb, struct Qdisc *sch,
				 struct sk_buff **to_free)
{
	__qdisc_drop(skb, to_free);
	qdisc_qstats_cpu_drop(sch);

	return NET_XMIT_DROP;
}

static inline int qdisc_drop(struct sk_buff *skb, struct Qdisc *sch,
			     struct sk_buff **to_free)
{
	__qdisc_drop(skb, to_free);
	qdisc_qstats_drop(sch);

	return NET_XMIT_DROP;
}

static inline int qdisc_drop_all(struct sk_buff *skb, struct Qdisc *sch,
				 struct sk_buff **to_free)
{
	__qdisc_drop_all(skb, to_free);
	qdisc_qstats_drop(sch);

	return NET_XMIT_DROP;
}

/* Length to Time (L2T) lookup in a qdisc_rate_table, to determine how
 * long it will take to send a packet given its size.
 */
static inline u32 qdisc_l2t(struct qdisc_rate_table *rtab, unsigned int pktlen)
{
	int slot = pktlen + rtab->rate.cell_align + rtab->rate.overhead;

	if (slot < 0)
		slot = 0;
	slot >>= rtab->rate.cell_log;
	if (slot > 255)
		return rtab->data[255] * (slot >> 8) + rtab->data[slot & 0xFF];
	return rtab->data[slot];
}

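/* Worked example (illustrative): with cell_log = 3 and zero cell_align
 * and overhead, a 1000-byte packet maps to slot 1000 >> 3 = 125 and
 * costs rtab->data[125] time units. Slots above 255 are approximated
 * from the data[255] entry scaled by the slot's high byte, plus a
 * lookup of its low byte.
 */
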
struct psched_ratecfg {
	u64 rate_bytes_ps; /* bytes per second */
	u32 mult;
	u16 overhead;
	u16 mpu;
	u8 linklayer;
	u8 shift;
};

static inline u64 psched_l2t_ns(const struct psched_ratecfg *r,
				unsigned int len)
{
	len += r->overhead;

	if (len < r->mpu)
		len = r->mpu;

	if (unlikely(r->linklayer == TC_LINKLAYER_ATM))
		return ((u64)(DIV_ROUND_UP(len, 48) * 53) * r->mult) >> r->shift;

	return ((u64)len * r->mult) >> r->shift;
}

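/* Worked example (illustrative): psched_ratecfg_precompute() chooses
 * mult and shift so that (len * mult) >> shift approximates
 * len * NSEC_PER_SEC / rate_bytes_ps. At 1 Gbit/s, i.e. 125,000,000
 * bytes/s, a 1500-byte packet therefore costs about
 * 1500 * 10^9 / (125 * 10^6) = 12000 ns of link time.
 */
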
void psched_ratecfg_precompute(struct psched_ratecfg *r,
			       const struct tc_ratespec *conf,
			       u64 rate64);

static inline void psched_ratecfg_getrate(struct tc_ratespec *res,
					  const struct psched_ratecfg *r)
{
	memset(res, 0, sizeof(*res));

	/* The legacy struct tc_ratespec has a 32bit @rate field;
	 * qdiscs using 64bit rates should add new attributes
	 * in order to maintain compatibility.
	 */
	res->rate = min_t(u64, r->rate_bytes_ps, ~0U);

	res->overhead = r->overhead;
	res->mpu = r->mpu;
	res->linklayer = (r->linklayer & TC_LINKLAYER_MASK);
}

struct psched_pktrate {
	u64 rate_pkts_ps; /* packets per second */
	u32 mult;
	u8 shift;
};

static inline u64 psched_pkt2t_ns(const struct psched_pktrate *r,
				  unsigned int pkt_num)
{
	return ((u64)pkt_num * r->mult) >> r->shift;
}

void psched_ppscfg_precompute(struct psched_pktrate *r, u64 pktrate64);

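/* Worked example (illustrative): for a configured rate of 1,000,000
 * packets/s, psched_pkt2t_ns() yields about 1000 ns per packet, so a
 * 10-packet burst accounts for roughly 10 us of link time.
 */
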
/* Mini Qdisc serves the specific needs of the ingress/clsact Qdisc.
 * The fast path only needs to access the filter list and to update stats.
 */
struct mini_Qdisc {
	struct tcf_proto *filter_list;
	struct tcf_block *block;
	struct gnet_stats_basic_sync __percpu *cpu_bstats;
	struct gnet_stats_queue __percpu *cpu_qstats;
	unsigned long rcu_state;
};

static inline void mini_qdisc_bstats_cpu_update(struct mini_Qdisc *miniq,
						const struct sk_buff *skb)
{
	bstats_update(this_cpu_ptr(miniq->cpu_bstats), skb);
}

static inline void mini_qdisc_qstats_cpu_drop(struct mini_Qdisc *miniq)
{
	this_cpu_inc(miniq->cpu_qstats->drops);
}

struct mini_Qdisc_pair {
	struct mini_Qdisc miniq1;
	struct mini_Qdisc miniq2;
	struct mini_Qdisc __rcu **p_miniq;
};

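/* Illustrative: the pair works as a double buffer. mini_qdisc_pair_swap()
 * publishes the currently unused mini_Qdisc through *p_miniq with the new
 * filter list and only reuses the other one after an RCU grace period, so
 * the fast path can read a consistent snapshot locklessly, roughly as
 * sch_handle_ingress() in net/core/dev.c does:
 *
 *	miniq = rcu_dereference_bh(*miniqp->p_miniq);
 *	if (miniq)
 *		ret = tcf_classify(skb, miniq->block, miniq->filter_list,
 *				   &res, false);
 */
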
void mini_qdisc_pair_swap(struct mini_Qdisc_pair *miniqp,
			  struct tcf_proto *tp_head);
void mini_qdisc_pair_init(struct mini_Qdisc_pair *miniqp, struct Qdisc *qdisc,
			  struct mini_Qdisc __rcu **p_miniq);
void mini_qdisc_pair_block_init(struct mini_Qdisc_pair *miniqp,
				struct tcf_block *block);

void mq_change_real_num_tx(struct Qdisc *sch, unsigned int new_real_tx);

int sch_frag_xmit_hook(struct sk_buff *skb, int (*xmit)(struct sk_buff *skb));

#endif