1 #ifndef __LINUX_PKT_SCHED_H
2 #define __LINUX_PKT_SCHED_H
4 #include <linux/types.h>
/* Logical priority bands that do not depend on a specific packet scheduler.
   Every scheduler maps them to real traffic classes if it has
   no more precise mechanism for classifying packets.

   These numbers have no special meaning, though their coincidence
   with obsolete IPv6 values is not accidental :-). Newer IPv6 drafts
   preferred the full anarchy inspired by the diffserv group.

   Note: TC_PRIO_BESTEFFORT does not mean that it is the most unhappy
   class; as a rule it will actually be handled with more care than
   filler or even bulk.
 */
/* Logical traffic priority values (scheduler-independent). */
#define TC_PRIO_BESTEFFORT		0
#define TC_PRIO_FILLER			1
#define TC_PRIO_BULK			2
#define TC_PRIO_INTERACTIVE_BULK	4
#define TC_PRIO_INTERACTIVE		6
#define TC_PRIO_CONTROL			7

/* Largest logical priority; TC_PRIO_MAX + 1 sizes tc_prio_qopt.priomap. */
#define TC_PRIO_MAX			15
/* Generic queue statistics, available for all the elements.
   Particular schedulers may also have their own private records.
 */
33 __u64 bytes; /* Number of enqueued bytes */
34 __u32 packets; /* Number of enqueued packets */
35 __u32 drops; /* Packets dropped because of lack of resources */
36 __u32 overlimits; /* Number of throttle events when this
37 * flow goes out of allocated bandwidth */
38 __u32 bps; /* Current flow byte rate */
39 __u32 pps; /* Current flow packet rate */
46 unsigned char ewma_log;
/* All the traffic control objects have 32-bit identifiers, or "handles".

   They can be considered opaque numbers from the user API viewpoint,
   but in fact they always consist of two fields, a major and a
   minor number, which the kernel interprets specially. Applications
   may rely on that structure, though doing so is not recommended.

   E.g. qdisc handles always have a minor number equal to zero;
   classes (or flows) have a major equal to the parent qdisc's major and
   a minor that uniquely identifies the class inside the qdisc.

   Macros to manipulate handles:
 */
/* Bit masks selecting the major (upper 16 bits) and minor (lower 16 bits)
 * fields of a 32-bit handle. */
#define TC_H_MAJ_MASK	(0xFFFF0000U)
#define TC_H_MIN_MASK	(0x0000FFFFU)

/* Major field of handle h, left in place in the upper 16 bits (not shifted). */
#define TC_H_MAJ(h)	((h) & TC_H_MAJ_MASK)
/* Minor field of handle h. */
#define TC_H_MIN(h)	((h) & TC_H_MIN_MASK)
/* Build a handle from the upper 16 bits of maj and the lower 16 bits of min;
 * bits outside each mask are discarded. */
#define TC_H_MAKE(maj, min)	(((maj) & TC_H_MAJ_MASK) | ((min) & TC_H_MIN_MASK))

/* Predefined handle values. */
#define TC_H_UNSPEC	(0U)
#define TC_H_ROOT	(0xFFFFFFFFU)
#define TC_H_INGRESS	(0xFFFFFFF1U)
77 unsigned char cell_log;
78 unsigned char __reserved;
79 unsigned short overhead;
/* Rate-table size constant; NOTE(review): units and users are outside this view. */
#define TC_RTAB_SIZE	1024
88 unsigned char cell_log;
89 unsigned char size_log;
92 unsigned int linklayer;
/* One less than __TCA_STAB_MAX, which is declared outside this view. */
#define TCA_STAB_MAX (__TCA_STAB_MAX - 1)
109 struct tc_fifo_qopt {
110 __u32 limit; /* Queue length: bytes for bfifo, packets for pfifo */
/* Band-count constants; presumably the upper and lower bounds for
 * tc_prio_qopt.bands - confirm against the scheduler code. */
#define TCQ_PRIO_BANDS		16
#define TCQ_MIN_PRIO_BANDS	2
118 struct tc_prio_qopt {
119 int bands; /* Number of bands */
120 __u8 priomap[TC_PRIO_MAX+1]; /* Map: logical priority -> PRIO band */
125 struct tc_multiq_qopt {
126 __u16 bands; /* Number of bands */
127 __u16 max_bands; /* Maximum number of queues */
133 struct tc_ratespec rate;
134 struct tc_ratespec peakrate;
/* One less than __TCA_TBF_MAX, which is declared outside this view. */
#define TCA_TBF_MAX (__TCA_TBF_MAX - 1)
153 /* TEQL does not require any parameters */
158 unsigned quantum; /* Bytes per round allocated to flow */
159 int perturb_period; /* Period of hash perturbation */
160 __u32 limit; /* Maximal packets in queue */
161 unsigned divisor; /* Hash divisor */
162 unsigned flows; /* Maximal number of flows */
165 struct tc_sfq_qopt_v1 {
166 struct tc_sfq_qopt v0;
167 unsigned int depth; /* max number of packets per flow */
168 unsigned int headdrop;
172 struct tc_sfq_xstats {
/* One less than __TCA_RED_MAX, which is declared outside this view. */
#define TCA_RED_MAX (__TCA_RED_MAX - 1)
189 __u32 limit; /* HARD maximal queue length (bytes) */
190 __u32 qth_min; /* Min average length threshold (bytes) */
191 __u32 qth_max; /* Max average length threshold (bytes) */
192 unsigned char Wlog; /* log(W) */
193 unsigned char Plog; /* log(P_max/(qth_max-qth_min)) */
194 unsigned char Scell_log; /* cell size for idle damping */
197 #define TC_RED_HARDDROP 2
198 #define TC_RED_ADAPTATIVE 4
201 struct tc_red_xstats {
202 __u32 early; /* Early drops */
203 __u32 pdrop; /* Drops due to queue limits */
204 __u32 other; /* Drops due to drop() calls */
205 __u32 marked; /* Marked packets */
/* One less than __TCA_GRED_MAX, which is declared outside this view. */
#define TCA_GRED_MAX (__TCA_GRED_MAX - 1)
223 struct tc_gred_qopt {
224 __u32 limit; /* HARD maximal queue length (bytes) */
225 __u32 qth_min; /* Min average length threshold (bytes) */
226 __u32 qth_max; /* Max average length threshold (bytes) */
227 __u32 DP; /* up to 2^32 DPs */
234 __u8 Wlog; /* log(W) */
235 __u8 Plog; /* log(P_max/(qth_max-qth_min)) */
236 __u8 Scell_log; /* cell size for idle damping */
237 __u8 prio; /* prio of this VQ */
243 struct tc_gred_sopt {
/* One less than __TCA_CHOKE_MAX, which is declared outside this view. */
#define TCA_CHOKE_MAX (__TCA_CHOKE_MAX - 1)
263 struct tc_choke_qopt {
264 __u32 limit; /* Hard queue length (packets) */
265 __u32 qth_min; /* Min average threshold (packets) */
266 __u32 qth_max; /* Max average threshold (packets) */
267 unsigned char Wlog; /* log(W) */
268 unsigned char Plog; /* log(P_max/(qth_max-qth_min)) */
269 unsigned char Scell_log; /* cell size for idle damping */
270 unsigned char flags; /* see RED flags */
273 struct tc_choke_xstats {
274 __u32 early; /* Early drops */
275 __u32 pdrop; /* Drops due to queue limits */
276 __u32 other; /* Drops due to drop() calls */
277 __u32 marked; /* Marked packets */
278 __u32 matched; /* Drops due to flow match */
/* HTB constants; NOTE(review): NUMPRIO/MAXDEPTH presumably bound the number of
 * priorities and the class hierarchy depth - confirm against the HTB code. */
#define TC_HTB_NUMPRIO		8
#define TC_HTB_MAXDEPTH		8
#define TC_HTB_PROTOVER		3 /* the same as HTB and TC's major */
287 struct tc_ratespec rate;
288 struct tc_ratespec ceil;
292 __u32 level; /* out only */
296 __u32 version; /* to match HTB/TC */
297 __u32 rate2quantum; /* bps->quantum divisor */
298 __u32 defcls; /* default class number */
299 __u32 debug; /* debug flags */
302 __u32 direct_pkts; /* count of non shaped packets */
/* One less than __TCA_HTB_MAX, which is declared outside this view. */
#define TCA_HTB_MAX (__TCA_HTB_MAX - 1)
315 struct tc_htb_xstats {
318 __u32 giants; /* too big packets (rate will not be accurate) */
325 struct tc_hfsc_qopt {
326 __u16 defcls; /* default class */
329 struct tc_service_curve {
330 __u32 m1; /* slope of the first segment in bps */
331 __u32 d; /* x-projection of the first segment in us */
332 __u32 m2; /* slope of the second segment in bps */
335 struct tc_hfsc_stats {
336 __u64 work; /* total work done */
337 __u64 rtwork; /* work done by real-time criteria */
338 __u32 period; /* current period */
339 __u32 level; /* class level in hierarchy */
/* One less than __TCA_HFSC_MAX, which is declared outside this view. */
#define TCA_HFSC_MAX (__TCA_HFSC_MAX - 1)
/* CBQ constants; NOTE(review): DEF_EWMA is presumably the default for the
 * ewma_log field of tc_cbq_lssopt - confirm against the CBQ code. */
#define TC_CBQ_MAXPRIO		8
#define TC_CBQ_MAXLEVEL		8
#define TC_CBQ_DEF_EWMA		5
359 struct tc_cbq_lssopt {
360 unsigned char change;
362 #define TCF_CBQ_LSS_BOUNDED 1
363 #define TCF_CBQ_LSS_ISOLATED 2
364 unsigned char ewma_log;
366 #define TCF_CBQ_LSS_FLAGS 1
367 #define TCF_CBQ_LSS_EWMA 2
368 #define TCF_CBQ_LSS_MAXIDLE 4
369 #define TCF_CBQ_LSS_MINIDLE 8
370 #define TCF_CBQ_LSS_OFFTIME 0x10
371 #define TCF_CBQ_LSS_AVPKT 0x20
378 struct tc_cbq_wrropt {
380 unsigned char priority;
381 unsigned char cpriority;
382 unsigned char __reserved;
388 unsigned char strategy;
389 #define TC_CBQ_OVL_CLASSIC 0
390 #define TC_CBQ_OVL_DELAY 1
391 #define TC_CBQ_OVL_LOWPRIO 2
392 #define TC_CBQ_OVL_DROP 3
393 #define TC_CBQ_OVL_RCLASSIC 4
394 unsigned char priority2;
399 struct tc_cbq_police {
400 unsigned char police;
401 unsigned char __res1;
402 unsigned short __res2;
411 struct tc_cbq_xstats {
423 TCA_CBQ_OVL_STRATEGY,
/* One less than __TCA_CBQ_MAX, which is declared outside this view. */
#define TCA_CBQ_MAX (__TCA_CBQ_MAX - 1)
437 TCA_DSMARK_DEFAULT_INDEX,
438 TCA_DSMARK_SET_TC_INDEX,
/* One less than __TCA_DSMARK_MAX, which is declared outside this view. */
#define TCA_DSMARK_MAX (__TCA_DSMARK_MAX - 1)
450 TCA_ATM_FD, /* file/socket descriptor */
451 TCA_ATM_PTR, /* pointer to descriptor - later */
452 TCA_ATM_HDR, /* LL header */
453 TCA_ATM_EXCESS, /* excess traffic class (0 for CLP) */
454 TCA_ATM_ADDR, /* PVC address (for output only) */
455 TCA_ATM_STATE, /* VC state (ATM_VS_*; for output only) */
/* One less than __TCA_ATM_MAX, which is declared outside this view. */
#define TCA_ATM_MAX (__TCA_ATM_MAX - 1)
461 /* Network emulator */
466 TCA_NETEM_DELAY_DIST,
/* One less than __TCA_NETEM_MAX, which is declared outside this view. */
#define TCA_NETEM_MAX (__TCA_NETEM_MAX - 1)
476 struct tc_netem_qopt {
477 __u32 latency; /* added delay (us) */
478 __u32 limit; /* fifo limit (packets) */
479 __u32 loss; /* random packet loss (0=none ~0=100%) */
480 __u32 gap; /* re-ordering gap (0 for none) */
481 __u32 duplicate; /* random packet dup (0=none ~0=100%) */
482 __u32 jitter; /* random jitter in latency (us) */
485 struct tc_netem_corr {
486 __u32 delay_corr; /* delay correlation */
487 __u32 loss_corr; /* packet loss correlation */
488 __u32 dup_corr; /* duplicate correlation */
491 struct tc_netem_reorder {
496 struct tc_netem_corrupt {
501 struct tc_netem_rate {
502 __u32 rate; /* byte/s */
503 __s32 packet_overhead;
510 NETEM_LOSS_GI, /* General Intuitive - 4 state model */
511 NETEM_LOSS_GE, /* Gilbert Elliot models */
/* One less than __NETEM_LOSS_MAX, which is declared outside this view. */
#define NETEM_LOSS_MAX (__NETEM_LOSS_MAX - 1)
516 /* State transition probabilities for 4 state model */
517 struct tc_netem_gimodel {
525 /* Gilbert-Elliot models */
526 struct tc_netem_gemodel {
/* Netem distribution constants; NOTE(review): presumably the scaling factor
 * and the maximum table size of the delay distribution - confirm. */
#define NETEM_DIST_SCALE	8192
#define NETEM_DIST_MAX		16384
/* One less than __TCA_DRR_MAX, which is declared outside this view. */
#define TCA_DRR_MAX (__TCA_DRR_MAX - 1)
546 struct tc_drr_stats {
/* TC_QOPT_BITMASK + 1 sizes tc_mqprio_qopt.prio_tc_map;
 * TC_QOPT_MAX_QUEUE sizes tc_mqprio_qopt.count and .offset. */
#define TC_QOPT_BITMASK		15
#define TC_QOPT_MAX_QUEUE	16
554 struct tc_mqprio_qopt {
556 __u8 prio_tc_map[TC_QOPT_BITMASK + 1];
558 __u16 count[TC_QOPT_MAX_QUEUE];
559 __u16 offset[TC_QOPT_MAX_QUEUE];
/* One less than __TCA_SFB_MAX, which is declared outside this view. */
#define TCA_SFB_MAX (__TCA_SFB_MAX - 1)
573 * Note: increment, decrement are Q0.16 fixed-point values.
576 __u32 rehash_interval; /* delay between hash move, in ms */
577 __u32 warmup_time; /* double buffering warmup time in ms (warmup_time < rehash_interval) */
578 __u32 max; /* max len of qlen_min */
579 __u32 bin_size; /* maximum queue length per bin */
580 __u32 increment; /* probability increment, (d1 in Blue) */
581 __u32 decrement; /* probability decrement, (d2 in Blue) */
582 __u32 limit; /* max SFB queue length */
583 __u32 penalty_rate; /* inelastic flows are rate limited to 'rate' pps */
587 struct tc_sfb_xstats {
592 __u32 childdrop; /* drops in child qdisc */
/* Largest 16-bit value; NOTE(review): presumably the maximum SFB marking
 * probability in the Q0.16 fixed-point format - confirm against the SFB code. */
#define SFB_MAX_PROB 0xFFFF
/* One less than __TCA_QFQ_MAX, which is declared outside this view. */
#define TCA_QFQ_MAX (__TCA_QFQ_MAX - 1)
611 struct tc_qfq_stats {