Commit | Line | Data |
---|---|---|
2874c5fd | 1 | /* SPDX-License-Identifier: GPL-2.0-or-later */ |
1da177e4 LT |
2 | /* |
3 | * INET An implementation of the TCP/IP protocol suite for the LINUX | |
4 | * operating system. INET is implemented using the BSD Socket | |
5 | * interface as the means of communication with the user level. | |
6 | * | |
7 | * Definitions for the TCP protocol. | |
8 | * | |
9 | * Version: @(#)tcp.h 1.0.2 04/28/93 | |
10 | * | |
11 | * Author: Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG> | |
1da177e4 LT |
12 | */ |
13 | #ifndef _LINUX_TCP_H | |
14 | #define _LINUX_TCP_H | |
15 | ||
1da177e4 | 16 | |
1da177e4 | 17 | #include <linux/skbuff.h> |
64033892 | 18 | #include <linux/win_minmax.h> |
1da177e4 | 19 | #include <net/sock.h> |
463c84b9 | 20 | #include <net/inet_connection_sock.h> |
8feaf0c0 | 21 | #include <net/inet_timewait_sock.h> |
607ca46e | 22 | #include <uapi/linux/tcp.h> |
1da177e4 | 23 | |
/*
 * tcp_hdr - view the transport header of @skb as a TCP header.
 *
 * Returns the pointer produced by skb_transport_header() cast to
 * struct tcphdr; no validation is performed here.
 */
static inline struct tcphdr *tcp_hdr(const struct sk_buff *skb)
{
	return (struct tcphdr *)skb_transport_header(skb);
}
28 | ||
d9b3fca2 CG |
29 | static inline unsigned int __tcp_hdrlen(const struct tcphdr *th) |
30 | { | |
31 | return th->doff * 4; | |
32 | } | |
33 | ||
/*
 * tcp_hdrlen - TCP header length of @skb.
 *
 * Looks up the TCP header via tcp_hdr() and returns __tcp_hdrlen() of it.
 */
static inline unsigned int tcp_hdrlen(const struct sk_buff *skb)
{
	const struct tcphdr *th = tcp_hdr(skb);

	return __tcp_hdrlen(th);
}
38 | ||
/*
 * inner_tcp_hdr - view the inner transport header of @skb as a TCP header.
 *
 * Returns the pointer produced by skb_inner_transport_header() cast to
 * struct tcphdr; no validation is performed here.
 */
static inline struct tcphdr *inner_tcp_hdr(const struct sk_buff *skb)
{
	return (struct tcphdr *)skb_inner_transport_header(skb);
}
43 | ||
/*
 * inner_tcp_hdrlen - TCP header length of the inner header of @skb.
 *
 * Same computation as tcp_hdrlen(), applied to inner_tcp_hdr(): the
 * doff field scaled by 4.
 */
static inline unsigned int inner_tcp_hdrlen(const struct sk_buff *skb)
{
	const struct tcphdr *inner_th = inner_tcp_hdr(skb);

	return __tcp_hdrlen(inner_th);
}
48 | ||
/**
 * skb_tcp_all_headers - Returns size of all headers for a TCP packet
 * @skb: buffer
 *
 * Used in TX path, for a packet known to be a TCP one.
 * The result is the transport header offset plus the TCP header length.
 *
 * if (skb_is_gso(skb)) {
 *         int hlen = skb_tcp_all_headers(skb);
 *         ...
 */
static inline int skb_tcp_all_headers(const struct sk_buff *skb)
{
	const unsigned int l4_hdr_len = tcp_hdrlen(skb);

	return skb_transport_offset(skb) + l4_hdr_len;
}
63 | ||
/**
 * skb_inner_tcp_all_headers - Returns size of all headers for an encap TCP packet
 * @skb: buffer
 *
 * Used in TX path, for a packet known to be a TCP one.
 * The result is the inner transport header offset plus the inner TCP
 * header length.
 *
 * if (skb_is_gso(skb) && skb->encapsulation) {
 *         int hlen = skb_inner_tcp_all_headers(skb);
 *         ...
 */
static inline int skb_inner_tcp_all_headers(const struct sk_buff *skb)
{
	const unsigned int inner_l4_hdr_len = inner_tcp_hdrlen(skb);

	return skb_inner_transport_offset(skb) + inner_l4_hdr_len;
}
78 | ||
ab6a5bb6 ACM |
79 | static inline unsigned int tcp_optlen(const struct sk_buff *skb) |
80 | { | |
aa8223c7 | 81 | return (tcp_hdr(skb)->doff - 5) * 4; |
ab6a5bb6 ACM |
82 | } |
83 | ||
/* TCP Fast Open: cookie sizes, all expressed in bytes. */
#define TCP_FASTOPEN_COOKIE_MIN		4	/* smallest Fast Open cookie */
#define TCP_FASTOPEN_COOKIE_MAX		16	/* largest Fast Open cookie */
#define TCP_FASTOPEN_COOKIE_SIZE	8	/* size employed by this implementation */
2100c8d2 YC |
88 | |
89 | /* TCP Fast Open Cookie as stored in memory */ | |
90 | struct tcp_fastopen_cookie { | |
438ac880 | 91 | __le64 val[DIV_ROUND_UP(TCP_FASTOPEN_COOKIE_MAX, sizeof(u64))]; |
2100c8d2 | 92 | s8 len; |
7f9b838b | 93 | bool exp; /* In RFC6994 experimental option format */ |
2100c8d2 YC |
94 | }; |
95 | ||
1da177e4 | 96 | /* This defines a selective acknowledgement block. */ |
269bd27e AV |
97 | struct tcp_sack_block_wire { |
98 | __be32 start_seq; | |
99 | __be32 end_seq; | |
100 | }; | |
101 | ||
1da177e4 | 102 | struct tcp_sack_block { |
3a137d20 ACM |
103 | u32 start_seq; |
104 | u32 end_seq; | |
1da177e4 LT |
105 | }; |
106 | ||
/* Bit values stored in the sack_ok field of struct tcp_options_received. */
#define TCP_SACK_SEEN     (1 << 0)   /* 1 = peer is SACK capable */
#define TCP_DSACK_SEEN    (1 << 2)   /* 1 = DSACK was received from peer */
110 | ||
1da177e4 LT |
111 | struct tcp_options_received { |
112 | /* PAWS/RTTM data */ | |
cca9bab1 | 113 | int ts_recent_stamp;/* Time we stored ts_recent (for aging) */ |
3a137d20 ACM |
114 | u32 ts_recent; /* Time stamp to echo next */ |
115 | u32 rcv_tsval; /* Time stamp value */ | |
116 | u32 rcv_tsecr; /* Time stamp echo reply */ | |
117 | u16 saw_tstamp : 1, /* Saw TIMESTAMP on last packet */ | |
1da177e4 LT |
118 | tstamp_ok : 1, /* TIMESTAMP seen on SYN packet */ |
119 | dsack : 1, /* D-SACK is scheduled */ | |
120 | wscale_ok : 1, /* Wscale seen on SYN packet */ | |
60e2a778 UB |
121 | sack_ok : 3, /* SACK seen on SYN packet */ |
122 | smc_ok : 1, /* SMC seen on SYN packet */ | |
1da177e4 LT |
123 | snd_wscale : 4, /* Window scaling received from sender */ |
124 | rcv_wscale : 4; /* Window scaling to send to receiver */ | |
7656d684 MKL |
125 | u8 saw_unknown:1, /* Received unknown option */ |
126 | unused:7; | |
3a137d20 | 127 | u8 num_sacks; /* Number of SACK blocks */ |
435cf559 | 128 | u16 user_mss; /* mss requested by user in ioctl */ |
3a137d20 | 129 | u16 mss_clamp; /* Maximal mss, negotiated at connection setup */ |
1da177e4 LT |
130 | }; |
131 | ||
519855c5 WAS |
132 | static inline void tcp_clear_options(struct tcp_options_received *rx_opt) |
133 | { | |
435cf559 WAS |
134 | rx_opt->tstamp_ok = rx_opt->sack_ok = 0; |
135 | rx_opt->wscale_ok = rx_opt->snd_wscale = 0; | |
60e2a778 UB |
136 | #if IS_ENABLED(CONFIG_SMC) |
137 | rx_opt->smc_ok = 0; | |
138 | #endif | |
519855c5 WAS |
139 | } |
140 | ||
/*
 * Maximum number of SACK blocks that we generate and process.
 *
 * Raising this is safe, but of limited use: the option occupies
 *	size = TCPOLEN_SACK_BASE_ALIGNED (4) + n * TCPOLEN_SACK_PERBLOCK (8)
 * bytes, so only four blocks will fit in a standard TCP header.
 */
#define TCP_NUM_SACKS 4
146 | ||
435cf559 WAS |
147 | struct tcp_request_sock_ops; |
148 | ||
2e6599cb | 149 | struct tcp_request_sock { |
cfb6eeb4 | 150 | struct inet_request_sock req; |
b2e4b3de | 151 | const struct tcp_request_sock_ops *af_specific; |
9a568de4 | 152 | u64 snt_synack; /* first SYNACK sent time */ |
9439ce00 | 153 | bool tfo_listener; |
cec37a6e | 154 | bool is_mptcp; |
90bf4513 PA |
155 | #if IS_ENABLED(CONFIG_MPTCP) |
156 | bool drop_req; | |
157 | #endif | |
58d607d3 | 158 | u32 txhash; |
435cf559 WAS |
159 | u32 rcv_isn; |
160 | u32 snt_isn; | |
95a22cae | 161 | u32 ts_off; |
a9b2c06d | 162 | u32 last_oow_ack_time; /* last SYNACK */ |
10467163 JC |
163 | u32 rcv_nxt; /* the ack # by SYNACK. For |
164 | * FastOpen it's the seq# | |
165 | * after data-in-SYN. | |
166 | */ | |
e9b12edc | 167 | u8 syn_tos; |
2e6599cb ACM |
168 | }; |
169 | ||
/*
 * tcp_rsk - reinterpret a request_sock pointer as a tcp_request_sock.
 *
 * A plain cast; the const qualifier of @req is dropped in the result.
 */
static inline struct tcp_request_sock *tcp_rsk(const struct request_sock *req)
{
	return (struct tcp_request_sock *)req;
}
174 | ||
1da177e4 | 175 | struct tcp_sock { |
463c84b9 ACM |
176 | /* inet_connection_sock has to be the first member of tcp_sock */ |
177 | struct inet_connection_sock inet_conn; | |
2ff52f28 | 178 | u16 tcp_header_len; /* Bytes of tcp header to send */ |
605ad7f1 | 179 | u16 gso_segs; /* Max number of segs per GSO packet */ |
1da177e4 | 180 | |
31770e34 FW |
181 | /* |
182 | * Header prediction flags | |
183 | * 0x5?10 << 16 + snd_wnd in net byte order | |
184 | */ | |
185 | __be32 pred_flags; | |
186 | ||
1da177e4 LT |
187 | /* |
188 | * RFC793 variables by their proper names. This means you can | |
189 | * read the code and the spec side by side (and laugh ...) | |
190 | * See RFC793 and RFC1122. The RFC writes these in capitals. | |
191 | */ | |
bdd1f9ed ED |
192 | u64 bytes_received; /* RFC4898 tcpEStatsAppHCThruOctetsReceived |
193 | * sum(delta(rcv_nxt)), or how many bytes | |
194 | * were acked. | |
195 | */ | |
2efd055c MRL |
196 | u32 segs_in; /* RFC4898 tcpEStatsPerfSegsIn |
197 | * total number of segments in. | |
198 | */ | |
a44d6eac MKL |
199 | u32 data_segs_in; /* RFC4898 tcpEStatsPerfDataSegsIn |
200 | * total number of data segments in. | |
201 | */ | |
3a137d20 | 202 | u32 rcv_nxt; /* What we want to receive next */ |
54287cc1 ED |
203 | u32 copied_seq; /* Head of yet unread data */ |
204 | u32 rcv_wup; /* rcv_nxt on last window update sent */ | |
3a137d20 | 205 | u32 snd_nxt; /* Next sequence we send */ |
2efd055c MRL |
206 | u32 segs_out; /* RFC4898 tcpEStatsPerfSegsOut |
207 | * The total number of segments sent. | |
208 | */ | |
a44d6eac MKL |
209 | u32 data_segs_out; /* RFC4898 tcpEStatsPerfDataSegsOut |
210 | * total number of data segments sent. | |
211 | */ | |
ba113c3a WW |
212 | u64 bytes_sent; /* RFC4898 tcpEStatsPerfHCDataOctetsOut |
213 | * total number of data bytes sent. | |
214 | */ | |
0df48c26 ED |
215 | u64 bytes_acked; /* RFC4898 tcpEStatsAppHCThruOctetsAcked |
216 | * sum(delta(snd_una)), or how many bytes | |
217 | * were acked. | |
218 | */ | |
7e10b655 WW |
219 | u32 dsack_dups; /* RFC4898 tcpEStatsStackDSACKDups |
220 | * total number of DSACK blocks received | |
221 | */ | |
3a137d20 ACM |
222 | u32 snd_una; /* First byte we want an ack for */ |
223 | u32 snd_sml; /* Last byte of the most recently transmitted small packet */ | |
224 | u32 rcv_tstamp; /* timestamp of last received ACK (for keepalives) */ | |
225 | u32 lsndtime; /* timestamp of last sent data packet (for restart window) */ | |
f2b2c582 | 226 | u32 last_oow_ack_time; /* timestamp of last out-of-window ACK */ |
86de5921 | 227 | u32 compressed_ack_rcv_nxt; |
1da177e4 | 228 | |
ceaa1fef AV |
229 | u32 tsoffset; /* timestamp offset */ |
230 | ||
46d3ceab | 231 | struct list_head tsq_node; /* anchor in tsq_tasklet.head list */ |
e2080072 | 232 | struct list_head tsorted_sent_queue; /* time-sorted sent but un-SACKed skbs */ |
46d3ceab | 233 | |
3a137d20 ACM |
234 | u32 snd_wl1; /* Sequence for window update */ |
235 | u32 snd_wnd; /* The window we expect to receive */ | |
236 | u32 max_window; /* Maximal window ever seen from peer */ | |
237 | u32 mss_cache; /* Cached effective mss, not including SACKS */ | |
1da177e4 | 238 | |
3a137d20 ACM |
239 | u32 window_clamp; /* Maximal window to advertise */ |
240 | u32 rcv_ssthresh; /* Current window clamp */ | |
1da177e4 | 241 | |
659a8ad5 YC |
242 | /* Information of the most recently (s)acked skb */ |
243 | struct tcp_rack { | |
9a568de4 | 244 | u64 mstamp; /* (Re)sent time of the skb */ |
deed7be7 | 245 | u32 rtt_us; /* Associated RTT */ |
1d0833df | 246 | u32 end_seq; /* Ending TCP sequence of the skb */ |
1f255691 PJ |
247 | u32 last_delivered; /* tp->delivered at last reo_wnd adj */ |
248 | u8 reo_wnd_steps; /* Allowed reordering window */ | |
249 | #define TCP_RACK_RECOVERY_THRESH 16 | |
250 | u8 reo_wnd_persist:5, /* No. of recovery since last adj */ | |
251 | dsack_seen:1, /* Whether DSACK seen after last adj */ | |
7ec65372 | 252 | advanced:1; /* mstamp advanced since last lost marking */ |
659a8ad5 | 253 | } rack; |
b79eeeb9 | 254 | u16 advmss; /* Advertised MSS */ |
5d9f4262 | 255 | u8 compressed_ack; |
76be93fc YC |
256 | u8 dup_ack_counter:2, |
257 | tlp_retrans:1, /* TLP is a retransmission */ | |
258 | unused:5; | |
05b055e8 FY |
259 | u32 chrono_start; /* Start time in jiffies of a TCP chrono */ |
260 | u32 chrono_stat[3]; /* Time in jiffies for chrono_stat stats */ | |
261 | u8 chrono_type:2, /* current chronograph type */ | |
262 | rate_app_limited:1, /* rate_{delivered,interval_us} limited? */ | |
19f6d3f3 | 263 | fastopen_connect:1, /* FASTOPEN_CONNECT sockopt */ |
71c02379 | 264 | fastopen_no_cookie:1, /* Allow send/recv SYN+data without a cookie */ |
d4761754 | 265 | is_sack_reneg:1, /* in recovery from loss with SACK reneg? */ |
48027478 | 266 | fastopen_client_fail:2; /* reason why fastopen failed */ |
36e31b0a AP |
267 | u8 nonagle : 4,/* Disable Nagle algorithm? */ |
268 | thin_lto : 1,/* Use linear timeouts for thin streams */ | |
b75eba76 | 269 | recvmsg_inq : 1,/* Indicate # of bytes in queue upon recvmsg */ |
e33099f9 YC |
270 | repair : 1, |
271 | frto : 1;/* F-RTO (RFC5682) activated in CA_Loss */ | |
ee995283 | 272 | u8 repair_queue; |
267cf9fa MKL |
273 | u8 save_syn:2, /* Save headers of SYN packet */ |
274 | syn_data:1, /* SYN includes data */ | |
6f73601e | 275 | syn_fastopen:1, /* SYN includes Fast Open option */ |
2646c831 | 276 | syn_fastopen_exp:1,/* SYN includes Fast Open exp. option */ |
cf1ef3f0 | 277 | syn_fastopen_ch:1, /* Active TFO re-enabling probe */ |
ca8a2263 | 278 | syn_data_acked:1,/* data in SYN is acked by SYN-ACK */ |
267cf9fa | 279 | is_cwnd_limited:1;/* forward progress limited by snd_cwnd? */ |
76be93fc | 280 | u32 tlp_high_seq; /* snd_nxt at the time of TLP */ |
1da177e4 | 281 | |
a842fe14 | 282 | u32 tcp_tx_delay; /* delay (in usec) added to TX packets */ |
9799ccb0 | 283 | u64 tcp_wstamp_ns; /* departure time for next sent data packet */ |
5f6188a8 | 284 | u64 tcp_clock_cache; /* cache last tcp_clock_ns() (see tcp_mstamp_refresh()) */ |
9799ccb0 | 285 | |
1da177e4 | 286 | /* RTT measurement */ |
9a568de4 | 287 | u64 tcp_mstamp; /* most recent packet received/sent */ |
740b0f18 ED |
288 | u32 srtt_us; /* smoothed round trip time << 3 in usecs */ |
289 | u32 mdev_us; /* medium deviation */ | |
290 | u32 mdev_max_us; /* maximal mdev for the last rtt period */ | |
291 | u32 rttvar_us; /* smoothed mdev_max */ | |
3a137d20 | 292 | u32 rtt_seq; /* sequence number to update rttvar */ |
64033892 | 293 | struct minmax rtt_min; |
3a137d20 ACM |
294 | |
295 | u32 packets_out; /* Packets which are "in flight" */ | |
3a137d20 | 296 | u32 retrans_out; /* Retransmitted packets out */ |
ca8a2263 | 297 | u32 max_packets_out; /* max packets_out in last window */ |
f4ce91ce | 298 | u32 cwnd_usage_seq; /* right edge of cwnd usage tracking flight */ |
b79eeeb9 IJ |
299 | |
300 | u16 urg_data; /* Saved octet of OOB data and control flags */ | |
b79eeeb9 | 301 | u8 ecn_flags; /* ECN status bits. */ |
dca145ff ED |
302 | u8 keepalive_probes; /* num of allowed keep alive probes */ |
303 | u32 reordering; /* Packet reordering metric. */ | |
7ec65372 | 304 | u32 reord_seen; /* number of data packet reordering events */ |
33f5f57e IJ |
305 | u32 snd_up; /* Urgent pointer */ |
306 | ||
1da177e4 LT |
307 | /* |
308 | * Options received (usually on last packet, some only on SYN packets). | |
309 | */ | |
1da177e4 LT |
310 | struct tcp_options_received rx_opt; |
311 | ||
312 | /* | |
313 | * Slow start and congestion control (see also Nagle, and Karn & Partridge) | |
314 | */ | |
3a137d20 ACM |
315 | u32 snd_ssthresh; /* Slow start size threshold */ |
316 | u32 snd_cwnd; /* Sending congestion window */ | |
f78a1b38 | 317 | u32 snd_cwnd_cnt; /* Linear increase counter */ |
e0ef57cc | 318 | u32 snd_cwnd_clamp; /* Do not allow snd_cwnd to grow above this */ |
3a137d20 ACM |
319 | u32 snd_cwnd_used; |
320 | u32 snd_cwnd_stamp; | |
4faf7839 | 321 | u32 prior_cwnd; /* cwnd right before starting loss recovery */ |
a262f0cd ND |
322 | u32 prr_delivered; /* Number of newly delivered packets to |
323 | * receiver in Recovery. */ | |
324 | u32 prr_out; /* Total number of pkts sent during Recovery. */ | |
ddf1af6f | 325 | u32 delivered; /* Total data packets delivered incl. rexmits */ |
e21db6f6 | 326 | u32 delivered_ce; /* Like the above but only ECE marked packets */ |
0682e690 | 327 | u32 lost; /* Total data packets lost incl. rexmits */ |
d7722e85 | 328 | u32 app_limited; /* limited until "delivered" reaches this val */ |
9a568de4 ED |
329 | u64 first_tx_mstamp; /* start of window send phase */ |
330 | u64 delivered_mstamp; /* time we reached "delivered" */ | |
eb8329e0 YC |
331 | u32 rate_delivered; /* saved rate sample: packets delivered */ |
332 | u32 rate_interval_us; /* saved rate sample: time elapsed */ | |
1da177e4 | 333 | |
3a137d20 | 334 | u32 rcv_wnd; /* Current receiver window */ |
3a137d20 | 335 | u32 write_seq; /* Tail(+1) of data held in tcp send buffer */ |
c9bee3b7 | 336 | u32 notsent_lowat; /* TCP_NOTSENT_LOWAT */ |
3a137d20 | 337 | u32 pushed_seq; /* Last pushed seq, required to talk to windows */ |
b79eeeb9 IJ |
338 | u32 lost_out; /* Lost packets */ |
339 | u32 sacked_out; /* SACK'd packets */ | |
1da177e4 | 340 | |
218af599 | 341 | struct hrtimer pacing_timer; |
5d9f4262 | 342 | struct hrtimer compressed_ack_timer; |
218af599 | 343 | |
b79eeeb9 IJ |
344 | /* from STCP, retrans queue hinting */ |
345 | struct sk_buff* lost_skb_hint; | |
b79eeeb9 | 346 | struct sk_buff *retransmit_skb_hint; |
b79eeeb9 | 347 | |
9f5afeae YW |
348 | /* OOO segments go in this rbtree. Socket lock must be held. */ |
349 | struct rb_root out_of_order_queue; | |
350 | struct sk_buff *ooo_last_skb; /* cache rb_last(out_of_order_queue) */ | |
b79eeeb9 | 351 | |
c0a788c4 | 352 | /* SACKs data, these 2 need to be together (see tcp_options_write) */ |
1da177e4 LT |
353 | struct tcp_sack_block duplicate_sack[1]; /* D-SACK block */ |
354 | struct tcp_sack_block selective_acks[4]; /* The SACKS themselves*/ | |
355 | ||
fd6dad61 | 356 | struct tcp_sack_block recv_sack_cache[4]; |
6a438bbe | 357 | |
ecb97192 NC |
358 | struct sk_buff *highest_sack; /* skb just after the highest |
359 | * skb with SACKed bit set | |
a47e5a98 IJ |
360 | * (validity guaranteed only if |
361 | * sacked_out > 0) | |
362 | */ | |
d738cd8f | 363 | |
6a438bbe | 364 | int lost_cnt_hint; |
6a438bbe | 365 | |
4b749440 | 366 | u32 prior_ssthresh; /* ssthresh saved at recovery start */ |
3a137d20 | 367 | u32 high_seq; /* snd_nxt at onset of congestion */ |
1da177e4 | 368 | |
3a137d20 | 369 | u32 retrans_stamp; /* Timestamp of the last retransmit, |
1da177e4 LT |
370 | * also used in SYN-SENT to remember stamp of |
371 | * the first SYN. */ | |
989e04c5 | 372 | u32 undo_marker; /* snd_una upon a new recovery episode. */ |
1da177e4 | 373 | int undo_retrans; /* number of undoable retransmissions. */ |
fb31c9b9 WW |
374 | u64 bytes_retrans; /* RFC4898 tcpEStatsPerfOctetsRetrans |
375 | * Total data bytes retransmitted | |
376 | */ | |
b79eeeb9 IJ |
377 | u32 total_retrans; /* Total retransmits for entire connection */ |
378 | ||
3a137d20 | 379 | u32 urg_seq; /* Seq of received urgent pointer */ |
1da177e4 LT |
380 | unsigned int keepalive_time; /* time before keep alive takes place */ |
381 | unsigned int keepalive_intvl; /* time interval between keep alive probes */ | |
1da177e4 | 382 | |
a0f82f64 | 383 | int linger2; |
1da177e4 | 384 | |
b13d8807 LB |
385 | |
386 | /* Sock_ops bpf program related variables */ | |
387 | #ifdef CONFIG_BPF | |
388 | u8 bpf_sock_ops_cb_flags; /* Control calling BPF programs | |
389 | * values defined in uapi/linux/tcp.h | |
390 | */ | |
061ff040 MKL |
391 | u8 bpf_chg_cc_inprogress:1; /* In the middle of |
392 | * bpf_setsockopt(TCP_CONGESTION), | |
393 | * it is to avoid the bpf_tcp_cc->init() | |
394 | * to recur itself by calling | |
395 | * bpf_setsockopt(TCP_CONGESTION, "itself"). | |
396 | */ | |
b13d8807 LB |
397 | #define BPF_SOCK_OPS_TEST_FLAG(TP, ARG) (TP->bpf_sock_ops_cb_flags & ARG) |
398 | #else | |
399 | #define BPF_SOCK_OPS_TEST_FLAG(TP, ARG) 0 | |
400 | #endif | |
401 | ||
32efcc06 AK |
402 | u16 timeout_rehash; /* Timeout-triggered rehash attempts */ |
403 | ||
f9af2dbb TH |
404 | u32 rcv_ooopack; /* Received out-of-order packets, for tcpinfo */ |
405 | ||
1da177e4 | 406 | /* Receiver side RTT estimation */ |
3f6c65d6 | 407 | u32 rcv_rtt_last_tsecr; |
1da177e4 | 408 | struct { |
9a568de4 ED |
409 | u32 rtt_us; |
410 | u32 seq; | |
411 | u64 time; | |
1da177e4 LT |
412 | } rcv_rtt_est; |
413 | ||
414 | /* Receiver queue space */ | |
415 | struct { | |
607065ba | 416 | u32 space; |
9a568de4 ED |
417 | u32 seq; |
418 | u64 time; | |
1da177e4 | 419 | } rcvq_space; |
0e7b1368 JH |
420 | |
421 | /* TCP-specific MTU probe information. */ | |
422 | struct { | |
3a137d20 ACM |
423 | u32 probe_seq_start; |
424 | u32 probe_seq_end; | |
0e7b1368 | 425 | } mtu_probe; |
29c1c446 | 426 | u32 plb_rehash; /* PLB-triggered rehash attempts */ |
563d34d0 ED |
427 | u32 mtu_info; /* We received an ICMP_FRAG_NEEDED / ICMPV6_PKT_TOOBIG |
428 | * while socket was owned by user. | |
429 | */ | |
2303f994 PK |
430 | #if IS_ENABLED(CONFIG_MPTCP) |
431 | bool is_mptcp; | |
432 | #endif | |
267cf9fa | 433 | #if IS_ENABLED(CONFIG_SMC) |
48b6190a | 434 | bool (*smc_hs_congested)(const struct sock *sk); |
267cf9fa MKL |
435 | bool syn_smc; /* SYN includes SMC */ |
436 | #endif | |
cfb6eeb4 YH |
437 | |
438 | #ifdef CONFIG_TCP_MD5SIG | |
439 | /* TCP AF-Specific parts; only used by MD5 Signature support so far */ | |
b2e4b3de | 440 | const struct tcp_sock_af_ops *af_specific; |
cfb6eeb4 | 441 | |
b2e4b3de | 442 | /* TCP MD5 Signature Option information */ |
a8afca03 | 443 | struct tcp_md5sig_info __rcu *md5sig_info; |
cfb6eeb4 | 444 | #endif |
435cf559 | 445 | |
10467163 JC |
446 | /* TCP fastopen related information */ |
447 | struct tcp_fastopen_request *fastopen_req; | |
448 | /* fastopen_rsk points to request_sock that resulted in this big | |
449 | * socket. Used to retransmit SYNACKs etc. | |
450 | */ | |
d983ea6f | 451 | struct request_sock __rcu *fastopen_rsk; |
70a217f1 | 452 | struct saved_syn *saved_syn; |
1da177e4 LT |
453 | }; |
454 | ||
/*
 * Bit numbers for the TSQ / deferred-work flags; enum tsq_flags holds
 * the matching (1UL << bit) masks.
 */
enum tsq_enum {
	TSQ_THROTTLED			= 0,
	TSQ_QUEUED			= 1,
	TCP_TSQ_DEFERRED		= 2, /* tcp_tasklet_func() found socket was owned */
	TCP_WRITE_TIMER_DEFERRED	= 3, /* tcp_write_timer() found socket was owned */
	TCP_DELACK_TIMER_DEFERRED	= 4, /* tcp_delack_timer() found socket was owned */
	TCP_MTU_REDUCED_DEFERRED	= 5, /* tcp_v{4|6}_err() could not call
					      * tcp_v{4|6}_mtu_reduced()
					      */
};
465 | ||
40fc3423 ED |
466 | enum tsq_flags { |
467 | TSQF_THROTTLED = (1UL << TSQ_THROTTLED), | |
468 | TSQF_QUEUED = (1UL << TSQ_QUEUED), | |
469 | TCPF_TSQ_DEFERRED = (1UL << TCP_TSQ_DEFERRED), | |
470 | TCPF_WRITE_TIMER_DEFERRED = (1UL << TCP_WRITE_TIMER_DEFERRED), | |
471 | TCPF_DELACK_TIMER_DEFERRED = (1UL << TCP_DELACK_TIMER_DEFERRED), | |
472 | TCPF_MTU_REDUCED_DEFERRED = (1UL << TCP_MTU_REDUCED_DEFERRED), | |
473 | }; | |
474 | ||
/*
 * tcp_sk - reinterpret a struct sock pointer as a struct tcp_sock.
 *
 * A plain cast; the const qualifier of @sk is dropped in the result.
 */
static inline struct tcp_sock *tcp_sk(const struct sock *sk)
{
	return (struct tcp_sock *)sk;
}
479 | ||
8feaf0c0 ACM |
480 | struct tcp_timewait_sock { |
481 | struct inet_timewait_sock tw_sk; | |
d475f090 ED |
482 | #define tw_rcv_nxt tw_sk.__tw_common.skc_tw_rcv_nxt |
483 | #define tw_snd_nxt tw_sk.__tw_common.skc_tw_snd_nxt | |
3a137d20 | 484 | u32 tw_rcv_wnd; |
ceaa1fef | 485 | u32 tw_ts_offset; |
3a137d20 | 486 | u32 tw_ts_recent; |
4fb17a60 NC |
487 | |
488 | /* The time we sent the last out-of-window ACK: */ | |
489 | u32 tw_last_oow_ack_time; | |
490 | ||
cca9bab1 | 491 | int tw_ts_recent_stamp; |
a842fe14 | 492 | u32 tw_tx_delay; |
cfb6eeb4 | 493 | #ifdef CONFIG_TCP_MD5SIG |
2397849b | 494 | struct tcp_md5sig_key *tw_md5_key; |
cfb6eeb4 | 495 | #endif |
8feaf0c0 ACM |
496 | }; |
497 | ||
/*
 * tcp_twsk - reinterpret a struct sock pointer as a tcp_timewait_sock.
 *
 * A plain cast; the const qualifier of @sk is dropped in the result.
 */
static inline struct tcp_timewait_sock *tcp_twsk(const struct sock *sk)
{
	return (struct tcp_timewait_sock *)sk;
}
502 | ||
10467163 JC |
503 | static inline bool tcp_passive_fastopen(const struct sock *sk) |
504 | { | |
d983ea6f ED |
505 | return sk->sk_state == TCP_SYN_RECV && |
506 | rcu_access_pointer(tcp_sk(sk)->fastopen_rsk) != NULL; | |
10467163 JC |
507 | } |
508 | ||
0536fcc0 | 509 | static inline void fastopen_queue_tune(struct sock *sk, int backlog) |
10467163 | 510 | { |
0536fcc0 | 511 | struct request_sock_queue *queue = &inet_csk(sk)->icsk_accept_queue; |
dbf650b6 | 512 | int somaxconn = READ_ONCE(sock_net(sk)->core.sysctl_somaxconn); |
0536fcc0 | 513 | |
dbf650b6 | 514 | queue->fastopenq.max_qlen = min_t(unsigned int, backlog, somaxconn); |
10467163 JC |
515 | } |
516 | ||
805c4bc0 ED |
517 | static inline void tcp_move_syn(struct tcp_sock *tp, |
518 | struct request_sock *req) | |
519 | { | |
520 | tp->saved_syn = req->saved_syn; | |
521 | req->saved_syn = NULL; | |
522 | } | |
523 | ||
cd8ae852 ED |
524 | static inline void tcp_saved_syn_free(struct tcp_sock *tp) |
525 | { | |
526 | kfree(tp->saved_syn); | |
527 | tp->saved_syn = NULL; | |
528 | } | |
529 | ||
70a217f1 MKL |
530 | static inline u32 tcp_saved_syn_len(const struct saved_syn *saved_syn) |
531 | { | |
267cf9fa MKL |
532 | return saved_syn->mac_hdrlen + saved_syn->network_hdrlen + |
533 | saved_syn->tcp_hdrlen; | |
70a217f1 MKL |
534 | } |
535 | ||
/* Declaration only; the definition is not part of this header. */
struct sk_buff *
tcp_get_timestamping_opt_stats(const struct sock *sk,
			       const struct sk_buff *orig_skb,
			       const struct sk_buff *ack_skb);
1c885808 | 539 | |
3541f9e8 ED |
540 | static inline u16 tcp_mss_clamp(const struct tcp_sock *tp, u16 mss) |
541 | { | |
542 | /* We use READ_ONCE() here because socket might not be locked. | |
543 | * This happens for listeners. | |
544 | */ | |
545 | u16 user_mss = READ_ONCE(tp->rx_opt.user_mss); | |
546 | ||
547 | return (user_mss && user_mss < mss) ? user_mss : mss; | |
548 | } | |
3b4929f6 ED |
549 | |
550 | int tcp_skb_shift(struct sk_buff *to, struct sk_buff *from, int pcount, | |
551 | int shiftlen); | |
552 | ||
6fadaa56 | 553 | void __tcp_sock_set_cork(struct sock *sk, bool on); |
db10538a | 554 | void tcp_sock_set_cork(struct sock *sk, bool on); |
480aeb96 | 555 | int tcp_sock_set_keepcnt(struct sock *sk, int val); |
aad4a0a9 | 556 | int tcp_sock_set_keepidle_locked(struct sock *sk, int val); |
71c48eb8 | 557 | int tcp_sock_set_keepidle(struct sock *sk, int val); |
d41ecaac | 558 | int tcp_sock_set_keepintvl(struct sock *sk, int val); |
6fadaa56 | 559 | void __tcp_sock_set_nodelay(struct sock *sk, bool on); |
12abc5ee | 560 | void tcp_sock_set_nodelay(struct sock *sk); |
ddd061b8 | 561 | void tcp_sock_set_quickack(struct sock *sk, int val); |
557eadfc | 562 | int tcp_sock_set_syncnt(struct sock *sk, int val); |
c488aead | 563 | void tcp_sock_set_user_timeout(struct sock *sk, u32 val); |
db10538a | 564 | |
1da177e4 | 565 | #endif /* _LINUX_TCP_H */ |