Commit | Line | Data |
---|---|---|
3c4d7559 DW |
1 | /* |
2 | * Copyright (c) 2016-2017, Mellanox Technologies. All rights reserved. | |
3 | * Copyright (c) 2016-2017, Dave Watson <davejwatson@fb.com>. All rights reserved. | |
4 | * Copyright (c) 2016-2017, Lance Chao <lancerchao@fb.com>. All rights reserved. | |
5 | * Copyright (c) 2016, Fridolin Pokorny <fridolin.pokorny@gmail.com>. All rights reserved. | |
6 | * Copyright (c) 2016, Nikos Mavrogiannopoulos <nmav@gnutls.org>. All rights reserved. | |
d3b18ad3 | 7 | * Copyright (c) 2018, Covalent IO, Inc. http://covalent.io |
3c4d7559 DW |
8 | * |
9 | * This software is available to you under a choice of one of two | |
10 | * licenses. You may choose to be licensed under the terms of the GNU | |
11 | * General Public License (GPL) Version 2, available from the file | |
12 | * COPYING in the main directory of this source tree, or the | |
13 | * OpenIB.org BSD license below: | |
14 | * | |
15 | * Redistribution and use in source and binary forms, with or | |
16 | * without modification, are permitted provided that the following | |
17 | * conditions are met: | |
18 | * | |
19 | * - Redistributions of source code must retain the above | |
20 | * copyright notice, this list of conditions and the following | |
21 | * disclaimer. | |
22 | * | |
23 | * - Redistributions in binary form must reproduce the above | |
24 | * copyright notice, this list of conditions and the following | |
25 | * disclaimer in the documentation and/or other materials | |
26 | * provided with the distribution. | |
27 | * | |
28 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, | |
29 | * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF | |
30 | * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND | |
31 | * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS | |
32 | * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN | |
33 | * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN | |
34 | * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE | |
35 | * SOFTWARE. | |
36 | */ | |
37 | ||
da353fac | 38 | #include <linux/bug.h> |
c46234eb | 39 | #include <linux/sched/signal.h> |
3c4d7559 | 40 | #include <linux/module.h> |
8d338c76 | 41 | #include <linux/kernel.h> |
974271e5 | 42 | #include <linux/splice.h> |
3c4d7559 DW |
43 | #include <crypto/aead.h> |
44 | ||
c46234eb | 45 | #include <net/strparser.h> |
3c4d7559 | 46 | #include <net/tls.h> |
40e0b090 | 47 | #include <trace/events/sock.h> |
3c4d7559 | 48 | |
58790314 JK |
49 | #include "tls.h" |
50 | ||
4175eac3 | 51 | struct tls_decrypt_arg { |
6bd116c8 | 52 | struct_group(inargs, |
4175eac3 JK |
53 | bool zc; |
54 | bool async; | |
13114dc5 | 55 | bool async_done; |
ce61327c | 56 | u8 tail; |
6bd116c8 JK |
57 | ); |
58 | ||
59 | struct sk_buff *skb; | |
4175eac3 JK |
60 | }; |
61 | ||
b89fec54 | 62 | struct tls_decrypt_ctx { |
8d338c76 | 63 | struct sock *sk; |
bee6b7b3 | 64 | u8 iv[TLS_MAX_IV_SIZE]; |
b89fec54 JK |
65 | u8 aad[TLS_MAX_AAD_SIZE]; |
66 | u8 tail; | |
32b55c5f | 67 | bool free_sgout; |
b89fec54 JK |
68 | struct scatterlist sg[]; |
69 | }; | |
70 | ||
da353fac DJ |
71 | noinline void tls_err_abort(struct sock *sk, int err) |
72 | { | |
73 | WARN_ON_ONCE(err >= 0); | |
74 | /* sk->sk_err should contain a positive error code. */ | |
8a0d57df JK |
75 | WRITE_ONCE(sk->sk_err, -err); |
76 | /* Paired with smp_rmb() in tcp_poll() */ | |
77 | smp_wmb(); | |
da353fac DJ |
78 | sk_error_report(sk); |
79 | } | |
80 | ||
0927f71d DRK |
81 | static int __skb_nsg(struct sk_buff *skb, int offset, int len, |
82 | unsigned int recursion_level) | |
83 | { | |
84 | int start = skb_headlen(skb); | |
85 | int i, chunk = start - offset; | |
86 | struct sk_buff *frag_iter; | |
87 | int elt = 0; | |
88 | ||
89 | if (unlikely(recursion_level >= 24)) | |
90 | return -EMSGSIZE; | |
91 | ||
92 | if (chunk > 0) { | |
93 | if (chunk > len) | |
94 | chunk = len; | |
95 | elt++; | |
96 | len -= chunk; | |
97 | if (len == 0) | |
98 | return elt; | |
99 | offset += chunk; | |
100 | } | |
101 | ||
102 | for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) { | |
103 | int end; | |
104 | ||
105 | WARN_ON(start > offset + len); | |
106 | ||
107 | end = start + skb_frag_size(&skb_shinfo(skb)->frags[i]); | |
108 | chunk = end - offset; | |
109 | if (chunk > 0) { | |
110 | if (chunk > len) | |
111 | chunk = len; | |
112 | elt++; | |
113 | len -= chunk; | |
114 | if (len == 0) | |
115 | return elt; | |
116 | offset += chunk; | |
117 | } | |
118 | start = end; | |
119 | } | |
120 | ||
121 | if (unlikely(skb_has_frag_list(skb))) { | |
122 | skb_walk_frags(skb, frag_iter) { | |
123 | int end, ret; | |
124 | ||
125 | WARN_ON(start > offset + len); | |
126 | ||
127 | end = start + frag_iter->len; | |
128 | chunk = end - offset; | |
129 | if (chunk > 0) { | |
130 | if (chunk > len) | |
131 | chunk = len; | |
132 | ret = __skb_nsg(frag_iter, offset - start, chunk, | |
133 | recursion_level + 1); | |
134 | if (unlikely(ret < 0)) | |
135 | return ret; | |
136 | elt += ret; | |
137 | len -= chunk; | |
138 | if (len == 0) | |
139 | return elt; | |
140 | offset += chunk; | |
141 | } | |
142 | start = end; | |
143 | } | |
144 | } | |
145 | BUG_ON(len); | |
146 | return elt; | |
147 | } | |
148 | ||
149 | /* Return the number of scatterlist elements required to completely map the | |
150 | * skb, or -EMSGSIZE if the recursion depth is exceeded. | |
151 | */ | |
152 | static int skb_nsg(struct sk_buff *skb, int offset, int len) | |
153 | { | |
154 | return __skb_nsg(skb, offset, len, 0); | |
155 | } | |
156 | ||
ce61327c JK |
157 | static int tls_padding_length(struct tls_prot_info *prot, struct sk_buff *skb, |
158 | struct tls_decrypt_arg *darg) | |
130b392c DW |
159 | { |
160 | struct strp_msg *rxm = strp_msg(skb); | |
c3f6bb74 | 161 | struct tls_msg *tlm = tls_msg(skb); |
130b392c DW |
162 | int sub = 0; |
163 | ||
164 | /* Determine zero-padding length */ | |
b53f4976 | 165 | if (prot->version == TLS_1_3_VERSION) { |
5deee41b | 166 | int offset = rxm->full_len - TLS_TAG_SIZE - 1; |
ce61327c | 167 | char content_type = darg->zc ? darg->tail : 0; |
130b392c | 168 | int err; |
130b392c DW |
169 | |
170 | while (content_type == 0) { | |
5deee41b | 171 | if (offset < prot->prepend_size) |
130b392c | 172 | return -EBADMSG; |
5deee41b | 173 | err = skb_copy_bits(skb, rxm->offset + offset, |
130b392c | 174 | &content_type, 1); |
b53f4976 JK |
175 | if (err) |
176 | return err; | |
130b392c DW |
177 | if (content_type) |
178 | break; | |
179 | sub++; | |
5deee41b | 180 | offset--; |
130b392c | 181 | } |
c3f6bb74 | 182 | tlm->control = content_type; |
130b392c DW |
183 | } |
184 | return sub; | |
185 | } | |
186 | ||
8580e55a | 187 | static void tls_decrypt_done(void *data, int err) |
94524d8f | 188 | { |
8580e55a | 189 | struct aead_request *aead_req = data; |
8d338c76 | 190 | struct crypto_aead *aead = crypto_aead_reqtfm(aead_req); |
94524d8f | 191 | struct scatterlist *sgout = aead_req->dst; |
7a3dd8c8 | 192 | struct tls_sw_context_rx *ctx; |
8d338c76 | 193 | struct tls_decrypt_ctx *dctx; |
7a3dd8c8 | 194 | struct tls_context *tls_ctx; |
94524d8f VG |
195 | struct scatterlist *sg; |
196 | unsigned int pages; | |
6ececdc5 | 197 | struct sock *sk; |
8d338c76 HX |
198 | int aead_size; |
199 | ||
85905414 JK |
200 | /* If requests get too backlogged crypto API returns -EBUSY and calls |
201 | * ->complete(-EINPROGRESS) immediately followed by ->complete(0) | |
202 | * to make waiting for backlog to flush with crypto_wait_req() easier. | |
203 | * First wait converts -EBUSY -> -EINPROGRESS, and the second one | |
204 | * -EINPROGRESS -> 0. | |
205 | * We have a single struct crypto_async_request per direction, this | |
206 | * scheme doesn't help us, so just ignore the first ->complete(). | |
207 | */ | |
208 | if (err == -EINPROGRESS) | |
209 | return; | |
210 | ||
8d338c76 HX |
211 | aead_size = sizeof(*aead_req) + crypto_aead_reqsize(aead); |
212 | aead_size = ALIGN(aead_size, __alignof__(*dctx)); | |
213 | dctx = (void *)((u8 *)aead_req + aead_size); | |
7a3dd8c8 | 214 | |
8d338c76 | 215 | sk = dctx->sk; |
6ececdc5 | 216 | tls_ctx = tls_get_ctx(sk); |
7a3dd8c8 | 217 | ctx = tls_sw_ctx_rx(tls_ctx); |
94524d8f VG |
218 | |
219 | /* Propagate if there was an err */ | |
220 | if (err) { | |
5c5ec668 | 221 | if (err == -EBADMSG) |
6ececdc5 | 222 | TLS_INC_STATS(sock_net(sk), LINUX_MIB_TLSDECRYPTERROR); |
94524d8f | 223 | ctx->async_wait.err = err; |
6ececdc5 | 224 | tls_err_abort(sk, err); |
94524d8f VG |
225 | } |
226 | ||
692d7b5d | 227 | /* Free the destination pages if skb was not decrypted inplace */ |
32b55c5f | 228 | if (dctx->free_sgout) { |
692d7b5d VG |
229 | /* Skip the first S/G entry as it points to AAD */ |
230 | for_each_sg(sg_next(sgout), sg, UINT_MAX, pages) { | |
231 | if (!sg) | |
232 | break; | |
233 | put_page(sg_page(sg)); | |
234 | } | |
94524d8f VG |
235 | } |
236 | ||
237 | kfree(aead_req); | |
238 | ||
aec79619 | 239 | if (atomic_dec_and_test(&ctx->decrypt_pending)) |
94524d8f VG |
240 | complete(&ctx->async_wait.completion); |
241 | } | |
242 | ||
c57ca512 JK |
243 | static int tls_decrypt_async_wait(struct tls_sw_context_rx *ctx) |
244 | { | |
aec79619 | 245 | if (!atomic_dec_and_test(&ctx->decrypt_pending)) |
c57ca512 | 246 | crypto_wait_req(-EINPROGRESS, &ctx->async_wait); |
aec79619 | 247 | atomic_inc(&ctx->decrypt_pending); |
c57ca512 JK |
248 | |
249 | return ctx->async_wait.err; | |
250 | } | |
251 | ||
c46234eb DW |
252 | static int tls_do_decryption(struct sock *sk, |
253 | struct scatterlist *sgin, | |
254 | struct scatterlist *sgout, | |
255 | char *iv_recv, | |
256 | size_t data_len, | |
94524d8f | 257 | struct aead_request *aead_req, |
3547a1f9 | 258 | struct tls_decrypt_arg *darg) |
c46234eb DW |
259 | { |
260 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
4509de14 | 261 | struct tls_prot_info *prot = &tls_ctx->prot_info; |
f66de3ee | 262 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); |
c46234eb | 263 | int ret; |
c46234eb | 264 | |
0b243d00 | 265 | aead_request_set_tfm(aead_req, ctx->aead_recv); |
4509de14 | 266 | aead_request_set_ad(aead_req, prot->aad_size); |
c46234eb | 267 | aead_request_set_crypt(aead_req, sgin, sgout, |
4509de14 | 268 | data_len + prot->tag_size, |
c46234eb | 269 | (u8 *)iv_recv); |
c46234eb | 270 | |
3547a1f9 | 271 | if (darg->async) { |
94524d8f VG |
272 | aead_request_set_callback(aead_req, |
273 | CRYPTO_TFM_REQ_MAY_BACKLOG, | |
8d338c76 | 274 | tls_decrypt_done, aead_req); |
aec79619 | 275 | DEBUG_NET_WARN_ON_ONCE(atomic_read(&ctx->decrypt_pending) < 1); |
94524d8f VG |
276 | atomic_inc(&ctx->decrypt_pending); |
277 | } else { | |
41532b78 SD |
278 | DECLARE_CRYPTO_WAIT(wait); |
279 | ||
94524d8f VG |
280 | aead_request_set_callback(aead_req, |
281 | CRYPTO_TFM_REQ_MAY_BACKLOG, | |
41532b78 SD |
282 | crypto_req_done, &wait); |
283 | ret = crypto_aead_decrypt(aead_req); | |
284 | if (ret == -EINPROGRESS || ret == -EBUSY) | |
285 | ret = crypto_wait_req(ret, &wait); | |
286 | return ret; | |
94524d8f VG |
287 | } |
288 | ||
289 | ret = crypto_aead_decrypt(aead_req); | |
13114dc5 SD |
290 | if (ret == -EINPROGRESS) |
291 | return 0; | |
292 | ||
85905414 JK |
293 | if (ret == -EBUSY) { |
294 | ret = tls_decrypt_async_wait(ctx); | |
13114dc5 SD |
295 | darg->async_done = true; |
296 | /* all completions have run, we're not doing async anymore */ | |
297 | darg->async = false; | |
298 | return ret; | |
94524d8f | 299 | } |
13114dc5 SD |
300 | |
301 | atomic_dec(&ctx->decrypt_pending); | |
3547a1f9 JK |
302 | darg->async = false; |
303 | ||
c46234eb DW |
304 | return ret; |
305 | } | |
306 | ||
d829e9c4 | 307 | static void tls_trim_both_msgs(struct sock *sk, int target_size) |
3c4d7559 DW |
308 | { |
309 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
4509de14 | 310 | struct tls_prot_info *prot = &tls_ctx->prot_info; |
f66de3ee | 311 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); |
a42055e8 | 312 | struct tls_rec *rec = ctx->open_rec; |
3c4d7559 | 313 | |
d829e9c4 | 314 | sk_msg_trim(sk, &rec->msg_plaintext, target_size); |
3c4d7559 | 315 | if (target_size > 0) |
4509de14 | 316 | target_size += prot->overhead_size; |
d829e9c4 | 317 | sk_msg_trim(sk, &rec->msg_encrypted, target_size); |
3c4d7559 DW |
318 | } |
319 | ||
d829e9c4 | 320 | static int tls_alloc_encrypted_msg(struct sock *sk, int len) |
3c4d7559 DW |
321 | { |
322 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
f66de3ee | 323 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); |
a42055e8 | 324 | struct tls_rec *rec = ctx->open_rec; |
d829e9c4 | 325 | struct sk_msg *msg_en = &rec->msg_encrypted; |
3c4d7559 | 326 | |
d829e9c4 | 327 | return sk_msg_alloc(sk, msg_en, len, 0); |
3c4d7559 DW |
328 | } |
329 | ||
d829e9c4 | 330 | static int tls_clone_plaintext_msg(struct sock *sk, int required) |
3c4d7559 DW |
331 | { |
332 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
4509de14 | 333 | struct tls_prot_info *prot = &tls_ctx->prot_info; |
f66de3ee | 334 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); |
a42055e8 | 335 | struct tls_rec *rec = ctx->open_rec; |
d829e9c4 DB |
336 | struct sk_msg *msg_pl = &rec->msg_plaintext; |
337 | struct sk_msg *msg_en = &rec->msg_encrypted; | |
4e6d4720 | 338 | int skip, len; |
3c4d7559 | 339 | |
d829e9c4 DB |
340 | /* We add page references worth len bytes from encrypted sg |
341 | * at the end of plaintext sg. It is guaranteed that msg_en | |
4e6d4720 VG |
342 | * has enough required room (ensured by caller). |
343 | */ | |
d829e9c4 | 344 | len = required - msg_pl->sg.size; |
52ea992c | 345 | |
d829e9c4 DB |
346 | /* Skip initial bytes in msg_en's data to be able to use |
347 | * same offset of both plain and encrypted data. | |
4e6d4720 | 348 | */ |
4509de14 | 349 | skip = prot->prepend_size + msg_pl->sg.size; |
4e6d4720 | 350 | |
d829e9c4 | 351 | return sk_msg_clone(sk, msg_pl, msg_en, skip, len); |
3c4d7559 DW |
352 | } |
353 | ||
d3b18ad3 | 354 | static struct tls_rec *tls_get_rec(struct sock *sk) |
3c4d7559 DW |
355 | { |
356 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
4509de14 | 357 | struct tls_prot_info *prot = &tls_ctx->prot_info; |
f66de3ee | 358 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); |
d3b18ad3 JF |
359 | struct sk_msg *msg_pl, *msg_en; |
360 | struct tls_rec *rec; | |
361 | int mem_size; | |
3c4d7559 | 362 | |
d3b18ad3 JF |
363 | mem_size = sizeof(struct tls_rec) + crypto_aead_reqsize(ctx->aead_send); |
364 | ||
365 | rec = kzalloc(mem_size, sk->sk_allocation); | |
a42055e8 | 366 | if (!rec) |
d3b18ad3 JF |
367 | return NULL; |
368 | ||
369 | msg_pl = &rec->msg_plaintext; | |
370 | msg_en = &rec->msg_encrypted; | |
371 | ||
372 | sk_msg_init(msg_pl); | |
373 | sk_msg_init(msg_en); | |
374 | ||
375 | sg_init_table(rec->sg_aead_in, 2); | |
4509de14 | 376 | sg_set_buf(&rec->sg_aead_in[0], rec->aad_space, prot->aad_size); |
d3b18ad3 JF |
377 | sg_unmark_end(&rec->sg_aead_in[1]); |
378 | ||
379 | sg_init_table(rec->sg_aead_out, 2); | |
4509de14 | 380 | sg_set_buf(&rec->sg_aead_out[0], rec->aad_space, prot->aad_size); |
d3b18ad3 JF |
381 | sg_unmark_end(&rec->sg_aead_out[1]); |
382 | ||
8d338c76 HX |
383 | rec->sk = sk; |
384 | ||
d3b18ad3 JF |
385 | return rec; |
386 | } | |
a42055e8 | 387 | |
d3b18ad3 JF |
388 | static void tls_free_rec(struct sock *sk, struct tls_rec *rec) |
389 | { | |
d829e9c4 DB |
390 | sk_msg_free(sk, &rec->msg_encrypted); |
391 | sk_msg_free(sk, &rec->msg_plaintext); | |
c774973e | 392 | kfree(rec); |
a42055e8 VG |
393 | } |
394 | ||
d3b18ad3 JF |
395 | static void tls_free_open_rec(struct sock *sk) |
396 | { | |
397 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
398 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); | |
399 | struct tls_rec *rec = ctx->open_rec; | |
400 | ||
401 | if (rec) { | |
402 | tls_free_rec(sk, rec); | |
403 | ctx->open_rec = NULL; | |
404 | } | |
405 | } | |
406 | ||
a42055e8 VG |
407 | int tls_tx_records(struct sock *sk, int flags) |
408 | { | |
409 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
410 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); | |
411 | struct tls_rec *rec, *tmp; | |
d829e9c4 | 412 | struct sk_msg *msg_en; |
a42055e8 VG |
413 | int tx_flags, rc = 0; |
414 | ||
415 | if (tls_is_partially_sent_record(tls_ctx)) { | |
9932a29a | 416 | rec = list_first_entry(&ctx->tx_list, |
a42055e8 VG |
417 | struct tls_rec, list); |
418 | ||
419 | if (flags == -1) | |
420 | tx_flags = rec->tx_flags; | |
421 | else | |
422 | tx_flags = flags; | |
423 | ||
424 | rc = tls_push_partial_record(sk, tls_ctx, tx_flags); | |
425 | if (rc) | |
426 | goto tx_err; | |
427 | ||
428 | /* Full record has been transmitted. | |
9932a29a | 429 | * Remove the head of tx_list |
a42055e8 | 430 | */ |
a42055e8 | 431 | list_del(&rec->list); |
d829e9c4 | 432 | sk_msg_free(sk, &rec->msg_plaintext); |
a42055e8 VG |
433 | kfree(rec); |
434 | } | |
435 | ||
9932a29a VG |
436 | /* Tx all ready records */ |
437 | list_for_each_entry_safe(rec, tmp, &ctx->tx_list, list) { | |
438 | if (READ_ONCE(rec->tx_ready)) { | |
a42055e8 VG |
439 | if (flags == -1) |
440 | tx_flags = rec->tx_flags; | |
441 | else | |
442 | tx_flags = flags; | |
443 | ||
d829e9c4 | 444 | msg_en = &rec->msg_encrypted; |
a42055e8 | 445 | rc = tls_push_sg(sk, tls_ctx, |
d829e9c4 | 446 | &msg_en->sg.data[msg_en->sg.curr], |
a42055e8 VG |
447 | 0, tx_flags); |
448 | if (rc) | |
449 | goto tx_err; | |
450 | ||
a42055e8 | 451 | list_del(&rec->list); |
d829e9c4 | 452 | sk_msg_free(sk, &rec->msg_plaintext); |
a42055e8 VG |
453 | kfree(rec); |
454 | } else { | |
455 | break; | |
456 | } | |
457 | } | |
458 | ||
459 | tx_err: | |
460 | if (rc < 0 && rc != -EAGAIN) | |
da353fac | 461 | tls_err_abort(sk, -EBADMSG); |
a42055e8 VG |
462 | |
463 | return rc; | |
464 | } | |
465 | ||
8580e55a | 466 | static void tls_encrypt_done(void *data, int err) |
a42055e8 | 467 | { |
8d338c76 HX |
468 | struct tls_sw_context_tx *ctx; |
469 | struct tls_context *tls_ctx; | |
470 | struct tls_prot_info *prot; | |
d3777cea | 471 | struct tls_rec *rec = data; |
d829e9c4 DB |
472 | struct scatterlist *sge; |
473 | struct sk_msg *msg_en; | |
8d338c76 | 474 | struct sock *sk; |
a42055e8 | 475 | |
85905414 JK |
476 | if (err == -EINPROGRESS) /* see the comment in tls_decrypt_done() */ |
477 | return; | |
478 | ||
d829e9c4 | 479 | msg_en = &rec->msg_encrypted; |
a42055e8 | 480 | |
8d338c76 HX |
481 | sk = rec->sk; |
482 | tls_ctx = tls_get_ctx(sk); | |
483 | prot = &tls_ctx->prot_info; | |
484 | ctx = tls_sw_ctx_tx(tls_ctx); | |
485 | ||
d829e9c4 | 486 | sge = sk_msg_elem(msg_en, msg_en->sg.curr); |
4509de14 VG |
487 | sge->offset -= prot->prepend_size; |
488 | sge->length += prot->prepend_size; | |
a42055e8 | 489 | |
80ece6a0 | 490 | /* Check if error is previously set on socket */ |
a42055e8 | 491 | if (err || sk->sk_err) { |
a42055e8 VG |
492 | rec = NULL; |
493 | ||
494 | /* If err is already set on socket, return the same code */ | |
495 | if (sk->sk_err) { | |
1d9d6fd2 | 496 | ctx->async_wait.err = -sk->sk_err; |
a42055e8 VG |
497 | } else { |
498 | ctx->async_wait.err = err; | |
499 | tls_err_abort(sk, err); | |
500 | } | |
501 | } | |
502 | ||
9932a29a VG |
503 | if (rec) { |
504 | struct tls_rec *first_rec; | |
505 | ||
506 | /* Mark the record as ready for transmission */ | |
507 | smp_store_mb(rec->tx_ready, true); | |
508 | ||
509 | /* If received record is at head of tx_list, schedule tx */ | |
510 | first_rec = list_first_entry(&ctx->tx_list, | |
511 | struct tls_rec, list); | |
e01e3934 JK |
512 | if (rec == first_rec) { |
513 | /* Schedule the transmission */ | |
514 | if (!test_and_set_bit(BIT_TX_SCHEDULED, | |
515 | &ctx->tx_bitmask)) | |
516 | schedule_delayed_work(&ctx->tx_work.work, 1); | |
517 | } | |
9932a29a | 518 | } |
a42055e8 | 519 | |
aec79619 | 520 | if (atomic_dec_and_test(&ctx->encrypt_pending)) |
a42055e8 | 521 | complete(&ctx->async_wait.completion); |
3c4d7559 DW |
522 | } |
523 | ||
c57ca512 JK |
524 | static int tls_encrypt_async_wait(struct tls_sw_context_tx *ctx) |
525 | { | |
aec79619 | 526 | if (!atomic_dec_and_test(&ctx->encrypt_pending)) |
c57ca512 | 527 | crypto_wait_req(-EINPROGRESS, &ctx->async_wait); |
aec79619 | 528 | atomic_inc(&ctx->encrypt_pending); |
c57ca512 JK |
529 | |
530 | return ctx->async_wait.err; | |
531 | } | |
532 | ||
a42055e8 VG |
533 | static int tls_do_encryption(struct sock *sk, |
534 | struct tls_context *tls_ctx, | |
a447da7d DB |
535 | struct tls_sw_context_tx *ctx, |
536 | struct aead_request *aead_req, | |
d829e9c4 | 537 | size_t data_len, u32 start) |
3c4d7559 | 538 | { |
4509de14 | 539 | struct tls_prot_info *prot = &tls_ctx->prot_info; |
a42055e8 | 540 | struct tls_rec *rec = ctx->open_rec; |
d829e9c4 DB |
541 | struct sk_msg *msg_en = &rec->msg_encrypted; |
542 | struct scatterlist *sge = sk_msg_elem(msg_en, start); | |
f295b3ae VG |
543 | int rc, iv_offset = 0; |
544 | ||
545 | /* For CCM based ciphers, first byte of IV is a constant */ | |
128cfb88 TZ |
546 | switch (prot->cipher_type) { |
547 | case TLS_CIPHER_AES_CCM_128: | |
f295b3ae VG |
548 | rec->iv_data[0] = TLS_AES_CCM_IV_B0_BYTE; |
549 | iv_offset = 1; | |
128cfb88 TZ |
550 | break; |
551 | case TLS_CIPHER_SM4_CCM: | |
552 | rec->iv_data[0] = TLS_SM4_CCM_IV_B0_BYTE; | |
553 | iv_offset = 1; | |
554 | break; | |
f295b3ae VG |
555 | } |
556 | ||
557 | memcpy(&rec->iv_data[iv_offset], tls_ctx->tx.iv, | |
558 | prot->iv_size + prot->salt_size); | |
3c4d7559 | 559 | |
58790314 JK |
560 | tls_xor_iv_with_seq(prot, rec->iv_data + iv_offset, |
561 | tls_ctx->tx.rec_seq); | |
32eb67b9 | 562 | |
4509de14 VG |
563 | sge->offset += prot->prepend_size; |
564 | sge->length -= prot->prepend_size; | |
3c4d7559 | 565 | |
d829e9c4 | 566 | msg_en->sg.curr = start; |
4e6d4720 | 567 | |
3c4d7559 | 568 | aead_request_set_tfm(aead_req, ctx->aead_send); |
4509de14 | 569 | aead_request_set_ad(aead_req, prot->aad_size); |
d829e9c4 DB |
570 | aead_request_set_crypt(aead_req, rec->sg_aead_in, |
571 | rec->sg_aead_out, | |
32eb67b9 | 572 | data_len, rec->iv_data); |
a54667f6 VG |
573 | |
574 | aead_request_set_callback(aead_req, CRYPTO_TFM_REQ_MAY_BACKLOG, | |
d3777cea | 575 | tls_encrypt_done, rec); |
a42055e8 | 576 | |
9932a29a VG |
577 | /* Add the record in tx_list */ |
578 | list_add_tail((struct list_head *)&rec->list, &ctx->tx_list); | |
aec79619 | 579 | DEBUG_NET_WARN_ON_ONCE(atomic_read(&ctx->encrypt_pending) < 1); |
a42055e8 | 580 | atomic_inc(&ctx->encrypt_pending); |
a54667f6 | 581 | |
a42055e8 | 582 | rc = crypto_aead_encrypt(aead_req); |
85905414 JK |
583 | if (rc == -EBUSY) { |
584 | rc = tls_encrypt_async_wait(ctx); | |
585 | rc = rc ?: -EINPROGRESS; | |
586 | } | |
a42055e8 VG |
587 | if (!rc || rc != -EINPROGRESS) { |
588 | atomic_dec(&ctx->encrypt_pending); | |
4509de14 VG |
589 | sge->offset -= prot->prepend_size; |
590 | sge->length += prot->prepend_size; | |
a42055e8 | 591 | } |
3c4d7559 | 592 | |
9932a29a VG |
593 | if (!rc) { |
594 | WRITE_ONCE(rec->tx_ready, true); | |
595 | } else if (rc != -EINPROGRESS) { | |
596 | list_del(&rec->list); | |
a42055e8 | 597 | return rc; |
9932a29a | 598 | } |
3c4d7559 | 599 | |
a42055e8 VG |
600 | /* Unhook the record from context if encryption is not failure */ |
601 | ctx->open_rec = NULL; | |
fb0f886f | 602 | tls_advance_record_sn(sk, prot, &tls_ctx->tx); |
3c4d7559 DW |
603 | return rc; |
604 | } | |
605 | ||
d3b18ad3 JF |
606 | static int tls_split_open_record(struct sock *sk, struct tls_rec *from, |
607 | struct tls_rec **to, struct sk_msg *msg_opl, | |
608 | struct sk_msg *msg_oen, u32 split_point, | |
609 | u32 tx_overhead_size, u32 *orig_end) | |
610 | { | |
611 | u32 i, j, bytes = 0, apply = msg_opl->apply_bytes; | |
612 | struct scatterlist *sge, *osge, *nsge; | |
613 | u32 orig_size = msg_opl->sg.size; | |
614 | struct scatterlist tmp = { }; | |
615 | struct sk_msg *msg_npl; | |
616 | struct tls_rec *new; | |
617 | int ret; | |
618 | ||
619 | new = tls_get_rec(sk); | |
620 | if (!new) | |
621 | return -ENOMEM; | |
622 | ret = sk_msg_alloc(sk, &new->msg_encrypted, msg_opl->sg.size + | |
623 | tx_overhead_size, 0); | |
624 | if (ret < 0) { | |
625 | tls_free_rec(sk, new); | |
626 | return ret; | |
627 | } | |
628 | ||
629 | *orig_end = msg_opl->sg.end; | |
630 | i = msg_opl->sg.start; | |
631 | sge = sk_msg_elem(msg_opl, i); | |
632 | while (apply && sge->length) { | |
633 | if (sge->length > apply) { | |
634 | u32 len = sge->length - apply; | |
635 | ||
636 | get_page(sg_page(sge)); | |
637 | sg_set_page(&tmp, sg_page(sge), len, | |
638 | sge->offset + apply); | |
639 | sge->length = apply; | |
640 | bytes += apply; | |
641 | apply = 0; | |
642 | } else { | |
643 | apply -= sge->length; | |
644 | bytes += sge->length; | |
645 | } | |
646 | ||
647 | sk_msg_iter_var_next(i); | |
648 | if (i == msg_opl->sg.end) | |
649 | break; | |
650 | sge = sk_msg_elem(msg_opl, i); | |
651 | } | |
652 | ||
653 | msg_opl->sg.end = i; | |
654 | msg_opl->sg.curr = i; | |
655 | msg_opl->sg.copybreak = 0; | |
656 | msg_opl->apply_bytes = 0; | |
657 | msg_opl->sg.size = bytes; | |
658 | ||
659 | msg_npl = &new->msg_plaintext; | |
660 | msg_npl->apply_bytes = apply; | |
661 | msg_npl->sg.size = orig_size - bytes; | |
662 | ||
663 | j = msg_npl->sg.start; | |
664 | nsge = sk_msg_elem(msg_npl, j); | |
665 | if (tmp.length) { | |
666 | memcpy(nsge, &tmp, sizeof(*nsge)); | |
667 | sk_msg_iter_var_next(j); | |
668 | nsge = sk_msg_elem(msg_npl, j); | |
669 | } | |
670 | ||
671 | osge = sk_msg_elem(msg_opl, i); | |
672 | while (osge->length) { | |
673 | memcpy(nsge, osge, sizeof(*nsge)); | |
674 | sg_unmark_end(nsge); | |
675 | sk_msg_iter_var_next(i); | |
676 | sk_msg_iter_var_next(j); | |
677 | if (i == *orig_end) | |
678 | break; | |
679 | osge = sk_msg_elem(msg_opl, i); | |
680 | nsge = sk_msg_elem(msg_npl, j); | |
681 | } | |
682 | ||
683 | msg_npl->sg.end = j; | |
684 | msg_npl->sg.curr = j; | |
685 | msg_npl->sg.copybreak = 0; | |
686 | ||
687 | *to = new; | |
688 | return 0; | |
689 | } | |
690 | ||
691 | static void tls_merge_open_record(struct sock *sk, struct tls_rec *to, | |
692 | struct tls_rec *from, u32 orig_end) | |
693 | { | |
694 | struct sk_msg *msg_npl = &from->msg_plaintext; | |
695 | struct sk_msg *msg_opl = &to->msg_plaintext; | |
696 | struct scatterlist *osge, *nsge; | |
697 | u32 i, j; | |
698 | ||
699 | i = msg_opl->sg.end; | |
700 | sk_msg_iter_var_prev(i); | |
701 | j = msg_npl->sg.start; | |
702 | ||
703 | osge = sk_msg_elem(msg_opl, i); | |
704 | nsge = sk_msg_elem(msg_npl, j); | |
705 | ||
706 | if (sg_page(osge) == sg_page(nsge) && | |
707 | osge->offset + osge->length == nsge->offset) { | |
708 | osge->length += nsge->length; | |
709 | put_page(sg_page(nsge)); | |
710 | } | |
711 | ||
712 | msg_opl->sg.end = orig_end; | |
713 | msg_opl->sg.curr = orig_end; | |
714 | msg_opl->sg.copybreak = 0; | |
715 | msg_opl->apply_bytes = msg_opl->sg.size + msg_npl->sg.size; | |
716 | msg_opl->sg.size += msg_npl->sg.size; | |
717 | ||
718 | sk_msg_free(sk, &to->msg_encrypted); | |
719 | sk_msg_xfer_full(&to->msg_encrypted, &from->msg_encrypted); | |
720 | ||
721 | kfree(from); | |
722 | } | |
723 | ||
3c4d7559 DW |
724 | static int tls_push_record(struct sock *sk, int flags, |
725 | unsigned char record_type) | |
726 | { | |
727 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
4509de14 | 728 | struct tls_prot_info *prot = &tls_ctx->prot_info; |
f66de3ee | 729 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); |
d3b18ad3 | 730 | struct tls_rec *rec = ctx->open_rec, *tmp = NULL; |
3f649ab7 | 731 | u32 i, split_point, orig_end; |
d829e9c4 | 732 | struct sk_msg *msg_pl, *msg_en; |
a447da7d | 733 | struct aead_request *req; |
d3b18ad3 | 734 | bool split; |
3c4d7559 DW |
735 | int rc; |
736 | ||
a42055e8 VG |
737 | if (!rec) |
738 | return 0; | |
a447da7d | 739 | |
d829e9c4 DB |
740 | msg_pl = &rec->msg_plaintext; |
741 | msg_en = &rec->msg_encrypted; | |
742 | ||
d3b18ad3 JF |
743 | split_point = msg_pl->apply_bytes; |
744 | split = split_point && split_point < msg_pl->sg.size; | |
d468e477 JF |
745 | if (unlikely((!split && |
746 | msg_pl->sg.size + | |
747 | prot->overhead_size > msg_en->sg.size) || | |
748 | (split && | |
749 | split_point + | |
750 | prot->overhead_size > msg_en->sg.size))) { | |
751 | split = true; | |
752 | split_point = msg_en->sg.size; | |
753 | } | |
d3b18ad3 JF |
754 | if (split) { |
755 | rc = tls_split_open_record(sk, rec, &tmp, msg_pl, msg_en, | |
4509de14 | 756 | split_point, prot->overhead_size, |
d3b18ad3 JF |
757 | &orig_end); |
758 | if (rc < 0) | |
759 | return rc; | |
d468e477 JF |
760 | /* This can happen if above tls_split_open_record allocates |
761 | * a single large encryption buffer instead of two smaller | |
762 | * ones. In this case adjust pointers and continue without | |
763 | * split. | |
764 | */ | |
765 | if (!msg_pl->sg.size) { | |
766 | tls_merge_open_record(sk, rec, tmp, orig_end); | |
767 | msg_pl = &rec->msg_plaintext; | |
768 | msg_en = &rec->msg_encrypted; | |
769 | split = false; | |
770 | } | |
d3b18ad3 | 771 | sk_msg_trim(sk, msg_en, msg_pl->sg.size + |
4509de14 | 772 | prot->overhead_size); |
d3b18ad3 JF |
773 | } |
774 | ||
a42055e8 VG |
775 | rec->tx_flags = flags; |
776 | req = &rec->aead_req; | |
3c4d7559 | 777 | |
d829e9c4 DB |
778 | i = msg_pl->sg.end; |
779 | sk_msg_iter_var_prev(i); | |
130b392c DW |
780 | |
781 | rec->content_type = record_type; | |
4509de14 | 782 | if (prot->version == TLS_1_3_VERSION) { |
130b392c DW |
783 | /* Add content type to end of message. No padding added */ |
784 | sg_set_buf(&rec->sg_content_type, &rec->content_type, 1); | |
785 | sg_mark_end(&rec->sg_content_type); | |
786 | sg_chain(msg_pl->sg.data, msg_pl->sg.end + 1, | |
787 | &rec->sg_content_type); | |
788 | } else { | |
789 | sg_mark_end(sk_msg_elem(msg_pl, i)); | |
790 | } | |
a42055e8 | 791 | |
9aaaa568 JF |
792 | if (msg_pl->sg.end < msg_pl->sg.start) { |
793 | sg_chain(&msg_pl->sg.data[msg_pl->sg.start], | |
794 | MAX_SKB_FRAGS - msg_pl->sg.start + 1, | |
795 | msg_pl->sg.data); | |
796 | } | |
797 | ||
d829e9c4 | 798 | i = msg_pl->sg.start; |
9e5ffed3 | 799 | sg_chain(rec->sg_aead_in, 2, &msg_pl->sg.data[i]); |
d829e9c4 DB |
800 | |
801 | i = msg_en->sg.end; | |
802 | sk_msg_iter_var_prev(i); | |
803 | sg_mark_end(sk_msg_elem(msg_en, i)); | |
804 | ||
805 | i = msg_en->sg.start; | |
806 | sg_chain(rec->sg_aead_out, 2, &msg_en->sg.data[i]); | |
807 | ||
4509de14 | 808 | tls_make_aad(rec->aad_space, msg_pl->sg.size + prot->tail_size, |
6942a284 | 809 | tls_ctx->tx.rec_seq, record_type, prot); |
3c4d7559 DW |
810 | |
811 | tls_fill_prepend(tls_ctx, | |
d829e9c4 | 812 | page_address(sg_page(&msg_en->sg.data[i])) + |
130b392c | 813 | msg_en->sg.data[i].offset, |
4509de14 | 814 | msg_pl->sg.size + prot->tail_size, |
6942a284 | 815 | record_type); |
3c4d7559 | 816 | |
d829e9c4 | 817 | tls_ctx->pending_open_record_frags = false; |
3c4d7559 | 818 | |
130b392c | 819 | rc = tls_do_encryption(sk, tls_ctx, ctx, req, |
4509de14 | 820 | msg_pl->sg.size + prot->tail_size, i); |
a42055e8 | 821 | if (rc < 0) { |
d3b18ad3 | 822 | if (rc != -EINPROGRESS) { |
da353fac | 823 | tls_err_abort(sk, -EBADMSG); |
d3b18ad3 JF |
824 | if (split) { |
825 | tls_ctx->pending_open_record_frags = true; | |
826 | tls_merge_open_record(sk, rec, tmp, orig_end); | |
827 | } | |
828 | } | |
5b053e12 | 829 | ctx->async_capable = 1; |
a42055e8 | 830 | return rc; |
d3b18ad3 JF |
831 | } else if (split) { |
832 | msg_pl = &tmp->msg_plaintext; | |
833 | msg_en = &tmp->msg_encrypted; | |
4509de14 | 834 | sk_msg_trim(sk, msg_en, msg_pl->sg.size + prot->overhead_size); |
d3b18ad3 JF |
835 | tls_ctx->pending_open_record_frags = true; |
836 | ctx->open_rec = tmp; | |
a42055e8 | 837 | } |
3c4d7559 | 838 | |
9932a29a | 839 | return tls_tx_records(sk, flags); |
3c4d7559 DW |
840 | } |
841 | ||
d3b18ad3 JF |
842 | static int bpf_exec_tx_verdict(struct sk_msg *msg, struct sock *sk, |
843 | bool full_record, u8 record_type, | |
a7bff11f | 844 | ssize_t *copied, int flags) |
3c4d7559 DW |
845 | { |
846 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
f66de3ee | 847 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); |
d3b18ad3 JF |
848 | struct sk_msg msg_redir = { }; |
849 | struct sk_psock *psock; | |
850 | struct sock *sk_redir; | |
a42055e8 | 851 | struct tls_rec *rec; |
a351d608 | 852 | bool enospc, policy, redir_ingress; |
d3b18ad3 | 853 | int err = 0, send; |
7246d8ed | 854 | u32 delta = 0; |
d3b18ad3 | 855 | |
0608c69c | 856 | policy = !(flags & MSG_SENDPAGE_NOPOLICY); |
d3b18ad3 | 857 | psock = sk_psock_get(sk); |
d10523d0 JK |
858 | if (!psock || !policy) { |
859 | err = tls_push_record(sk, flags, record_type); | |
cfaa80c9 | 860 | if (err && err != -EINPROGRESS && sk->sk_err == EBADMSG) { |
d10523d0 JK |
861 | *copied -= sk_msg_free(sk, msg); |
862 | tls_free_open_rec(sk); | |
635d9398 | 863 | err = -sk->sk_err; |
d10523d0 | 864 | } |
095f5614 XY |
865 | if (psock) |
866 | sk_psock_put(sk, psock); | |
d10523d0 JK |
867 | return err; |
868 | } | |
d3b18ad3 JF |
869 | more_data: |
870 | enospc = sk_msg_full(msg); | |
7246d8ed JF |
871 | if (psock->eval == __SK_NONE) { |
872 | delta = msg->sg.size; | |
d3b18ad3 | 873 | psock->eval = sk_psock_msg_verdict(sk, psock, msg); |
7361d448 | 874 | delta -= msg->sg.size; |
7246d8ed | 875 | } |
d3b18ad3 JF |
876 | if (msg->cork_bytes && msg->cork_bytes > msg->sg.size && |
877 | !enospc && !full_record) { | |
878 | err = -ENOSPC; | |
879 | goto out_err; | |
880 | } | |
881 | msg->cork_bytes = 0; | |
882 | send = msg->sg.size; | |
883 | if (msg->apply_bytes && msg->apply_bytes < send) | |
884 | send = msg->apply_bytes; | |
885 | ||
886 | switch (psock->eval) { | |
887 | case __SK_PASS: | |
888 | err = tls_push_record(sk, flags, record_type); | |
cfaa80c9 | 889 | if (err && err != -EINPROGRESS && sk->sk_err == EBADMSG) { |
d3b18ad3 JF |
890 | *copied -= sk_msg_free(sk, msg); |
891 | tls_free_open_rec(sk); | |
635d9398 | 892 | err = -sk->sk_err; |
d3b18ad3 JF |
893 | goto out_err; |
894 | } | |
895 | break; | |
896 | case __SK_REDIRECT: | |
a351d608 | 897 | redir_ingress = psock->redir_ingress; |
d3b18ad3 JF |
898 | sk_redir = psock->sk_redir; |
899 | memcpy(&msg_redir, msg, sizeof(*msg)); | |
900 | if (msg->apply_bytes < send) | |
901 | msg->apply_bytes = 0; | |
902 | else | |
903 | msg->apply_bytes -= send; | |
904 | sk_msg_return_zero(sk, msg, send); | |
905 | msg->sg.size -= send; | |
906 | release_sock(sk); | |
a351d608 PY |
907 | err = tcp_bpf_sendmsg_redir(sk_redir, redir_ingress, |
908 | &msg_redir, send, flags); | |
d3b18ad3 JF |
909 | lock_sock(sk); |
910 | if (err < 0) { | |
911 | *copied -= sk_msg_free_nocharge(sk, &msg_redir); | |
912 | msg->sg.size = 0; | |
913 | } | |
914 | if (msg->sg.size == 0) | |
915 | tls_free_open_rec(sk); | |
916 | break; | |
917 | case __SK_DROP: | |
918 | default: | |
919 | sk_msg_free_partial(sk, msg, send); | |
920 | if (msg->apply_bytes < send) | |
921 | msg->apply_bytes = 0; | |
922 | else | |
923 | msg->apply_bytes -= send; | |
924 | if (msg->sg.size == 0) | |
925 | tls_free_open_rec(sk); | |
7246d8ed | 926 | *copied -= (send + delta); |
d3b18ad3 JF |
927 | err = -EACCES; |
928 | } | |
a42055e8 | 929 | |
d3b18ad3 JF |
930 | if (likely(!err)) { |
931 | bool reset_eval = !ctx->open_rec; | |
a42055e8 | 932 | |
d3b18ad3 JF |
933 | rec = ctx->open_rec; |
934 | if (rec) { | |
935 | msg = &rec->msg_plaintext; | |
936 | if (!msg->apply_bytes) | |
937 | reset_eval = true; | |
938 | } | |
939 | if (reset_eval) { | |
940 | psock->eval = __SK_NONE; | |
941 | if (psock->sk_redir) { | |
942 | sock_put(psock->sk_redir); | |
943 | psock->sk_redir = NULL; | |
944 | } | |
945 | } | |
946 | if (rec) | |
947 | goto more_data; | |
948 | } | |
949 | out_err: | |
950 | sk_psock_put(sk, psock); | |
951 | return err; | |
952 | } | |
953 | ||
954 | static int tls_sw_push_pending_record(struct sock *sk, int flags) | |
955 | { | |
956 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
957 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); | |
958 | struct tls_rec *rec = ctx->open_rec; | |
959 | struct sk_msg *msg_pl; | |
960 | size_t copied; | |
a42055e8 | 961 | |
a42055e8 | 962 | if (!rec) |
d3b18ad3 | 963 | return 0; |
a42055e8 | 964 | |
d829e9c4 | 965 | msg_pl = &rec->msg_plaintext; |
d3b18ad3 JF |
966 | copied = msg_pl->sg.size; |
967 | if (!copied) | |
968 | return 0; | |
a42055e8 | 969 | |
d3b18ad3 JF |
970 | return bpf_exec_tx_verdict(msg_pl, sk, true, TLS_RECORD_TYPE_DATA, |
971 | &copied, flags); | |
a42055e8 VG |
972 | } |
973 | ||
fe1e81d4 DH |
974 | static int tls_sw_sendmsg_splice(struct sock *sk, struct msghdr *msg, |
975 | struct sk_msg *msg_pl, size_t try_to_copy, | |
976 | ssize_t *copied) | |
977 | { | |
978 | struct page *page = NULL, **pages = &page; | |
979 | ||
980 | do { | |
981 | ssize_t part; | |
982 | size_t off; | |
983 | ||
984 | part = iov_iter_extract_pages(&msg->msg_iter, &pages, | |
985 | try_to_copy, 1, 0, &off); | |
986 | if (part <= 0) | |
987 | return part ?: -EIO; | |
988 | ||
989 | if (WARN_ON_ONCE(!sendpage_ok(page))) { | |
990 | iov_iter_revert(&msg->msg_iter, part); | |
991 | return -EIO; | |
992 | } | |
993 | ||
994 | sk_msg_page_add(msg_pl, page, part, off); | |
c5a59500 JF |
995 | msg_pl->sg.copybreak = 0; |
996 | msg_pl->sg.curr = msg_pl->sg.end; | |
fe1e81d4 DH |
997 | sk_mem_charge(sk, part); |
998 | *copied += part; | |
999 | try_to_copy -= part; | |
1000 | } while (try_to_copy && !sk_msg_full(msg_pl)); | |
1001 | ||
1002 | return 0; | |
1003 | } | |
1004 | ||
45e5be84 DH |
1005 | static int tls_sw_sendmsg_locked(struct sock *sk, struct msghdr *msg, |
1006 | size_t size) | |
a42055e8 | 1007 | { |
3c4d7559 | 1008 | long timeo = sock_sndtimeo(sk, msg->msg_flags & MSG_DONTWAIT); |
a42055e8 | 1009 | struct tls_context *tls_ctx = tls_get_ctx(sk); |
4509de14 | 1010 | struct tls_prot_info *prot = &tls_ctx->prot_info; |
a42055e8 | 1011 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); |
5b053e12 | 1012 | bool async_capable = ctx->async_capable; |
a42055e8 | 1013 | unsigned char record_type = TLS_RECORD_TYPE_DATA; |
00e23707 | 1014 | bool is_kvec = iov_iter_is_kvec(&msg->msg_iter); |
3c4d7559 | 1015 | bool eor = !(msg->msg_flags & MSG_MORE); |
a7bff11f VF |
1016 | size_t try_to_copy; |
1017 | ssize_t copied = 0; | |
d829e9c4 | 1018 | struct sk_msg *msg_pl, *msg_en; |
a42055e8 VG |
1019 | struct tls_rec *rec; |
1020 | int required_size; | |
1021 | int num_async = 0; | |
3c4d7559 | 1022 | bool full_record; |
a42055e8 VG |
1023 | int record_room; |
1024 | int num_zc = 0; | |
3c4d7559 | 1025 | int orig_size; |
4128c0cf | 1026 | int ret = 0; |
3c4d7559 | 1027 | |
e22e358b HR |
1028 | if (!eor && (msg->msg_flags & MSG_EOR)) |
1029 | return -EINVAL; | |
1030 | ||
3c4d7559 | 1031 | if (unlikely(msg->msg_controllen)) { |
58790314 | 1032 | ret = tls_process_cmsg(sk, msg, &record_type); |
a42055e8 VG |
1033 | if (ret) { |
1034 | if (ret == -EINPROGRESS) | |
1035 | num_async++; | |
1036 | else if (ret != -EAGAIN) | |
1037 | goto send_end; | |
1038 | } | |
3c4d7559 DW |
1039 | } |
1040 | ||
1041 | while (msg_data_left(msg)) { | |
1042 | if (sk->sk_err) { | |
30be8f8d | 1043 | ret = -sk->sk_err; |
3c4d7559 DW |
1044 | goto send_end; |
1045 | } | |
1046 | ||
d3b18ad3 JF |
1047 | if (ctx->open_rec) |
1048 | rec = ctx->open_rec; | |
1049 | else | |
1050 | rec = ctx->open_rec = tls_get_rec(sk); | |
a42055e8 VG |
1051 | if (!rec) { |
1052 | ret = -ENOMEM; | |
1053 | goto send_end; | |
1054 | } | |
1055 | ||
d829e9c4 DB |
1056 | msg_pl = &rec->msg_plaintext; |
1057 | msg_en = &rec->msg_encrypted; | |
1058 | ||
1059 | orig_size = msg_pl->sg.size; | |
3c4d7559 DW |
1060 | full_record = false; |
1061 | try_to_copy = msg_data_left(msg); | |
d829e9c4 | 1062 | record_room = TLS_MAX_PAYLOAD_SIZE - msg_pl->sg.size; |
3c4d7559 DW |
1063 | if (try_to_copy >= record_room) { |
1064 | try_to_copy = record_room; | |
1065 | full_record = true; | |
1066 | } | |
1067 | ||
d829e9c4 | 1068 | required_size = msg_pl->sg.size + try_to_copy + |
4509de14 | 1069 | prot->overhead_size; |
3c4d7559 DW |
1070 | |
1071 | if (!sk_stream_memory_free(sk)) | |
1072 | goto wait_for_sndbuf; | |
a42055e8 | 1073 | |
3c4d7559 | 1074 | alloc_encrypted: |
d829e9c4 | 1075 | ret = tls_alloc_encrypted_msg(sk, required_size); |
3c4d7559 DW |
1076 | if (ret) { |
1077 | if (ret != -ENOSPC) | |
1078 | goto wait_for_memory; | |
1079 | ||
1080 | /* Adjust try_to_copy according to the amount that was | |
1081 | * actually allocated. The difference is due | |
1082 | * to max sg elements limit | |
1083 | */ | |
d829e9c4 | 1084 | try_to_copy -= required_size - msg_en->sg.size; |
3c4d7559 DW |
1085 | full_record = true; |
1086 | } | |
a42055e8 | 1087 | |
fe1e81d4 DH |
1088 | if (try_to_copy && (msg->msg_flags & MSG_SPLICE_PAGES)) { |
1089 | ret = tls_sw_sendmsg_splice(sk, msg, msg_pl, | |
1090 | try_to_copy, &copied); | |
1091 | if (ret < 0) | |
1092 | goto send_end; | |
1093 | tls_ctx->pending_open_record_frags = true; | |
dc9dfc8d JF |
1094 | |
1095 | if (sk_msg_full(msg_pl)) | |
1096 | full_record = true; | |
1097 | ||
1098 | if (full_record || eor) | |
fe1e81d4 DH |
1099 | goto copied; |
1100 | continue; | |
1101 | } | |
1102 | ||
a42055e8 | 1103 | if (!is_kvec && (full_record || eor) && !async_capable) { |
d3b18ad3 JF |
1104 | u32 first = msg_pl->sg.end; |
1105 | ||
d829e9c4 DB |
1106 | ret = sk_msg_zerocopy_from_iter(sk, &msg->msg_iter, |
1107 | msg_pl, try_to_copy); | |
3c4d7559 DW |
1108 | if (ret) |
1109 | goto fallback_to_reg_send; | |
1110 | ||
a42055e8 | 1111 | num_zc++; |
3c4d7559 | 1112 | copied += try_to_copy; |
d3b18ad3 JF |
1113 | |
1114 | sk_msg_sg_copy_set(msg_pl, first); | |
1115 | ret = bpf_exec_tx_verdict(msg_pl, sk, full_record, | |
1116 | record_type, &copied, | |
1117 | msg->msg_flags); | |
a42055e8 VG |
1118 | if (ret) { |
1119 | if (ret == -EINPROGRESS) | |
1120 | num_async++; | |
d3b18ad3 JF |
1121 | else if (ret == -ENOMEM) |
1122 | goto wait_for_memory; | |
c329ef96 | 1123 | else if (ctx->open_rec && ret == -ENOSPC) |
d3b18ad3 | 1124 | goto rollback_iter; |
a42055e8 VG |
1125 | else if (ret != -EAGAIN) |
1126 | goto send_end; | |
1127 | } | |
5a3611ef | 1128 | continue; |
d3b18ad3 JF |
1129 | rollback_iter: |
1130 | copied -= try_to_copy; | |
1131 | sk_msg_sg_copy_clear(msg_pl, first); | |
1132 | iov_iter_revert(&msg->msg_iter, | |
1133 | msg_pl->sg.size - orig_size); | |
3c4d7559 | 1134 | fallback_to_reg_send: |
d829e9c4 | 1135 | sk_msg_trim(sk, msg_pl, orig_size); |
3c4d7559 DW |
1136 | } |
1137 | ||
d829e9c4 | 1138 | required_size = msg_pl->sg.size + try_to_copy; |
4e6d4720 | 1139 | |
d829e9c4 | 1140 | ret = tls_clone_plaintext_msg(sk, required_size); |
3c4d7559 DW |
1141 | if (ret) { |
1142 | if (ret != -ENOSPC) | |
4e6d4720 | 1143 | goto send_end; |
3c4d7559 DW |
1144 | |
1145 | /* Adjust try_to_copy according to the amount that was | |
1146 | * actually allocated. The difference is due | |
1147 | * to max sg elements limit | |
1148 | */ | |
d829e9c4 | 1149 | try_to_copy -= required_size - msg_pl->sg.size; |
3c4d7559 | 1150 | full_record = true; |
4509de14 VG |
1151 | sk_msg_trim(sk, msg_en, |
1152 | msg_pl->sg.size + prot->overhead_size); | |
3c4d7559 DW |
1153 | } |
1154 | ||
65a10e28 VG |
1155 | if (try_to_copy) { |
1156 | ret = sk_msg_memcopy_from_iter(sk, &msg->msg_iter, | |
1157 | msg_pl, try_to_copy); | |
1158 | if (ret < 0) | |
1159 | goto trim_sgl; | |
1160 | } | |
3c4d7559 | 1161 | |
d829e9c4 DB |
1162 | /* Open records defined only if successfully copied, otherwise |
1163 | * we would trim the sg but not reset the open record frags. | |
1164 | */ | |
1165 | tls_ctx->pending_open_record_frags = true; | |
3c4d7559 | 1166 | copied += try_to_copy; |
fe1e81d4 | 1167 | copied: |
3c4d7559 | 1168 | if (full_record || eor) { |
d3b18ad3 JF |
1169 | ret = bpf_exec_tx_verdict(msg_pl, sk, full_record, |
1170 | record_type, &copied, | |
1171 | msg->msg_flags); | |
3c4d7559 | 1172 | if (ret) { |
a42055e8 VG |
1173 | if (ret == -EINPROGRESS) |
1174 | num_async++; | |
d3b18ad3 JF |
1175 | else if (ret == -ENOMEM) |
1176 | goto wait_for_memory; | |
1177 | else if (ret != -EAGAIN) { | |
1178 | if (ret == -ENOSPC) | |
1179 | ret = 0; | |
a42055e8 | 1180 | goto send_end; |
d3b18ad3 | 1181 | } |
3c4d7559 DW |
1182 | } |
1183 | } | |
1184 | ||
1185 | continue; | |
1186 | ||
1187 | wait_for_sndbuf: | |
1188 | set_bit(SOCK_NOSPACE, &sk->sk_socket->flags); | |
1189 | wait_for_memory: | |
1190 | ret = sk_stream_wait_memory(sk, &timeo); | |
1191 | if (ret) { | |
1192 | trim_sgl: | |
c329ef96 JK |
1193 | if (ctx->open_rec) |
1194 | tls_trim_both_msgs(sk, orig_size); | |
3c4d7559 DW |
1195 | goto send_end; |
1196 | } | |
1197 | ||
c329ef96 | 1198 | if (ctx->open_rec && msg_en->sg.size < required_size) |
3c4d7559 | 1199 | goto alloc_encrypted; |
3c4d7559 DW |
1200 | } |
1201 | ||
a42055e8 VG |
1202 | if (!num_async) { |
1203 | goto send_end; | |
1204 | } else if (num_zc) { | |
c57ca512 | 1205 | int err; |
a42055e8 | 1206 | |
c57ca512 JK |
1207 | /* Wait for pending encryptions to get completed */ |
1208 | err = tls_encrypt_async_wait(ctx); | |
1209 | if (err) { | |
1210 | ret = err; | |
a42055e8 VG |
1211 | copied = 0; |
1212 | } | |
1213 | } | |
1214 | ||
1215 | /* Transmit if any encryptions have completed */ | |
1216 | if (test_and_clear_bit(BIT_TX_SCHEDULED, &ctx->tx_bitmask)) { | |
1217 | cancel_delayed_work(&ctx->tx_work.work); | |
1218 | tls_tx_records(sk, msg->msg_flags); | |
1219 | } | |
1220 | ||
3c4d7559 DW |
1221 | send_end: |
1222 | ret = sk_stream_error(sk, msg->msg_flags, ret); | |
45e5be84 DH |
1223 | return copied > 0 ? copied : ret; |
1224 | } | |
3c4d7559 | 1225 | |
45e5be84 DH |
1226 | int tls_sw_sendmsg(struct sock *sk, struct msghdr *msg, size_t size) |
1227 | { | |
1228 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
1229 | int ret; | |
1230 | ||
1231 | if (msg->msg_flags & ~(MSG_MORE | MSG_DONTWAIT | MSG_NOSIGNAL | | |
e22e358b | 1232 | MSG_CMSG_COMPAT | MSG_SPLICE_PAGES | MSG_EOR | |
b848b26c | 1233 | MSG_SENDPAGE_NOPOLICY)) |
45e5be84 DH |
1234 | return -EOPNOTSUPP; |
1235 | ||
1236 | ret = mutex_lock_interruptible(&tls_ctx->tx_lock); | |
1237 | if (ret) | |
1238 | return ret; | |
1239 | lock_sock(sk); | |
1240 | ret = tls_sw_sendmsg_locked(sk, msg, size); | |
3c4d7559 | 1241 | release_sock(sk); |
79ffe608 | 1242 | mutex_unlock(&tls_ctx->tx_lock); |
45e5be84 | 1243 | return ret; |
3c4d7559 DW |
1244 | } |
1245 | ||
df720d28 DH |
1246 | /* |
1247 | * Handle unexpected EOF during splice without SPLICE_F_MORE set. | |
1248 | */ | |
1249 | void tls_sw_splice_eof(struct socket *sock) | |
1250 | { | |
1251 | struct sock *sk = sock->sk; | |
1252 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
1253 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); | |
1254 | struct tls_rec *rec; | |
1255 | struct sk_msg *msg_pl; | |
1256 | ssize_t copied = 0; | |
1257 | bool retrying = false; | |
1258 | int ret = 0; | |
df720d28 DH |
1259 | |
1260 | if (!ctx->open_rec) | |
1261 | return; | |
1262 | ||
1263 | mutex_lock(&tls_ctx->tx_lock); | |
1264 | lock_sock(sk); | |
1265 | ||
1266 | retry: | |
53f2cb49 | 1267 | /* same checks as in tls_sw_push_pending_record() */ |
df720d28 DH |
1268 | rec = ctx->open_rec; |
1269 | if (!rec) | |
1270 | goto unlock; | |
1271 | ||
1272 | msg_pl = &rec->msg_plaintext; | |
53f2cb49 JH |
1273 | if (msg_pl->sg.size == 0) |
1274 | goto unlock; | |
df720d28 DH |
1275 | |
1276 | /* Check the BPF advisor and perform transmission. */ | |
1277 | ret = bpf_exec_tx_verdict(msg_pl, sk, false, TLS_RECORD_TYPE_DATA, | |
1278 | &copied, 0); | |
1279 | switch (ret) { | |
1280 | case 0: | |
1281 | case -EAGAIN: | |
1282 | if (retrying) | |
1283 | goto unlock; | |
1284 | retrying = true; | |
1285 | goto retry; | |
1286 | case -EINPROGRESS: | |
1287 | break; | |
1288 | default: | |
1289 | goto unlock; | |
1290 | } | |
1291 | ||
1292 | /* Wait for pending encryptions to get completed */ | |
c57ca512 | 1293 | if (tls_encrypt_async_wait(ctx)) |
df720d28 DH |
1294 | goto unlock; |
1295 | ||
1296 | /* Transmit if any encryptions have completed */ | |
1297 | if (test_and_clear_bit(BIT_TX_SCHEDULED, &ctx->tx_bitmask)) { | |
1298 | cancel_delayed_work(&ctx->tx_work.work); | |
1299 | tls_tx_records(sk, 0); | |
1300 | } | |
1301 | ||
1302 | unlock: | |
1303 | release_sock(sk); | |
1304 | mutex_unlock(&tls_ctx->tx_lock); | |
1305 | } | |
1306 | ||
35560b7f JK |
1307 | static int |
1308 | tls_rx_rec_wait(struct sock *sk, struct sk_psock *psock, bool nonblock, | |
70f03fc2 | 1309 | bool released) |
c46234eb DW |
1310 | { |
1311 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
f66de3ee | 1312 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); |
c46234eb | 1313 | DEFINE_WAIT_FUNC(wait, woken_wake_function); |
419ce133 | 1314 | int ret = 0; |
70f03fc2 JK |
1315 | long timeo; |
1316 | ||
1317 | timeo = sock_rcvtimeo(sk, nonblock); | |
c46234eb | 1318 | |
b92a13d4 | 1319 | while (!tls_strp_msg_ready(ctx)) { |
35560b7f JK |
1320 | if (!sk_psock_queue_empty(psock)) |
1321 | return 0; | |
1322 | ||
1323 | if (sk->sk_err) | |
1324 | return sock_error(sk); | |
c46234eb | 1325 | |
419ce133 PA |
1326 | if (ret < 0) |
1327 | return ret; | |
1328 | ||
20ffc7ad | 1329 | if (!skb_queue_empty(&sk->sk_receive_queue)) { |
84c61fe1 | 1330 | tls_strp_check_rcv(&ctx->strp); |
b92a13d4 | 1331 | if (tls_strp_msg_ready(ctx)) |
35560b7f | 1332 | break; |
20ffc7ad VF |
1333 | } |
1334 | ||
fcf4793e | 1335 | if (sk->sk_shutdown & RCV_SHUTDOWN) |
35560b7f | 1336 | return 0; |
fcf4793e | 1337 | |
c46234eb | 1338 | if (sock_flag(sk, SOCK_DONE)) |
35560b7f | 1339 | return 0; |
c46234eb | 1340 | |
70f03fc2 | 1341 | if (!timeo) |
35560b7f | 1342 | return -EAGAIN; |
c46234eb | 1343 | |
84c61fe1 | 1344 | released = true; |
c46234eb DW |
1345 | add_wait_queue(sk_sleep(sk), &wait); |
1346 | sk_set_bit(SOCKWQ_ASYNC_WAITDATA, sk); | |
419ce133 PA |
1347 | ret = sk_wait_event(sk, &timeo, |
1348 | tls_strp_msg_ready(ctx) || | |
1349 | !sk_psock_queue_empty(psock), | |
1350 | &wait); | |
c46234eb DW |
1351 | sk_clear_bit(SOCKWQ_ASYNC_WAITDATA, sk); |
1352 | remove_wait_queue(sk_sleep(sk), &wait); | |
1353 | ||
1354 | /* Handle signals */ | |
35560b7f JK |
1355 | if (signal_pending(current)) |
1356 | return sock_intr_errno(timeo); | |
c46234eb DW |
1357 | } |
1358 | ||
84c61fe1 JK |
1359 | tls_strp_msg_load(&ctx->strp, released); |
1360 | ||
35560b7f | 1361 | return 1; |
c46234eb DW |
1362 | } |
1363 | ||
d4bd88e6 | 1364 | static int tls_setup_from_iter(struct iov_iter *from, |
d829e9c4 | 1365 | int length, int *pages_used, |
d829e9c4 DB |
1366 | struct scatterlist *to, |
1367 | int to_max_pages) | |
1368 | { | |
1369 | int rc = 0, i = 0, num_elem = *pages_used, maxpages; | |
1370 | struct page *pages[MAX_SKB_FRAGS]; | |
d4bd88e6 | 1371 | unsigned int size = 0; |
d829e9c4 DB |
1372 | ssize_t copied, use; |
1373 | size_t offset; | |
1374 | ||
1375 | while (length > 0) { | |
1376 | i = 0; | |
1377 | maxpages = to_max_pages - num_elem; | |
1378 | if (maxpages == 0) { | |
1379 | rc = -EFAULT; | |
1380 | goto out; | |
1381 | } | |
1ef255e2 | 1382 | copied = iov_iter_get_pages2(from, pages, |
d829e9c4 DB |
1383 | length, |
1384 | maxpages, &offset); | |
1385 | if (copied <= 0) { | |
1386 | rc = -EFAULT; | |
1387 | goto out; | |
1388 | } | |
1389 | ||
d829e9c4 DB |
1390 | length -= copied; |
1391 | size += copied; | |
1392 | while (copied) { | |
1393 | use = min_t(int, copied, PAGE_SIZE - offset); | |
1394 | ||
1395 | sg_set_page(&to[num_elem], | |
1396 | pages[i], use, offset); | |
1397 | sg_unmark_end(&to[num_elem]); | |
1398 | /* We do not uncharge memory from this API */ | |
1399 | ||
1400 | offset = 0; | |
1401 | copied -= use; | |
1402 | ||
1403 | i++; | |
1404 | num_elem++; | |
1405 | } | |
1406 | } | |
1407 | /* Mark the end in the last sg entry if newly added */ | |
1408 | if (num_elem > *pages_used) | |
1409 | sg_mark_end(&to[num_elem - 1]); | |
1410 | out: | |
1411 | if (rc) | |
d4bd88e6 | 1412 | iov_iter_revert(from, size); |
d829e9c4 DB |
1413 | *pages_used = num_elem; |
1414 | ||
1415 | return rc; | |
1416 | } | |
1417 | ||
fd31f399 JK |
1418 | static struct sk_buff * |
1419 | tls_alloc_clrtxt_skb(struct sock *sk, struct sk_buff *skb, | |
1420 | unsigned int full_len) | |
1421 | { | |
1422 | struct strp_msg *clr_rxm; | |
1423 | struct sk_buff *clr_skb; | |
1424 | int err; | |
1425 | ||
1426 | clr_skb = alloc_skb_with_frags(0, full_len, TLS_PAGE_ORDER, | |
1427 | &err, sk->sk_allocation); | |
1428 | if (!clr_skb) | |
1429 | return NULL; | |
1430 | ||
1431 | skb_copy_header(clr_skb, skb); | |
1432 | clr_skb->len = full_len; | |
1433 | clr_skb->data_len = full_len; | |
1434 | ||
1435 | clr_rxm = strp_msg(clr_skb); | |
1436 | clr_rxm->offset = 0; | |
1437 | ||
1438 | return clr_skb; | |
1439 | } | |
1440 | ||
8a958732 JK |
1441 | /* Decrypt handlers |
1442 | * | |
dd47ed36 | 1443 | * tls_decrypt_sw() and tls_decrypt_device() are decrypt handlers. |
8a958732 JK |
1444 | * They must transform the darg in/out argument are as follows: |
1445 | * | Input | Output | |
1446 | * ------------------------------------------------------------------- | |
1447 | * zc | Zero-copy decrypt allowed | Zero-copy performed | |
1448 | * async | Async decrypt allowed | Async crypto used / in progress | |
6bd116c8 | 1449 | * skb | * | Output skb |
b93f5700 JK |
1450 | * |
1451 | * If ZC decryption was performed darg.skb will point to the input skb. | |
8a958732 JK |
1452 | */ |
1453 | ||
0b243d00 | 1454 | /* This function decrypts the input skb into either out_iov or in out_sg |
8a958732 | 1455 | * or in skb buffers itself. The input parameter 'darg->zc' indicates if |
0b243d00 VG |
1456 | * zero-copy mode needs to be tried or not. With zero-copy mode, either |
1457 | * out_iov or out_sg must be non-NULL. In case both out_iov and out_sg are | |
1458 | * NULL, then the decryption happens inside skb buffers itself, i.e. | |
8a958732 | 1459 | * zero-copy gets disabled and 'darg->zc' is updated. |
0b243d00 | 1460 | */ |
541cc48b | 1461 | static int tls_decrypt_sg(struct sock *sk, struct iov_iter *out_iov, |
8a958732 JK |
1462 | struct scatterlist *out_sg, |
1463 | struct tls_decrypt_arg *darg) | |
0b243d00 VG |
1464 | { |
1465 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
1466 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); | |
4509de14 | 1467 | struct tls_prot_info *prot = &tls_ctx->prot_info; |
b89fec54 | 1468 | int n_sgin, n_sgout, aead_size, err, pages = 0; |
541cc48b | 1469 | struct sk_buff *skb = tls_strp_msg(ctx); |
fd31f399 JK |
1470 | const struct strp_msg *rxm = strp_msg(skb); |
1471 | const struct tls_msg *tlm = tls_msg(skb); | |
0b243d00 | 1472 | struct aead_request *aead_req; |
0b243d00 VG |
1473 | struct scatterlist *sgin = NULL; |
1474 | struct scatterlist *sgout = NULL; | |
603380f5 | 1475 | const int data_len = rxm->full_len - prot->overhead_size; |
ce61327c | 1476 | int tail_pages = !!prot->tail_size; |
b89fec54 | 1477 | struct tls_decrypt_ctx *dctx; |
fd31f399 | 1478 | struct sk_buff *clear_skb; |
f295b3ae | 1479 | int iv_offset = 0; |
b89fec54 | 1480 | u8 *mem; |
0b243d00 | 1481 | |
fd31f399 JK |
1482 | n_sgin = skb_nsg(skb, rxm->offset + prot->prepend_size, |
1483 | rxm->full_len - prot->prepend_size); | |
1484 | if (n_sgin < 1) | |
1485 | return n_sgin ?: -EBADMSG; | |
1486 | ||
4175eac3 | 1487 | if (darg->zc && (out_iov || out_sg)) { |
fd31f399 JK |
1488 | clear_skb = NULL; |
1489 | ||
0b243d00 | 1490 | if (out_iov) |
ce61327c | 1491 | n_sgout = 1 + tail_pages + |
b93235e6 | 1492 | iov_iter_npages_cap(out_iov, INT_MAX, data_len); |
0b243d00 VG |
1493 | else |
1494 | n_sgout = sg_nents(out_sg); | |
1495 | } else { | |
4175eac3 | 1496 | darg->zc = false; |
0b243d00 | 1497 | |
fd31f399 JK |
1498 | clear_skb = tls_alloc_clrtxt_skb(sk, skb, rxm->full_len); |
1499 | if (!clear_skb) | |
1500 | return -ENOMEM; | |
1501 | ||
1502 | n_sgout = 1 + skb_shinfo(clear_skb)->nr_frags; | |
1503 | } | |
0b243d00 VG |
1504 | |
1505 | /* Increment to accommodate AAD */ | |
1506 | n_sgin = n_sgin + 1; | |
1507 | ||
0b243d00 | 1508 | /* Allocate a single block of memory which contains |
b89fec54 JK |
1509 | * aead_req || tls_decrypt_ctx. |
1510 | * Both structs are variable length. | |
0b243d00 | 1511 | */ |
b89fec54 | 1512 | aead_size = sizeof(*aead_req) + crypto_aead_reqsize(ctx->aead_recv); |
8d338c76 | 1513 | aead_size = ALIGN(aead_size, __alignof__(*dctx)); |
a2713257 | 1514 | mem = kmalloc(aead_size + struct_size(dctx, sg, size_add(n_sgin, n_sgout)), |
b89fec54 | 1515 | sk->sk_allocation); |
fd31f399 JK |
1516 | if (!mem) { |
1517 | err = -ENOMEM; | |
1518 | goto exit_free_skb; | |
1519 | } | |
0b243d00 VG |
1520 | |
1521 | /* Segment the allocated memory */ | |
1522 | aead_req = (struct aead_request *)mem; | |
b89fec54 | 1523 | dctx = (struct tls_decrypt_ctx *)(mem + aead_size); |
8d338c76 | 1524 | dctx->sk = sk; |
b89fec54 JK |
1525 | sgin = &dctx->sg[0]; |
1526 | sgout = &dctx->sg[n_sgin]; | |
0b243d00 | 1527 | |
128cfb88 TZ |
1528 | /* For CCM based ciphers, first byte of nonce+iv is a constant */ |
1529 | switch (prot->cipher_type) { | |
1530 | case TLS_CIPHER_AES_CCM_128: | |
b89fec54 | 1531 | dctx->iv[0] = TLS_AES_CCM_IV_B0_BYTE; |
f295b3ae | 1532 | iv_offset = 1; |
128cfb88 TZ |
1533 | break; |
1534 | case TLS_CIPHER_SM4_CCM: | |
b89fec54 | 1535 | dctx->iv[0] = TLS_SM4_CCM_IV_B0_BYTE; |
128cfb88 TZ |
1536 | iv_offset = 1; |
1537 | break; | |
f295b3ae VG |
1538 | } |
1539 | ||
0b243d00 | 1540 | /* Prepare IV */ |
a6acbe62 | 1541 | if (prot->version == TLS_1_3_VERSION || |
a4ae58cd | 1542 | prot->cipher_type == TLS_CIPHER_CHACHA20_POLY1305) { |
b89fec54 | 1543 | memcpy(&dctx->iv[iv_offset], tls_ctx->rx.iv, |
9381fe8c | 1544 | prot->iv_size + prot->salt_size); |
a4ae58cd JK |
1545 | } else { |
1546 | err = skb_copy_bits(skb, rxm->offset + TLS_HEADER_SIZE, | |
b89fec54 | 1547 | &dctx->iv[iv_offset] + prot->salt_size, |
a4ae58cd | 1548 | prot->iv_size); |
03957d84 JK |
1549 | if (err < 0) |
1550 | goto exit_free; | |
b89fec54 | 1551 | memcpy(&dctx->iv[iv_offset], tls_ctx->rx.iv, prot->salt_size); |
a4ae58cd | 1552 | } |
58790314 | 1553 | tls_xor_iv_with_seq(prot, &dctx->iv[iv_offset], tls_ctx->rx.rec_seq); |
0b243d00 VG |
1554 | |
1555 | /* Prepare AAD */ | |
b89fec54 | 1556 | tls_make_aad(dctx->aad, rxm->full_len - prot->overhead_size + |
4509de14 | 1557 | prot->tail_size, |
c3f6bb74 | 1558 | tls_ctx->rx.rec_seq, tlm->control, prot); |
0b243d00 VG |
1559 | |
1560 | /* Prepare sgin */ | |
1561 | sg_init_table(sgin, n_sgin); | |
b89fec54 | 1562 | sg_set_buf(&sgin[0], dctx->aad, prot->aad_size); |
0b243d00 | 1563 | err = skb_to_sgvec(skb, &sgin[1], |
4509de14 VG |
1564 | rxm->offset + prot->prepend_size, |
1565 | rxm->full_len - prot->prepend_size); | |
03957d84 JK |
1566 | if (err < 0) |
1567 | goto exit_free; | |
0b243d00 | 1568 | |
fd31f399 JK |
1569 | if (clear_skb) { |
1570 | sg_init_table(sgout, n_sgout); | |
1571 | sg_set_buf(&sgout[0], dctx->aad, prot->aad_size); | |
1572 | ||
1573 | err = skb_to_sgvec(clear_skb, &sgout[1], prot->prepend_size, | |
1574 | data_len + prot->tail_size); | |
1575 | if (err < 0) | |
1576 | goto exit_free; | |
1577 | } else if (out_iov) { | |
1578 | sg_init_table(sgout, n_sgout); | |
1579 | sg_set_buf(&sgout[0], dctx->aad, prot->aad_size); | |
1580 | ||
1581 | err = tls_setup_from_iter(out_iov, data_len, &pages, &sgout[1], | |
1582 | (n_sgout - 1 - tail_pages)); | |
1583 | if (err < 0) | |
1584 | goto exit_free_pages; | |
1585 | ||
1586 | if (prot->tail_size) { | |
1587 | sg_unmark_end(&sgout[pages]); | |
1588 | sg_set_buf(&sgout[pages + 1], &dctx->tail, | |
1589 | prot->tail_size); | |
1590 | sg_mark_end(&sgout[pages + 1]); | |
0b243d00 | 1591 | } |
fd31f399 JK |
1592 | } else if (out_sg) { |
1593 | memcpy(sgout, out_sg, n_sgout * sizeof(*sgout)); | |
0b243d00 | 1594 | } |
32b55c5f | 1595 | dctx->free_sgout = !!pages; |
0b243d00 VG |
1596 | |
1597 | /* Prepare and submit AEAD request */ | |
6ececdc5 | 1598 | err = tls_do_decryption(sk, sgin, sgout, dctx->iv, |
603380f5 | 1599 | data_len + prot->tail_size, aead_req, darg); |
13114dc5 SD |
1600 | if (err) { |
1601 | if (darg->async_done) | |
1602 | goto exit_free_skb; | |
6bd116c8 | 1603 | goto exit_free_pages; |
13114dc5 | 1604 | } |
6bd116c8 | 1605 | |
fd31f399 JK |
1606 | darg->skb = clear_skb ?: tls_strp_msg(ctx); |
1607 | clear_skb = NULL; | |
c618db2a JK |
1608 | |
1609 | if (unlikely(darg->async)) { | |
84c61fe1 | 1610 | err = tls_strp_msg_hold(&ctx->strp, &ctx->async_hold); |
c618db2a JK |
1611 | if (err) |
1612 | __skb_queue_tail(&ctx->async_hold, darg->skb); | |
1613 | return err; | |
1614 | } | |
0b243d00 | 1615 | |
13114dc5 SD |
1616 | if (unlikely(darg->async_done)) |
1617 | return 0; | |
1618 | ||
ce61327c | 1619 | if (prot->tail_size) |
b89fec54 | 1620 | darg->tail = dctx->tail; |
ce61327c | 1621 | |
6bd116c8 | 1622 | exit_free_pages: |
0b243d00 VG |
1623 | /* Release the pages in case iov was mapped to pages */ |
1624 | for (; pages > 0; pages--) | |
1625 | put_page(sg_page(&sgout[pages])); | |
03957d84 | 1626 | exit_free: |
0b243d00 | 1627 | kfree(mem); |
fd31f399 JK |
1628 | exit_free_skb: |
1629 | consume_skb(clear_skb); | |
0b243d00 VG |
1630 | return err; |
1631 | } | |
1632 | ||
8a958732 | 1633 | static int |
dd47ed36 JK |
1634 | tls_decrypt_sw(struct sock *sk, struct tls_context *tls_ctx, |
1635 | struct msghdr *msg, struct tls_decrypt_arg *darg) | |
dafb67f3 | 1636 | { |
541cc48b | 1637 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); |
4509de14 | 1638 | struct tls_prot_info *prot = &tls_ctx->prot_info; |
541cc48b | 1639 | struct strp_msg *rxm; |
3764ae5b | 1640 | int pad, err; |
dafb67f3 | 1641 | |
dd47ed36 | 1642 | err = tls_decrypt_sg(sk, &msg->msg_iter, NULL, darg); |
a069a905 GP |
1643 | if (err < 0) { |
1644 | if (err == -EBADMSG) | |
1645 | TLS_INC_STATS(sock_net(sk), LINUX_MIB_TLSDECRYPTERROR); | |
3764ae5b | 1646 | return err; |
a069a905 | 1647 | } |
dd47ed36 JK |
1648 | /* keep going even for ->async, the code below is TLS 1.3 */ |
1649 | ||
ce61327c JK |
1650 | /* If opportunistic TLS 1.3 ZC failed retry without ZC */ |
1651 | if (unlikely(darg->zc && prot->version == TLS_1_3_VERSION && | |
1652 | darg->tail != TLS_RECORD_TYPE_DATA)) { | |
1653 | darg->zc = false; | |
bb56cea9 JK |
1654 | if (!darg->tail) |
1655 | TLS_INC_STATS(sock_net(sk), LINUX_MIB_TLSRXNOPADVIOL); | |
1090c1ea | 1656 | TLS_INC_STATS(sock_net(sk), LINUX_MIB_TLSDECRYPTRETRY); |
dd47ed36 | 1657 | return tls_decrypt_sw(sk, tls_ctx, msg, darg); |
ce61327c | 1658 | } |
dafb67f3 | 1659 | |
6bd116c8 JK |
1660 | pad = tls_padding_length(prot, darg->skb, darg); |
1661 | if (pad < 0) { | |
b93f5700 JK |
1662 | if (darg->skb != tls_strp_msg(ctx)) |
1663 | consume_skb(darg->skb); | |
3764ae5b | 1664 | return pad; |
6bd116c8 | 1665 | } |
3764ae5b | 1666 | |
6bd116c8 | 1667 | rxm = strp_msg(darg->skb); |
3764ae5b | 1668 | rxm->full_len -= pad; |
dd47ed36 JK |
1669 | |
1670 | return 0; | |
1671 | } | |
1672 | ||
1673 | static int | |
d4e5db64 JK |
1674 | tls_decrypt_device(struct sock *sk, struct msghdr *msg, |
1675 | struct tls_context *tls_ctx, struct tls_decrypt_arg *darg) | |
dd47ed36 JK |
1676 | { |
1677 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); | |
1678 | struct tls_prot_info *prot = &tls_ctx->prot_info; | |
1679 | struct strp_msg *rxm; | |
1680 | int pad, err; | |
1681 | ||
1682 | if (tls_ctx->rx_conf != TLS_HW) | |
1683 | return 0; | |
1684 | ||
1685 | err = tls_device_decrypted(sk, tls_ctx); | |
1686 | if (err <= 0) | |
1687 | return err; | |
1688 | ||
1689 | pad = tls_padding_length(prot, tls_strp_msg(ctx), darg); | |
1690 | if (pad < 0) | |
1691 | return pad; | |
1692 | ||
dd47ed36 JK |
1693 | darg->async = false; |
1694 | darg->skb = tls_strp_msg(ctx); | |
d4e5db64 JK |
1695 | /* ->zc downgrade check, in case TLS 1.3 gets here */ |
1696 | darg->zc &= !(prot->version == TLS_1_3_VERSION && | |
1697 | tls_msg(darg->skb)->control != TLS_RECORD_TYPE_DATA); | |
dd47ed36 JK |
1698 | |
1699 | rxm = strp_msg(darg->skb); | |
1700 | rxm->full_len -= pad; | |
d4e5db64 JK |
1701 | |
1702 | if (!darg->zc) { | |
1703 | /* Non-ZC case needs a real skb */ | |
1704 | darg->skb = tls_strp_msg_detach(ctx); | |
1705 | if (!darg->skb) | |
1706 | return -ENOMEM; | |
1707 | } else { | |
1708 | unsigned int off, len; | |
1709 | ||
1710 | /* In ZC case nobody cares about the output skb. | |
1711 | * Just copy the data here. Note the skb is not fully trimmed. | |
1712 | */ | |
1713 | off = rxm->offset + prot->prepend_size; | |
1714 | len = rxm->full_len - prot->overhead_size; | |
1715 | ||
1716 | err = skb_copy_datagram_msg(darg->skb, off, msg, len); | |
1717 | if (err) | |
1718 | return err; | |
1719 | } | |
dd47ed36 JK |
1720 | return 1; |
1721 | } | |
1722 | ||
1723 | static int tls_rx_one_record(struct sock *sk, struct msghdr *msg, | |
1724 | struct tls_decrypt_arg *darg) | |
1725 | { | |
1726 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
1727 | struct tls_prot_info *prot = &tls_ctx->prot_info; | |
1728 | struct strp_msg *rxm; | |
1729 | int err; | |
1730 | ||
d4e5db64 | 1731 | err = tls_decrypt_device(sk, msg, tls_ctx, darg); |
dd47ed36 JK |
1732 | if (!err) |
1733 | err = tls_decrypt_sw(sk, tls_ctx, msg, darg); | |
1734 | if (err < 0) | |
1735 | return err; | |
1736 | ||
1737 | rxm = strp_msg(darg->skb); | |
3764ae5b JK |
1738 | rxm->offset += prot->prepend_size; |
1739 | rxm->full_len -= prot->overhead_size; | |
3547a1f9 | 1740 | tls_advance_record_sn(sk, prot, &tls_ctx->rx); |
3764ae5b JK |
1741 | |
1742 | return 0; | |
dafb67f3 BP |
1743 | } |
1744 | ||
541cc48b | 1745 | int decrypt_skb(struct sock *sk, struct scatterlist *sgout) |
c46234eb | 1746 | { |
4175eac3 | 1747 | struct tls_decrypt_arg darg = { .zc = true, }; |
c46234eb | 1748 | |
541cc48b | 1749 | return tls_decrypt_sg(sk, NULL, sgout, &darg); |
c46234eb DW |
1750 | } |
1751 | ||
06554f4f JK |
1752 | static int tls_record_content_type(struct msghdr *msg, struct tls_msg *tlm, |
1753 | u8 *control) | |
1754 | { | |
1755 | int err; | |
1756 | ||
1757 | if (!*control) { | |
1758 | *control = tlm->control; | |
1759 | if (!*control) | |
1760 | return -EBADMSG; | |
1761 | ||
1762 | err = put_cmsg(msg, SOL_TLS, TLS_GET_RECORD_TYPE, | |
1763 | sizeof(*control), control); | |
1764 | if (*control != TLS_RECORD_TYPE_DATA) { | |
1765 | if (err || msg->msg_flags & MSG_CTRUNC) | |
1766 | return -EIO; | |
1767 | } | |
1768 | } else if (*control != tlm->control) { | |
1769 | return 0; | |
1770 | } | |
1771 | ||
1772 | return 1; | |
1773 | } | |
1774 | ||
abb47dc9 JK |
1775 | static void tls_rx_rec_done(struct tls_sw_context_rx *ctx) |
1776 | { | |
84c61fe1 | 1777 | tls_strp_msg_done(&ctx->strp); |
abb47dc9 JK |
1778 | } |
1779 | ||
692d7b5d | 1780 | /* This function traverses the rx_list in tls receive context to copies the |
2b794c40 | 1781 | * decrypted records into the buffer provided by caller zero copy is not |
692d7b5d VG |
1782 | * true. Further, the records are removed from the rx_list if it is not a peek |
1783 | * case and the record has been consumed completely. | |
1784 | */ | |
1785 | static int process_rx_list(struct tls_sw_context_rx *ctx, | |
1786 | struct msghdr *msg, | |
2b794c40 | 1787 | u8 *control, |
692d7b5d VG |
1788 | size_t skip, |
1789 | size_t len, | |
ec823bf3 SD |
1790 | bool is_peek, |
1791 | bool *more) | |
692d7b5d VG |
1792 | { |
1793 | struct sk_buff *skb = skb_peek(&ctx->rx_list); | |
2b794c40 | 1794 | struct tls_msg *tlm; |
692d7b5d | 1795 | ssize_t copied = 0; |
06554f4f | 1796 | int err; |
2b794c40 | 1797 | |
692d7b5d VG |
1798 | while (skip && skb) { |
1799 | struct strp_msg *rxm = strp_msg(skb); | |
2b794c40 VG |
1800 | tlm = tls_msg(skb); |
1801 | ||
06554f4f JK |
1802 | err = tls_record_content_type(msg, tlm, control); |
1803 | if (err <= 0) | |
ec823bf3 | 1804 | goto more; |
692d7b5d VG |
1805 | |
1806 | if (skip < rxm->full_len) | |
1807 | break; | |
1808 | ||
1809 | skip = skip - rxm->full_len; | |
1810 | skb = skb_peek_next(skb, &ctx->rx_list); | |
1811 | } | |
1812 | ||
1813 | while (len && skb) { | |
1814 | struct sk_buff *next_skb; | |
1815 | struct strp_msg *rxm = strp_msg(skb); | |
1816 | int chunk = min_t(unsigned int, rxm->full_len - skip, len); | |
1817 | ||
2b794c40 VG |
1818 | tlm = tls_msg(skb); |
1819 | ||
06554f4f JK |
1820 | err = tls_record_content_type(msg, tlm, control); |
1821 | if (err <= 0) | |
ec823bf3 | 1822 | goto more; |
2b794c40 | 1823 | |
cbbdee99 JK |
1824 | err = skb_copy_datagram_msg(skb, rxm->offset + skip, |
1825 | msg, chunk); | |
1826 | if (err < 0) | |
ec823bf3 | 1827 | goto more; |
692d7b5d VG |
1828 | |
1829 | len = len - chunk; | |
1830 | copied = copied + chunk; | |
1831 | ||
1832 | /* Consume the data from record if it is non-peek case*/ | |
1833 | if (!is_peek) { | |
1834 | rxm->offset = rxm->offset + chunk; | |
1835 | rxm->full_len = rxm->full_len - chunk; | |
1836 | ||
1837 | /* Return if there is unconsumed data in the record */ | |
1838 | if (rxm->full_len - skip) | |
1839 | break; | |
1840 | } | |
1841 | ||
1842 | /* The remaining skip-bytes must lie in 1st record in rx_list. | |
1843 | * So from the 2nd record, 'skip' should be 0. | |
1844 | */ | |
1845 | skip = 0; | |
1846 | ||
1847 | if (msg) | |
1848 | msg->msg_flags |= MSG_EOR; | |
1849 | ||
1850 | next_skb = skb_peek_next(skb, &ctx->rx_list); | |
1851 | ||
1852 | if (!is_peek) { | |
a30295c4 | 1853 | __skb_unlink(skb, &ctx->rx_list); |
a88c26f6 | 1854 | consume_skb(skb); |
692d7b5d VG |
1855 | } |
1856 | ||
1857 | skb = next_skb; | |
1858 | } | |
4dcdd971 | 1859 | err = 0; |
692d7b5d | 1860 | |
4dcdd971 JK |
1861 | out: |
1862 | return copied ? : err; | |
ec823bf3 SD |
1863 | more: |
1864 | if (more) | |
1865 | *more = true; | |
1866 | goto out; | |
692d7b5d VG |
1867 | } |
1868 | ||
84c61fe1 | 1869 | static bool |
c46b0183 JK |
1870 | tls_read_flush_backlog(struct sock *sk, struct tls_prot_info *prot, |
1871 | size_t len_left, size_t decrypted, ssize_t done, | |
1872 | size_t *flushed_at) | |
1873 | { | |
1874 | size_t max_rec; | |
1875 | ||
1876 | if (len_left <= decrypted) | |
84c61fe1 | 1877 | return false; |
c46b0183 JK |
1878 | |
1879 | max_rec = prot->overhead_size - prot->tail_size + TLS_MAX_PAYLOAD_SIZE; | |
1880 | if (done - *flushed_at < SZ_128K && tcp_inq(sk) > max_rec) | |
84c61fe1 | 1881 | return false; |
c46b0183 JK |
1882 | |
1883 | *flushed_at = done; | |
84c61fe1 | 1884 | return sk_flush_backlog(sk); |
c46b0183 JK |
1885 | } |
1886 | ||
f9ae3204 HR |
1887 | static int tls_rx_reader_acquire(struct sock *sk, struct tls_sw_context_rx *ctx, |
1888 | bool nonblock) | |
4cbc325e JK |
1889 | { |
1890 | long timeo; | |
419ce133 | 1891 | int ret; |
4cbc325e JK |
1892 | |
1893 | timeo = sock_rcvtimeo(sk, nonblock); | |
1894 | ||
1895 | while (unlikely(ctx->reader_present)) { | |
1896 | DEFINE_WAIT_FUNC(wait, woken_wake_function); | |
1897 | ||
1898 | ctx->reader_contended = 1; | |
1899 | ||
1900 | add_wait_queue(&ctx->wq, &wait); | |
419ce133 PA |
1901 | ret = sk_wait_event(sk, &timeo, |
1902 | !READ_ONCE(ctx->reader_present), &wait); | |
4cbc325e JK |
1903 | remove_wait_queue(&ctx->wq, &wait); |
1904 | ||
f9ae3204 HR |
1905 | if (timeo <= 0) |
1906 | return -EAGAIN; | |
1907 | if (signal_pending(current)) | |
1908 | return sock_intr_errno(timeo); | |
419ce133 PA |
1909 | if (ret < 0) |
1910 | return ret; | |
4cbc325e JK |
1911 | } |
1912 | ||
1913 | WRITE_ONCE(ctx->reader_present, 1); | |
1914 | ||
70f03fc2 | 1915 | return 0; |
f9ae3204 | 1916 | } |
dde06aaa | 1917 | |
f9ae3204 HR |
1918 | static int tls_rx_reader_lock(struct sock *sk, struct tls_sw_context_rx *ctx, |
1919 | bool nonblock) | |
1920 | { | |
1921 | int err; | |
1922 | ||
1923 | lock_sock(sk); | |
1924 | err = tls_rx_reader_acquire(sk, ctx, nonblock); | |
1925 | if (err) | |
1926 | release_sock(sk); | |
dde06aaa | 1927 | return err; |
4cbc325e JK |
1928 | } |
1929 | ||
f9ae3204 | 1930 | static void tls_rx_reader_release(struct sock *sk, struct tls_sw_context_rx *ctx) |
4cbc325e JK |
1931 | { |
1932 | if (unlikely(ctx->reader_contended)) { | |
1933 | if (wq_has_sleeper(&ctx->wq)) | |
1934 | wake_up(&ctx->wq); | |
1935 | else | |
1936 | ctx->reader_contended = 0; | |
1937 | ||
1938 | WARN_ON_ONCE(!ctx->reader_present); | |
1939 | } | |
1940 | ||
1941 | WRITE_ONCE(ctx->reader_present, 0); | |
f9ae3204 HR |
1942 | } |
1943 | ||
1944 | static void tls_rx_reader_unlock(struct sock *sk, struct tls_sw_context_rx *ctx) | |
1945 | { | |
1946 | tls_rx_reader_release(sk, ctx); | |
4cbc325e JK |
1947 | release_sock(sk); |
1948 | } | |
1949 | ||
c46234eb DW |
1950 | int tls_sw_recvmsg(struct sock *sk, |
1951 | struct msghdr *msg, | |
1952 | size_t len, | |
c46234eb DW |
1953 | int flags, |
1954 | int *addr_len) | |
1955 | { | |
1956 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
f66de3ee | 1957 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); |
4509de14 | 1958 | struct tls_prot_info *prot = &tls_ctx->prot_info; |
cbbdee99 | 1959 | ssize_t decrypted = 0, async_copy_bytes = 0; |
d3b18ad3 | 1960 | struct sk_psock *psock; |
692d7b5d | 1961 | unsigned char control = 0; |
c46b0183 | 1962 | size_t flushed_at = 0; |
c46234eb | 1963 | struct strp_msg *rxm; |
2b794c40 | 1964 | struct tls_msg *tlm; |
c46234eb | 1965 | ssize_t copied = 0; |
6caaf104 | 1966 | ssize_t peeked = 0; |
7da18bcc | 1967 | bool async = false; |
70f03fc2 | 1968 | int target, err; |
00e23707 | 1969 | bool is_kvec = iov_iter_is_kvec(&msg->msg_iter); |
692d7b5d | 1970 | bool is_peek = flags & MSG_PEEK; |
ec823bf3 | 1971 | bool rx_more = false; |
84c61fe1 | 1972 | bool released = true; |
e91de6af | 1973 | bool bpf_strp_enabled; |
ba13609d | 1974 | bool zc_capable; |
c46234eb | 1975 | |
c46234eb DW |
1976 | if (unlikely(flags & MSG_ERRQUEUE)) |
1977 | return sock_recv_errqueue(sk, msg, len, SOL_IP, IP_RECVERR); | |
1978 | ||
d3b18ad3 | 1979 | psock = sk_psock_get(sk); |
70f03fc2 JK |
1980 | err = tls_rx_reader_lock(sk, ctx, flags & MSG_DONTWAIT); |
1981 | if (err < 0) | |
1982 | return err; | |
e91de6af | 1983 | bpf_strp_enabled = sk_psock_strp_enabled(psock); |
c46234eb | 1984 | |
f314bfee JK |
1985 | /* If crypto failed the connection is broken */ |
1986 | err = ctx->async_wait.err; | |
1987 | if (err) | |
1988 | goto end; | |
1989 | ||
692d7b5d | 1990 | /* Process pending decrypted records. It must be non-zero-copy */ |
ec823bf3 | 1991 | err = process_rx_list(ctx, msg, &control, 0, len, is_peek, &rx_more); |
4dcdd971 | 1992 | if (err < 0) |
692d7b5d | 1993 | goto end; |
692d7b5d | 1994 | |
d5123edd | 1995 | copied = err; |
ec823bf3 | 1996 | if (len <= copied || (copied && control != TLS_RECORD_TYPE_DATA) || rx_more) |
bfc06e1a | 1997 | goto end; |
46a16959 JK |
1998 | |
1999 | target = sock_rcvlowat(sk, flags & MSG_WAITALL, len); | |
2000 | len = len - copied; | |
692d7b5d | 2001 | |
ba13609d | 2002 | zc_capable = !bpf_strp_enabled && !is_kvec && !is_peek && |
88527790 | 2003 | ctx->zc_capable; |
bfc06e1a | 2004 | decrypted = 0; |
b92a13d4 | 2005 | while (len && (decrypted + copied < target || tls_strp_msg_ready(ctx))) { |
6bd116c8 | 2006 | struct tls_decrypt_arg darg; |
9bdf75cc | 2007 | int to_decrypt, chunk; |
c46234eb | 2008 | |
70f03fc2 JK |
2009 | err = tls_rx_rec_wait(sk, psock, flags & MSG_DONTWAIT, |
2010 | released); | |
35560b7f | 2011 | if (err <= 0) { |
d3b18ad3 | 2012 | if (psock) { |
0775639c JK |
2013 | chunk = sk_msg_recvmsg(sk, psock, msg, len, |
2014 | flags); | |
008141de JK |
2015 | if (chunk > 0) { |
2016 | decrypted += chunk; | |
2017 | len -= chunk; | |
2018 | continue; | |
2019 | } | |
d3b18ad3 | 2020 | } |
c46234eb | 2021 | goto recv_end; |
d3b18ad3 | 2022 | } |
c46234eb | 2023 | |
6bd116c8 JK |
2024 | memset(&darg.inargs, 0, sizeof(darg.inargs)); |
2025 | ||
84c61fe1 JK |
2026 | rxm = strp_msg(tls_strp_msg(ctx)); |
2027 | tlm = tls_msg(tls_strp_msg(ctx)); | |
94524d8f | 2028 | |
4509de14 | 2029 | to_decrypt = rxm->full_len - prot->overhead_size; |
fedf201e | 2030 | |
ba13609d JK |
2031 | if (zc_capable && to_decrypt <= len && |
2032 | tlm->control == TLS_RECORD_TYPE_DATA) | |
4175eac3 | 2033 | darg.zc = true; |
fedf201e | 2034 | |
c0ab4732 | 2035 | /* Do not use async mode if record is non-data */ |
c3f6bb74 | 2036 | if (tlm->control == TLS_RECORD_TYPE_DATA && !bpf_strp_enabled) |
4175eac3 | 2037 | darg.async = ctx->async_capable; |
c0ab4732 | 2038 | else |
4175eac3 | 2039 | darg.async = false; |
c0ab4732 | 2040 | |
dd47ed36 | 2041 | err = tls_rx_one_record(sk, msg, &darg); |
3547a1f9 | 2042 | if (err < 0) { |
da353fac | 2043 | tls_err_abort(sk, -EBADMSG); |
fedf201e DW |
2044 | goto recv_end; |
2045 | } | |
2046 | ||
3547a1f9 | 2047 | async |= darg.async; |
2b794c40 VG |
2048 | |
2049 | /* If the type of records being processed is not known yet, | |
2050 | * set it to record type just dequeued. If it is already known, | |
2051 | * but does not match the record type just dequeued, go to end. | |
2052 | * We always get record type here since for tls1.2, record type | |
2053 | * is known just after record is dequeued from stream parser. | |
2054 | * For tls1.3, we disable async. | |
2055 | */ | |
b93f5700 | 2056 | err = tls_record_content_type(msg, tls_msg(darg.skb), &control); |
abb47dc9 | 2057 | if (err <= 0) { |
b93f5700 | 2058 | DEBUG_NET_WARN_ON_ONCE(darg.zc); |
abb47dc9 JK |
2059 | tls_rx_rec_done(ctx); |
2060 | put_on_rx_list_err: | |
b93f5700 | 2061 | __skb_queue_tail(&ctx->rx_list, darg.skb); |
2b794c40 | 2062 | goto recv_end; |
abb47dc9 | 2063 | } |
fedf201e | 2064 | |
c46b0183 | 2065 | /* periodically flush backlog, and feed strparser */ |
84c61fe1 JK |
2066 | released = tls_read_flush_backlog(sk, prot, len, to_decrypt, |
2067 | decrypted + copied, | |
2068 | &flushed_at); | |
c46b0183 | 2069 | |
abb47dc9 | 2070 | /* TLS 1.3 may have updated the length by more than overhead */ |
b93f5700 | 2071 | rxm = strp_msg(darg.skb); |
abb47dc9 JK |
2072 | chunk = rxm->full_len; |
2073 | tls_rx_rec_done(ctx); | |
b1a2c178 | 2074 | |
4175eac3 | 2075 | if (!darg.zc) { |
f940b6ef | 2076 | bool partially_consumed = chunk > len; |
b93f5700 JK |
2077 | struct sk_buff *skb = darg.skb; |
2078 | ||
e20691fa | 2079 | DEBUG_NET_WARN_ON_ONCE(darg.skb == ctx->strp.anchor); |
f940b6ef | 2080 | |
cbbdee99 JK |
2081 | if (async) { |
2082 | /* TLS 1.2-only, to_decrypt must be text len */ | |
2083 | chunk = min_t(int, to_decrypt, len); | |
2084 | async_copy_bytes += chunk; | |
2085 | put_on_rx_list: | |
2086 | decrypted += chunk; | |
2087 | len -= chunk; | |
2088 | __skb_queue_tail(&ctx->rx_list, skb); | |
10f41d07 SD |
2089 | if (unlikely(control != TLS_RECORD_TYPE_DATA)) |
2090 | break; | |
cbbdee99 JK |
2091 | continue; |
2092 | } | |
2093 | ||
e91de6af | 2094 | if (bpf_strp_enabled) { |
84c61fe1 | 2095 | released = true; |
e91de6af JF |
2096 | err = sk_psock_tls_strp_read(psock, skb); |
2097 | if (err != __SK_PASS) { | |
2098 | rxm->offset = rxm->offset + rxm->full_len; | |
2099 | rxm->full_len = 0; | |
2100 | if (err == __SK_DROP) | |
2101 | consume_skb(skb); | |
e91de6af JF |
2102 | continue; |
2103 | } | |
2104 | } | |
2105 | ||
f940b6ef | 2106 | if (partially_consumed) |
fedf201e | 2107 | chunk = len; |
692d7b5d | 2108 | |
fedf201e DW |
2109 | err = skb_copy_datagram_msg(skb, rxm->offset, |
2110 | msg, chunk); | |
abb47dc9 JK |
2111 | if (err < 0) |
2112 | goto put_on_rx_list_err; | |
94524d8f | 2113 | |
6caaf104 SD |
2114 | if (is_peek) { |
2115 | peeked += chunk; | |
008141de | 2116 | goto put_on_rx_list; |
6caaf104 | 2117 | } |
f940b6ef JK |
2118 | |
2119 | if (partially_consumed) { | |
2120 | rxm->offset += chunk; | |
2121 | rxm->full_len -= chunk; | |
008141de | 2122 | goto put_on_rx_list; |
692d7b5d | 2123 | } |
b93f5700 JK |
2124 | |
2125 | consume_skb(skb); | |
c46234eb DW |
2126 | } |
2127 | ||
692d7b5d | 2128 | decrypted += chunk; |
c46234eb | 2129 | len -= chunk; |
692d7b5d | 2130 | |
f940b6ef JK |
2131 | /* Return full control message to userspace before trying |
2132 | * to parse another message type | |
2133 | */ | |
2134 | msg->msg_flags |= MSG_EOR; | |
2135 | if (control != TLS_RECORD_TYPE_DATA) | |
2136 | break; | |
04b25a54 | 2137 | } |
c46234eb DW |
2138 | |
2139 | recv_end: | |
7da18bcc | 2140 | if (async) { |
c57ca512 | 2141 | int ret; |
7da18bcc | 2142 | |
94524d8f | 2143 | /* Wait for all previously submitted records to be decrypted */ |
c57ca512 | 2144 | ret = tls_decrypt_async_wait(ctx); |
c618db2a JK |
2145 | __skb_queue_purge(&ctx->async_hold); |
2146 | ||
2147 | if (ret) { | |
2148 | if (err >= 0 || err == -EINPROGRESS) | |
2149 | err = ret; | |
2150 | decrypted = 0; | |
2151 | goto end; | |
94524d8f | 2152 | } |
0cada332 | 2153 | |
692d7b5d VG |
2154 | /* Drain records from the rx_list & copy if required */ |
2155 | if (is_peek || is_kvec) | |
6caaf104 SD |
2156 | err = process_rx_list(ctx, msg, &control, copied + peeked, |
2157 | decrypted - peeked, is_peek, NULL); | |
692d7b5d | 2158 | else |
06554f4f | 2159 | err = process_rx_list(ctx, msg, &control, 0, |
ec823bf3 | 2160 | async_copy_bytes, is_peek, NULL); |
94524d8f VG |
2161 | } |
2162 | ||
692d7b5d VG |
2163 | copied += decrypted; |
2164 | ||
2165 | end: | |
4cbc325e | 2166 | tls_rx_reader_unlock(sk, ctx); |
d3b18ad3 JF |
2167 | if (psock) |
2168 | sk_psock_put(sk, psock); | |
c46234eb DW |
2169 | return copied ? : err; |
2170 | } | |
2171 | ||
2172 | ssize_t tls_sw_splice_read(struct socket *sock, loff_t *ppos, | |
2173 | struct pipe_inode_info *pipe, | |
2174 | size_t len, unsigned int flags) | |
2175 | { | |
2176 | struct tls_context *tls_ctx = tls_get_ctx(sock->sk); | |
f66de3ee | 2177 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); |
c46234eb DW |
2178 | struct strp_msg *rxm = NULL; |
2179 | struct sock *sk = sock->sk; | |
c3f6bb74 | 2180 | struct tls_msg *tlm; |
c46234eb DW |
2181 | struct sk_buff *skb; |
2182 | ssize_t copied = 0; | |
c46234eb | 2183 | int chunk; |
70f03fc2 | 2184 | int err; |
c46234eb | 2185 | |
70f03fc2 JK |
2186 | err = tls_rx_reader_lock(sk, ctx, flags & SPLICE_F_NONBLOCK); |
2187 | if (err < 0) | |
2188 | return err; | |
c46234eb | 2189 | |
abb47dc9 | 2190 | if (!skb_queue_empty(&ctx->rx_list)) { |
e062fe99 JK |
2191 | skb = __skb_dequeue(&ctx->rx_list); |
2192 | } else { | |
6bd116c8 | 2193 | struct tls_decrypt_arg darg; |
4175eac3 | 2194 | |
35560b7f | 2195 | err = tls_rx_rec_wait(sk, NULL, flags & SPLICE_F_NONBLOCK, |
70f03fc2 | 2196 | true); |
35560b7f | 2197 | if (err <= 0) |
e062fe99 | 2198 | goto splice_read_end; |
c46234eb | 2199 | |
6bd116c8 JK |
2200 | memset(&darg.inargs, 0, sizeof(darg.inargs)); |
2201 | ||
541cc48b | 2202 | err = tls_rx_one_record(sk, NULL, &darg); |
e062fe99 JK |
2203 | if (err < 0) { |
2204 | tls_err_abort(sk, -EBADMSG); | |
2205 | goto splice_read_end; | |
2206 | } | |
abb47dc9 JK |
2207 | |
2208 | tls_rx_rec_done(ctx); | |
6bd116c8 | 2209 | skb = darg.skb; |
520493f6 | 2210 | } |
fedf201e | 2211 | |
c3f6bb74 JK |
2212 | rxm = strp_msg(skb); |
2213 | tlm = tls_msg(skb); | |
2214 | ||
520493f6 | 2215 | /* splice does not support reading control messages */ |
c3f6bb74 | 2216 | if (tlm->control != TLS_RECORD_TYPE_DATA) { |
520493f6 | 2217 | err = -EINVAL; |
abb47dc9 | 2218 | goto splice_requeue; |
c46234eb | 2219 | } |
520493f6 | 2220 | |
c46234eb DW |
2221 | chunk = min_t(unsigned int, rxm->full_len, len); |
2222 | copied = skb_splice_bits(skb, sk, rxm->offset, pipe, chunk, flags); | |
2223 | if (copied < 0) | |
abb47dc9 | 2224 | goto splice_requeue; |
c46234eb | 2225 | |
e062fe99 | 2226 | if (chunk < rxm->full_len) { |
e062fe99 JK |
2227 | rxm->offset += len; |
2228 | rxm->full_len -= len; | |
abb47dc9 | 2229 | goto splice_requeue; |
e062fe99 | 2230 | } |
c46234eb | 2231 | |
abb47dc9 JK |
2232 | consume_skb(skb); |
2233 | ||
c46234eb | 2234 | splice_read_end: |
4cbc325e | 2235 | tls_rx_reader_unlock(sk, ctx); |
c46234eb | 2236 | return copied ? : err; |
abb47dc9 JK |
2237 | |
2238 | splice_requeue: | |
2239 | __skb_queue_head(&ctx->rx_list, skb); | |
2240 | goto splice_read_end; | |
c46234eb DW |
2241 | } |
2242 | ||
662fbcec HR |
2243 | int tls_sw_read_sock(struct sock *sk, read_descriptor_t *desc, |
2244 | sk_read_actor_t read_actor) | |
2245 | { | |
2246 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
2247 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); | |
2248 | struct tls_prot_info *prot = &tls_ctx->prot_info; | |
2249 | struct strp_msg *rxm = NULL; | |
2250 | struct sk_buff *skb = NULL; | |
2251 | struct sk_psock *psock; | |
2252 | size_t flushed_at = 0; | |
2253 | bool released = true; | |
2254 | struct tls_msg *tlm; | |
2255 | ssize_t copied = 0; | |
2256 | ssize_t decrypted; | |
2257 | int err, used; | |
2258 | ||
2259 | psock = sk_psock_get(sk); | |
2260 | if (psock) { | |
2261 | sk_psock_put(sk, psock); | |
2262 | return -EINVAL; | |
2263 | } | |
2264 | err = tls_rx_reader_acquire(sk, ctx, true); | |
2265 | if (err < 0) | |
2266 | return err; | |
2267 | ||
2268 | /* If crypto failed the connection is broken */ | |
2269 | err = ctx->async_wait.err; | |
2270 | if (err) | |
2271 | goto read_sock_end; | |
2272 | ||
2273 | decrypted = 0; | |
2274 | do { | |
2275 | if (!skb_queue_empty(&ctx->rx_list)) { | |
2276 | skb = __skb_dequeue(&ctx->rx_list); | |
2277 | rxm = strp_msg(skb); | |
2278 | tlm = tls_msg(skb); | |
2279 | } else { | |
2280 | struct tls_decrypt_arg darg; | |
662fbcec HR |
2281 | |
2282 | err = tls_rx_rec_wait(sk, NULL, true, released); | |
2283 | if (err <= 0) | |
2284 | goto read_sock_end; | |
2285 | ||
2286 | memset(&darg.inargs, 0, sizeof(darg.inargs)); | |
2287 | ||
662fbcec HR |
2288 | err = tls_rx_one_record(sk, NULL, &darg); |
2289 | if (err < 0) { | |
2290 | tls_err_abort(sk, -EBADMSG); | |
2291 | goto read_sock_end; | |
2292 | } | |
2293 | ||
ba4a734e HR |
2294 | released = tls_read_flush_backlog(sk, prot, INT_MAX, |
2295 | 0, decrypted, | |
2296 | &flushed_at); | |
662fbcec | 2297 | skb = darg.skb; |
ba4a734e HR |
2298 | rxm = strp_msg(skb); |
2299 | tlm = tls_msg(skb); | |
662fbcec HR |
2300 | decrypted += rxm->full_len; |
2301 | ||
2302 | tls_rx_rec_done(ctx); | |
2303 | } | |
2304 | ||
2305 | /* read_sock does not support reading control messages */ | |
2306 | if (tlm->control != TLS_RECORD_TYPE_DATA) { | |
2307 | err = -EINVAL; | |
2308 | goto read_sock_requeue; | |
2309 | } | |
2310 | ||
2311 | used = read_actor(desc, skb, rxm->offset, rxm->full_len); | |
2312 | if (used <= 0) { | |
2313 | if (!copied) | |
2314 | err = used; | |
2315 | goto read_sock_requeue; | |
2316 | } | |
2317 | copied += used; | |
2318 | if (used < rxm->full_len) { | |
2319 | rxm->offset += used; | |
2320 | rxm->full_len -= used; | |
2321 | if (!desc->count) | |
2322 | goto read_sock_requeue; | |
2323 | } else { | |
2324 | consume_skb(skb); | |
2325 | if (!desc->count) | |
2326 | skb = NULL; | |
2327 | } | |
2328 | } while (skb); | |
2329 | ||
2330 | read_sock_end: | |
2331 | tls_rx_reader_release(sk, ctx); | |
2332 | return copied ? : err; | |
2333 | ||
2334 | read_sock_requeue: | |
2335 | __skb_queue_head(&ctx->rx_list, skb); | |
2336 | goto read_sock_end; | |
2337 | } | |
2338 | ||
7b50ecfc | 2339 | bool tls_sw_sock_is_readable(struct sock *sk) |
c46234eb | 2340 | { |
c46234eb | 2341 | struct tls_context *tls_ctx = tls_get_ctx(sk); |
f66de3ee | 2342 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); |
d3b18ad3 JF |
2343 | bool ingress_empty = true; |
2344 | struct sk_psock *psock; | |
c46234eb | 2345 | |
d3b18ad3 JF |
2346 | rcu_read_lock(); |
2347 | psock = sk_psock(sk); | |
2348 | if (psock) | |
2349 | ingress_empty = list_empty(&psock->ingress_msg); | |
2350 | rcu_read_unlock(); | |
c46234eb | 2351 | |
b92a13d4 | 2352 | return !ingress_empty || tls_strp_msg_ready(ctx) || |
13aecb17 | 2353 | !skb_queue_empty(&ctx->rx_list); |
c46234eb DW |
2354 | } |
2355 | ||
84c61fe1 | 2356 | int tls_rx_msg_size(struct tls_strparser *strp, struct sk_buff *skb) |
c46234eb DW |
2357 | { |
2358 | struct tls_context *tls_ctx = tls_get_ctx(strp->sk); | |
4509de14 | 2359 | struct tls_prot_info *prot = &tls_ctx->prot_info; |
bee6b7b3 | 2360 | char header[TLS_HEADER_SIZE + TLS_MAX_IV_SIZE]; |
c46234eb DW |
2361 | size_t cipher_overhead; |
2362 | size_t data_len = 0; | |
2363 | int ret; | |
2364 | ||
2365 | /* Verify that we have a full TLS header, or wait for more data */ | |
84c61fe1 | 2366 | if (strp->stm.offset + prot->prepend_size > skb->len) |
c46234eb DW |
2367 | return 0; |
2368 | ||
3463e51d | 2369 | /* Sanity-check size of on-stack buffer. */ |
4509de14 | 2370 | if (WARN_ON(prot->prepend_size > sizeof(header))) { |
3463e51d KC |
2371 | ret = -EINVAL; |
2372 | goto read_failure; | |
2373 | } | |
2374 | ||
c46234eb | 2375 | /* Linearize header to local buffer */ |
84c61fe1 | 2376 | ret = skb_copy_bits(skb, strp->stm.offset, header, prot->prepend_size); |
c46234eb DW |
2377 | if (ret < 0) |
2378 | goto read_failure; | |
2379 | ||
84c61fe1 | 2380 | strp->mark = header[0]; |
c46234eb DW |
2381 | |
2382 | data_len = ((header[4] & 0xFF) | (header[3] << 8)); | |
2383 | ||
4509de14 | 2384 | cipher_overhead = prot->tag_size; |
a6acbe62 VF |
2385 | if (prot->version != TLS_1_3_VERSION && |
2386 | prot->cipher_type != TLS_CIPHER_CHACHA20_POLY1305) | |
4509de14 | 2387 | cipher_overhead += prot->iv_size; |
c46234eb | 2388 | |
130b392c | 2389 | if (data_len > TLS_MAX_PAYLOAD_SIZE + cipher_overhead + |
4509de14 | 2390 | prot->tail_size) { |
c46234eb DW |
2391 | ret = -EMSGSIZE; |
2392 | goto read_failure; | |
2393 | } | |
2394 | if (data_len < cipher_overhead) { | |
2395 | ret = -EBADMSG; | |
2396 | goto read_failure; | |
2397 | } | |
2398 | ||
130b392c DW |
2399 | /* Note that both TLS1.3 and TLS1.2 use TLS_1_2 version here */ |
2400 | if (header[1] != TLS_1_2_VERSION_MINOR || | |
2401 | header[2] != TLS_1_2_VERSION_MAJOR) { | |
c46234eb DW |
2402 | ret = -EINVAL; |
2403 | goto read_failure; | |
2404 | } | |
be2fbc15 | 2405 | |
f953d33b | 2406 | tls_device_rx_resync_new_rec(strp->sk, data_len + TLS_HEADER_SIZE, |
84c61fe1 | 2407 | TCP_SKB_CB(skb)->seq + strp->stm.offset); |
c46234eb DW |
2408 | return data_len + TLS_HEADER_SIZE; |
2409 | ||
2410 | read_failure: | |
2411 | tls_err_abort(strp->sk, ret); | |
2412 | ||
2413 | return ret; | |
2414 | } | |
2415 | ||
84c61fe1 | 2416 | void tls_rx_msg_ready(struct tls_strparser *strp) |
c46234eb | 2417 | { |
84c61fe1 | 2418 | struct tls_sw_context_rx *ctx; |
c46234eb | 2419 | |
84c61fe1 | 2420 | ctx = container_of(strp, struct tls_sw_context_rx, strp); |
ad13acce | 2421 | ctx->saved_data_ready(strp->sk); |
c46234eb DW |
2422 | } |
2423 | ||
2424 | static void tls_data_ready(struct sock *sk) | |
2425 | { | |
2426 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
f66de3ee | 2427 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); |
d3b18ad3 | 2428 | struct sk_psock *psock; |
74836ec8 | 2429 | gfp_t alloc_save; |
c46234eb | 2430 | |
40e0b090 PY |
2431 | trace_sk_data_ready(sk); |
2432 | ||
74836ec8 JK |
2433 | alloc_save = sk->sk_allocation; |
2434 | sk->sk_allocation = GFP_ATOMIC; | |
84c61fe1 | 2435 | tls_strp_data_ready(&ctx->strp); |
74836ec8 | 2436 | sk->sk_allocation = alloc_save; |
d3b18ad3 JF |
2437 | |
2438 | psock = sk_psock_get(sk); | |
62b4011f XY |
2439 | if (psock) { |
2440 | if (!list_empty(&psock->ingress_msg)) | |
2441 | ctx->saved_data_ready(sk); | |
d3b18ad3 JF |
2442 | sk_psock_put(sk, psock); |
2443 | } | |
c46234eb DW |
2444 | } |
2445 | ||
f87e62d4 JF |
2446 | void tls_sw_cancel_work_tx(struct tls_context *tls_ctx) |
2447 | { | |
2448 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); | |
2449 | ||
2450 | set_bit(BIT_TX_CLOSING, &ctx->tx_bitmask); | |
2451 | set_bit(BIT_TX_SCHEDULED, &ctx->tx_bitmask); | |
2452 | cancel_delayed_work_sync(&ctx->tx_work.work); | |
2453 | } | |
2454 | ||
313ab004 | 2455 | void tls_sw_release_resources_tx(struct sock *sk) |
3c4d7559 DW |
2456 | { |
2457 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
f66de3ee | 2458 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); |
a42055e8 VG |
2459 | struct tls_rec *rec, *tmp; |
2460 | ||
2461 | /* Wait for any pending async encryptions to complete */ | |
c57ca512 | 2462 | tls_encrypt_async_wait(ctx); |
a42055e8 | 2463 | |
a42055e8 VG |
2464 | tls_tx_records(sk, -1); |
2465 | ||
9932a29a | 2466 | /* Free up un-sent records in tx_list. First, free |
a42055e8 VG |
2467 | * the partially sent record if any at head of tx_list. |
2468 | */ | |
c5daa6cc JK |
2469 | if (tls_ctx->partially_sent_record) { |
2470 | tls_free_partial_record(sk, tls_ctx); | |
9932a29a | 2471 | rec = list_first_entry(&ctx->tx_list, |
a42055e8 VG |
2472 | struct tls_rec, list); |
2473 | list_del(&rec->list); | |
d829e9c4 | 2474 | sk_msg_free(sk, &rec->msg_plaintext); |
a42055e8 VG |
2475 | kfree(rec); |
2476 | } | |
2477 | ||
9932a29a | 2478 | list_for_each_entry_safe(rec, tmp, &ctx->tx_list, list) { |
a42055e8 | 2479 | list_del(&rec->list); |
d829e9c4 DB |
2480 | sk_msg_free(sk, &rec->msg_encrypted); |
2481 | sk_msg_free(sk, &rec->msg_plaintext); | |
a42055e8 VG |
2482 | kfree(rec); |
2483 | } | |
3c4d7559 | 2484 | |
201876b3 | 2485 | crypto_free_aead(ctx->aead_send); |
c774973e | 2486 | tls_free_open_rec(sk); |
313ab004 JF |
2487 | } |
2488 | ||
2489 | void tls_sw_free_ctx_tx(struct tls_context *tls_ctx) | |
2490 | { | |
2491 | struct tls_sw_context_tx *ctx = tls_sw_ctx_tx(tls_ctx); | |
f66de3ee BP |
2492 | |
2493 | kfree(ctx); | |
2494 | } | |
2495 | ||
39f56e1a | 2496 | void tls_sw_release_resources_rx(struct sock *sk) |
f66de3ee BP |
2497 | { |
2498 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
2499 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); | |
2500 | ||
c46234eb | 2501 | if (ctx->aead_recv) { |
a30295c4 | 2502 | __skb_queue_purge(&ctx->rx_list); |
c46234eb | 2503 | crypto_free_aead(ctx->aead_recv); |
84c61fe1 | 2504 | tls_strp_stop(&ctx->strp); |
313ab004 | 2505 | /* If tls_sw_strparser_arm() was not called (cleanup paths) |
84c61fe1 | 2506 | * we still want to tls_strp_stop(), but sk->sk_data_ready was |
313ab004 JF |
2507 | * never swapped. |
2508 | */ | |
2509 | if (ctx->saved_data_ready) { | |
2510 | write_lock_bh(&sk->sk_callback_lock); | |
2511 | sk->sk_data_ready = ctx->saved_data_ready; | |
2512 | write_unlock_bh(&sk->sk_callback_lock); | |
2513 | } | |
c46234eb | 2514 | } |
39f56e1a BP |
2515 | } |
2516 | ||
313ab004 | 2517 | void tls_sw_strparser_done(struct tls_context *tls_ctx) |
39f56e1a | 2518 | { |
39f56e1a BP |
2519 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); |
2520 | ||
84c61fe1 | 2521 | tls_strp_done(&ctx->strp); |
313ab004 JF |
2522 | } |
2523 | ||
2524 | void tls_sw_free_ctx_rx(struct tls_context *tls_ctx) | |
2525 | { | |
2526 | struct tls_sw_context_rx *ctx = tls_sw_ctx_rx(tls_ctx); | |
3c4d7559 | 2527 | |
3c4d7559 DW |
2528 | kfree(ctx); |
2529 | } | |
2530 | ||
313ab004 JF |
2531 | void tls_sw_free_resources_rx(struct sock *sk) |
2532 | { | |
2533 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
2534 | ||
2535 | tls_sw_release_resources_rx(sk); | |
2536 | tls_sw_free_ctx_rx(tls_ctx); | |
2537 | } | |
2538 | ||
9932a29a | 2539 | /* The work handler to transmitt the encrypted records in tx_list */ |
a42055e8 VG |
2540 | static void tx_work_handler(struct work_struct *work) |
2541 | { | |
2542 | struct delayed_work *delayed_work = to_delayed_work(work); | |
2543 | struct tx_work *tx_work = container_of(delayed_work, | |
2544 | struct tx_work, work); | |
2545 | struct sock *sk = tx_work->sk; | |
2546 | struct tls_context *tls_ctx = tls_get_ctx(sk); | |
f87e62d4 | 2547 | struct tls_sw_context_tx *ctx; |
a42055e8 | 2548 | |
f87e62d4 | 2549 | if (unlikely(!tls_ctx)) |
a42055e8 VG |
2550 | return; |
2551 | ||
f87e62d4 JF |
2552 | ctx = tls_sw_ctx_tx(tls_ctx); |
2553 | if (test_bit(BIT_TX_CLOSING, &ctx->tx_bitmask)) | |
2554 | return; | |
2555 | ||
2556 | if (!test_and_clear_bit(BIT_TX_SCHEDULED, &ctx->tx_bitmask)) | |
2557 | return; | |
f3221361 JK |
2558 | |
2559 | if (mutex_trylock(&tls_ctx->tx_lock)) { | |
2560 | lock_sock(sk); | |
2561 | tls_tx_records(sk, -1); | |
2562 | release_sock(sk); | |
2563 | mutex_unlock(&tls_ctx->tx_lock); | |
2564 | } else if (!test_and_set_bit(BIT_TX_SCHEDULED, &ctx->tx_bitmask)) { | |
2565 | /* Someone is holding the tx_lock, they will likely run Tx | |
2566 | * and cancel the work on their way out of the lock section. | |
2567 | * Schedule a long delay just in case. | |
2568 | */ | |
2569 | schedule_delayed_work(&ctx->tx_work.work, msecs_to_jiffies(10)); | |
2570 | } | |
a42055e8 VG |
2571 | } |
2572 | ||
58790314 JK |
2573 | static bool tls_is_tx_ready(struct tls_sw_context_tx *ctx) |
2574 | { | |
2575 | struct tls_rec *rec; | |
2576 | ||
ffe2a225 | 2577 | rec = list_first_entry_or_null(&ctx->tx_list, struct tls_rec, list); |
58790314 JK |
2578 | if (!rec) |
2579 | return false; | |
2580 | ||
2581 | return READ_ONCE(rec->tx_ready); | |
2582 | } | |
2583 | ||
7463d3a2 BP |
2584 | void tls_sw_write_space(struct sock *sk, struct tls_context *ctx) |
2585 | { | |
2586 | struct tls_sw_context_tx *tx_ctx = tls_sw_ctx_tx(ctx); | |
2587 | ||
2588 | /* Schedule the transmission if tx list is ready */ | |
58790314 | 2589 | if (tls_is_tx_ready(tx_ctx) && |
02b1fa07 JK |
2590 | !test_and_set_bit(BIT_TX_SCHEDULED, &tx_ctx->tx_bitmask)) |
2591 | schedule_delayed_work(&tx_ctx->tx_work.work, 0); | |
7463d3a2 BP |
2592 | } |
2593 | ||
318892ac JK |
2594 | void tls_sw_strparser_arm(struct sock *sk, struct tls_context *tls_ctx) |
2595 | { | |
2596 | struct tls_sw_context_rx *rx_ctx = tls_sw_ctx_rx(tls_ctx); | |
2597 | ||
2598 | write_lock_bh(&sk->sk_callback_lock); | |
2599 | rx_ctx->saved_data_ready = sk->sk_data_ready; | |
2600 | sk->sk_data_ready = tls_data_ready; | |
2601 | write_unlock_bh(&sk->sk_callback_lock); | |
318892ac JK |
2602 | } |
2603 | ||
88527790 JK |
2604 | void tls_update_rx_zc_capable(struct tls_context *tls_ctx) |
2605 | { | |
2606 | struct tls_sw_context_rx *rx_ctx = tls_sw_ctx_rx(tls_ctx); | |
2607 | ||
2608 | rx_ctx->zc_capable = tls_ctx->rx_no_pad || | |
2609 | tls_ctx->prot_info.version != TLS_1_3_VERSION; | |
2610 | } | |
2611 | ||
615580cb SD |
2612 | static struct tls_sw_context_tx *init_ctx_tx(struct tls_context *ctx, struct sock *sk) |
2613 | { | |
2614 | struct tls_sw_context_tx *sw_ctx_tx; | |
2615 | ||
2616 | if (!ctx->priv_ctx_tx) { | |
2617 | sw_ctx_tx = kzalloc(sizeof(*sw_ctx_tx), GFP_KERNEL); | |
2618 | if (!sw_ctx_tx) | |
2619 | return NULL; | |
2620 | } else { | |
2621 | sw_ctx_tx = ctx->priv_ctx_tx; | |
2622 | } | |
2623 | ||
2624 | crypto_init_wait(&sw_ctx_tx->async_wait); | |
aec79619 | 2625 | atomic_set(&sw_ctx_tx->encrypt_pending, 1); |
615580cb SD |
2626 | INIT_LIST_HEAD(&sw_ctx_tx->tx_list); |
2627 | INIT_DELAYED_WORK(&sw_ctx_tx->tx_work.work, tx_work_handler); | |
2628 | sw_ctx_tx->tx_work.sk = sk; | |
2629 | ||
2630 | return sw_ctx_tx; | |
2631 | } | |
2632 | ||
2633 | static struct tls_sw_context_rx *init_ctx_rx(struct tls_context *ctx) | |
2634 | { | |
2635 | struct tls_sw_context_rx *sw_ctx_rx; | |
2636 | ||
2637 | if (!ctx->priv_ctx_rx) { | |
2638 | sw_ctx_rx = kzalloc(sizeof(*sw_ctx_rx), GFP_KERNEL); | |
2639 | if (!sw_ctx_rx) | |
2640 | return NULL; | |
2641 | } else { | |
2642 | sw_ctx_rx = ctx->priv_ctx_rx; | |
2643 | } | |
2644 | ||
2645 | crypto_init_wait(&sw_ctx_rx->async_wait); | |
aec79619 | 2646 | atomic_set(&sw_ctx_rx->decrypt_pending, 1); |
615580cb SD |
2647 | init_waitqueue_head(&sw_ctx_rx->wq); |
2648 | skb_queue_head_init(&sw_ctx_rx->rx_list); | |
2649 | skb_queue_head_init(&sw_ctx_rx->async_hold); | |
2650 | ||
2651 | return sw_ctx_rx; | |
2652 | } | |
2653 | ||
1a074f76 SD |
2654 | int init_prot_info(struct tls_prot_info *prot, |
2655 | const struct tls_crypto_info *crypto_info, | |
b7c4f573 | 2656 | const struct tls_cipher_desc *cipher_desc) |
a9937816 SD |
2657 | { |
2658 | u16 nonce_size = cipher_desc->nonce; | |
2659 | ||
2660 | if (crypto_info->version == TLS_1_3_VERSION) { | |
2661 | nonce_size = 0; | |
2662 | prot->aad_size = TLS_HEADER_SIZE; | |
2663 | prot->tail_size = 1; | |
2664 | } else { | |
2665 | prot->aad_size = TLS_AAD_SPACE_SIZE; | |
2666 | prot->tail_size = 0; | |
2667 | } | |
2668 | ||
2669 | /* Sanity-check the sizes for stack allocations. */ | |
2670 | if (nonce_size > TLS_MAX_IV_SIZE || prot->aad_size > TLS_MAX_AAD_SIZE) | |
2671 | return -EINVAL; | |
2672 | ||
2673 | prot->version = crypto_info->version; | |
2674 | prot->cipher_type = crypto_info->cipher_type; | |
2675 | prot->prepend_size = TLS_HEADER_SIZE + nonce_size; | |
2676 | prot->tag_size = cipher_desc->tag; | |
2677 | prot->overhead_size = prot->prepend_size + prot->tag_size + prot->tail_size; | |
2678 | prot->iv_size = cipher_desc->iv; | |
2679 | prot->salt_size = cipher_desc->salt; | |
2680 | prot->rec_seq_size = cipher_desc->rec_seq; | |
2681 | ||
2682 | return 0; | |
2683 | } | |
2684 | ||
b6a30ec9 | 2685 | int tls_set_sw_offload(struct sock *sk, int tx) |
3c4d7559 | 2686 | { |
f66de3ee BP |
2687 | struct tls_sw_context_tx *sw_ctx_tx = NULL; |
2688 | struct tls_sw_context_rx *sw_ctx_rx = NULL; | |
b6a30ec9 SD |
2689 | const struct tls_cipher_desc *cipher_desc; |
2690 | struct tls_crypto_info *crypto_info; | |
2691 | char *iv, *rec_seq, *key, *salt; | |
c46234eb | 2692 | struct cipher_context *cctx; |
b6a30ec9 | 2693 | struct tls_prot_info *prot; |
c46234eb | 2694 | struct crypto_aead **aead; |
b6a30ec9 | 2695 | struct tls_context *ctx; |
692d7b5d | 2696 | struct crypto_tfm *tfm; |
3c4d7559 DW |
2697 | int rc = 0; |
2698 | ||
b6a30ec9 SD |
2699 | ctx = tls_get_ctx(sk); |
2700 | prot = &ctx->prot_info; | |
3c4d7559 | 2701 | |
f66de3ee | 2702 | if (tx) { |
615580cb SD |
2703 | ctx->priv_ctx_tx = init_ctx_tx(ctx, sk); |
2704 | if (!ctx->priv_ctx_tx) | |
2705 | return -ENOMEM; | |
3c4d7559 | 2706 | |
615580cb | 2707 | sw_ctx_tx = ctx->priv_ctx_tx; |
86029d10 | 2708 | crypto_info = &ctx->crypto_send.info; |
c46234eb | 2709 | cctx = &ctx->tx; |
f66de3ee | 2710 | aead = &sw_ctx_tx->aead_send; |
c46234eb | 2711 | } else { |
615580cb SD |
2712 | ctx->priv_ctx_rx = init_ctx_rx(ctx); |
2713 | if (!ctx->priv_ctx_rx) | |
2714 | return -ENOMEM; | |
2715 | ||
2716 | sw_ctx_rx = ctx->priv_ctx_rx; | |
86029d10 | 2717 | crypto_info = &ctx->crypto_recv.info; |
c46234eb | 2718 | cctx = &ctx->rx; |
f66de3ee | 2719 | aead = &sw_ctx_rx->aead_recv; |
c46234eb DW |
2720 | } |
2721 | ||
f3e444e3 SD |
2722 | cipher_desc = get_cipher_desc(crypto_info->cipher_type); |
2723 | if (!cipher_desc) { | |
3c4d7559 | 2724 | rc = -EINVAL; |
cf6d43ef | 2725 | goto free_priv; |
3c4d7559 DW |
2726 | } |
2727 | ||
b7c4f573 | 2728 | rc = init_prot_info(prot, crypto_info, cipher_desc); |
a9937816 SD |
2729 | if (rc) |
2730 | goto free_priv; | |
d9a6ca1a | 2731 | |
48dfad27 SD |
2732 | iv = crypto_info_iv(crypto_info, cipher_desc); |
2733 | key = crypto_info_key(crypto_info, cipher_desc); | |
2734 | salt = crypto_info_salt(crypto_info, cipher_desc); | |
2735 | rec_seq = crypto_info_rec_seq(crypto_info, cipher_desc); | |
2736 | ||
d9a6ca1a SD |
2737 | memcpy(cctx->iv, salt, cipher_desc->salt); |
2738 | memcpy(cctx->iv + cipher_desc->salt, iv, cipher_desc->iv); | |
6d5029e5 | 2739 | memcpy(cctx->rec_seq, rec_seq, cipher_desc->rec_seq); |
c46234eb | 2740 | |
c46234eb | 2741 | if (!*aead) { |
f3e444e3 | 2742 | *aead = crypto_alloc_aead(cipher_desc->cipher_name, 0, 0); |
c46234eb DW |
2743 | if (IS_ERR(*aead)) { |
2744 | rc = PTR_ERR(*aead); | |
2745 | *aead = NULL; | |
1c1cb311 | 2746 | goto free_priv; |
3c4d7559 DW |
2747 | } |
2748 | } | |
2749 | ||
2750 | ctx->push_pending_record = tls_sw_push_pending_record; | |
2751 | ||
d9a6ca1a | 2752 | rc = crypto_aead_setkey(*aead, key, cipher_desc->key); |
3c4d7559 DW |
2753 | if (rc) |
2754 | goto free_aead; | |
2755 | ||
4509de14 | 2756 | rc = crypto_aead_setauthsize(*aead, prot->tag_size); |
c46234eb DW |
2757 | if (rc) |
2758 | goto free_aead; | |
2759 | ||
f66de3ee | 2760 | if (sw_ctx_rx) { |
692d7b5d | 2761 | tfm = crypto_aead_tfm(sw_ctx_rx->aead_recv); |
8497ded2 | 2762 | |
88527790 JK |
2763 | tls_update_rx_zc_capable(ctx); |
2764 | sw_ctx_rx->async_capable = | |
2765 | crypto_info->version != TLS_1_3_VERSION && | |
2766 | !!(tfm->__crt_alg->cra_flags & CRYPTO_ALG_ASYNC); | |
692d7b5d | 2767 | |
849f16bb JK |
2768 | rc = tls_strp_init(&sw_ctx_rx->strp, sk); |
2769 | if (rc) | |
2770 | goto free_aead; | |
c46234eb DW |
2771 | } |
2772 | ||
2773 | goto out; | |
3c4d7559 DW |
2774 | |
2775 | free_aead: | |
c46234eb DW |
2776 | crypto_free_aead(*aead); |
2777 | *aead = NULL; | |
cf6d43ef | 2778 | free_priv: |
f66de3ee BP |
2779 | if (tx) { |
2780 | kfree(ctx->priv_ctx_tx); | |
2781 | ctx->priv_ctx_tx = NULL; | |
2782 | } else { | |
2783 | kfree(ctx->priv_ctx_rx); | |
2784 | ctx->priv_ctx_rx = NULL; | |
2785 | } | |
3c4d7559 DW |
2786 | out: |
2787 | return rc; | |
2788 | } |