Merge tag '4.20-rc1-smb3-fixes' of git://git.samba.org/sfrench/cifs-2.6
[linux-2.6-block.git] / net / 9p / trans_fd.c
CommitLineData
bd238fb4
LI
1/*
2 * linux/fs/9p/trans_fd.c
3 *
4 * Fd transport layer. Includes deprecated socket layer.
5 *
6 * Copyright (C) 2006 by Russ Cox <rsc@swtch.com>
7 * Copyright (C) 2004-2005 by Latchesar Ionkov <lucho@ionkov.net>
8a0dc95f 8 * Copyright (C) 2004-2008 by Eric Van Hensbergen <ericvh@gmail.com>
bd238fb4
LI
9 * Copyright (C) 1997-2002 by Ron Minnich <rminnich@sarnoff.com>
10 *
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License version 2
13 * as published by the Free Software Foundation.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to:
22 * Free Software Foundation
23 * 51 Franklin Street, Fifth Floor
24 * Boston, MA 02111-1301 USA
25 *
26 */
27
5d385153
JP
28#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
29
bd238fb4
LI
30#include <linux/in.h>
31#include <linux/module.h>
32#include <linux/net.h>
33#include <linux/ipv6.h>
8a0dc95f 34#include <linux/kthread.h>
bd238fb4
LI
35#include <linux/errno.h>
36#include <linux/kernel.h>
37#include <linux/un.h>
38#include <linux/uaccess.h>
39#include <linux/inet.h>
40#include <linux/idr.h>
41#include <linux/file.h>
a80d923e 42#include <linux/parser.h>
5a0e3ad6 43#include <linux/slab.h>
c4fac910 44#include <linux/seq_file.h>
bd238fb4 45#include <net/9p/9p.h>
8b81ef58 46#include <net/9p/client.h>
bd238fb4
LI
47#include <net/9p/transport.h>
48
6b18662e
AV
49#include <linux/syscalls.h> /* killme */
50
bd238fb4 51#define P9_PORT 564
a80d923e 52#define MAX_SOCK_BUF (64*1024)
8a0dc95f 53#define MAXPOLLWADDR 2
a80d923e 54
c4fac910
DH
55static struct p9_trans_module p9_tcp_trans;
56static struct p9_trans_module p9_fd_trans;
57
ee443996
EVH
58/**
59 * struct p9_fd_opts - per-transport options
60 * @rfd: file descriptor for reading (trans=fd)
61 * @wfd: file descriptor for writing (trans=fd)
62 * @port: port to connect to (trans=tcp)
63 *
64 */
65
a80d923e
EVH
66struct p9_fd_opts {
67 int rfd;
68 int wfd;
69 u16 port;
c4fac910 70 bool privport;
a80d923e 71};
bd238fb4 72
a80d923e
EVH
73/*
74 * Option Parsing (code inspired by NFS code)
75 * - a little lazy - parse all fd-transport options
76 */
bd238fb4 77
a80d923e
EVH
enum {
	/* Options that take integer arguments */
	Opt_port,
	Opt_rfdno,
	Opt_wfdno,
	/* Paired with the NULL pattern that terminates the token table */
	Opt_err,
	/* Options that take no arguments */
	Opt_privport,
};
bd238fb4 84
a447c093 85static const match_table_t tokens = {
a80d923e
EVH
86 {Opt_port, "port=%u"},
87 {Opt_rfdno, "rfdno=%u"},
88 {Opt_wfdno, "wfdno=%u"},
2f28c8b3 89 {Opt_privport, "privport"},
55762690 90 {Opt_err, NULL},
a80d923e 91};
bd238fb4 92
8a0dc95f
EVH
/*
 * Scheduling state kept in p9_conn.wsched.  The values are handed to
 * set_bit()/clear_bit()/test_and_set_bit() as bit numbers.
 */
enum {
	Rworksched	= 1,	/* read work scheduled or running */
	Rpending	= 2,	/* can read */
	Wworksched	= 4,	/* write work scheduled or running */
	Wpending	= 8,	/* can write */
};
99
992b3f1d
TH
100struct p9_poll_wait {
101 struct p9_conn *conn;
ac6424b9 102 wait_queue_entry_t wait;
992b3f1d 103 wait_queue_head_t *wait_addr;
ee443996
EVH
104};
105
106/**
107 * struct p9_conn - fd mux connection state information
ee443996 108 * @mux_list: list link for mux to manage multiple connections (?)
8b81ef58 109 * @client: reference to client instance for this connection
ee443996 110 * @err: error state
ee443996
EVH
111 * @req_list: accounting for requests which have been sent
112 * @unsent_req_list: accounting for requests that haven't been sent
1b0a763b
EVH
113 * @req: current request being processed (if any)
114 * @tmp_buf: temporary buffer to read in header
947867aa 115 * @rc: temporary fcall for reading current frame
ee443996
EVH
116 * @wpos: write position for current frame
117 * @wsize: amount of data to write for current frame
118 * @wbuf: current write buffer
0e15597e 119 * @poll_pending_link: pending links to be polled per conn
ee443996 120 * @poll_wait: array of wait_q's for various worker threads
ee443996
EVH
121 * @pt: poll state
122 * @rq: current read work
123 * @wq: current write work
124 * @wsched: ????
125 *
126 */
8a0dc95f
EVH
127
128struct p9_conn {
8a0dc95f 129 struct list_head mux_list;
8b81ef58 130 struct p9_client *client;
8a0dc95f 131 int err;
8a0dc95f
EVH
132 struct list_head req_list;
133 struct list_head unsent_req_list;
6d35190f 134 struct p9_req_t *rreq;
728356de 135 struct p9_req_t *wreq;
1b0a763b 136 char tmp_buf[7];
947867aa 137 struct p9_fcall rc;
8a0dc95f
EVH
138 int wpos;
139 int wsize;
140 char *wbuf;
992b3f1d
TH
141 struct list_head poll_pending_link;
142 struct p9_poll_wait poll_wait[MAXPOLLWADDR];
8a0dc95f
EVH
143 poll_table pt;
144 struct work_struct rq;
145 struct work_struct wq;
146 unsigned long wsched;
147};
148
263c5828
SD
149/**
150 * struct p9_trans_fd - transport state
151 * @rd: reference to file to read from
152 * @wr: reference of file to write to
153 * @conn: connection state reference
154 *
155 */
156
157struct p9_trans_fd {
158 struct file *rd;
159 struct file *wr;
160 struct p9_conn conn;
161};
162
aa70c585
TH
163static void p9_poll_workfn(struct work_struct *work);
164
992b3f1d
TH
165static DEFINE_SPINLOCK(p9_poll_lock);
166static LIST_HEAD(p9_poll_pending_list);
aa70c585 167static DECLARE_WORK(p9_poll_work, p9_poll_workfn);
8a0dc95f 168
2f28c8b3
JG
169static unsigned int p9_ipport_resv_min = P9_DEF_MIN_RESVPORT;
170static unsigned int p9_ipport_resv_max = P9_DEF_MAX_RESVPORT;
171
992b3f1d 172static void p9_mux_poll_stop(struct p9_conn *m)
8a0dc95f 173{
992b3f1d
TH
174 unsigned long flags;
175 int i;
8a0dc95f 176
992b3f1d
TH
177 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
178 struct p9_poll_wait *pwait = &m->poll_wait[i];
8a0dc95f 179
992b3f1d
TH
180 if (pwait->wait_addr) {
181 remove_wait_queue(pwait->wait_addr, &pwait->wait);
182 pwait->wait_addr = NULL;
8a0dc95f 183 }
8a0dc95f
EVH
184 }
185
992b3f1d
TH
186 spin_lock_irqsave(&p9_poll_lock, flags);
187 list_del_init(&m->poll_pending_link);
188 spin_unlock_irqrestore(&p9_poll_lock, flags);
430ac66e
TB
189
190 flush_work(&p9_poll_work);
8a0dc95f
EVH
191}
192
193/**
5503ac56
EVH
194 * p9_conn_cancel - cancel all pending requests with error
195 * @m: mux data
196 * @err: error code
8a0dc95f 197 *
8a0dc95f 198 */
ee443996 199
51a87c55 200static void p9_conn_cancel(struct p9_conn *m, int err)
8a0dc95f 201{
673d62cd 202 struct p9_req_t *req, *rtmp;
5503ac56 203 LIST_HEAD(cancel_list);
8a0dc95f 204
5d385153 205 p9_debug(P9_DEBUG_ERROR, "mux %p err %d\n", m, err);
7eb923b8 206
9f476d7c 207 spin_lock(&m->client->lock);
7eb923b8
EVH
208
209 if (m->err) {
9f476d7c 210 spin_unlock(&m->client->lock);
7eb923b8
EVH
211 return;
212 }
213
214 m->err = err;
215
5503ac56
EVH
216 list_for_each_entry_safe(req, rtmp, &m->req_list, req_list) {
217 list_move(&req->req_list, &cancel_list);
218 }
219 list_for_each_entry_safe(req, rtmp, &m->unsent_req_list, req_list) {
220 list_move(&req->req_list, &cancel_list);
8a0dc95f
EVH
221 }
222
5503ac56 223 list_for_each_entry_safe(req, rtmp, &cancel_list, req_list) {
5d385153 224 p9_debug(P9_DEBUG_ERROR, "call back req %p\n", req);
1bab88b2 225 list_del(&req->req_list);
2b6e72ed
DM
226 if (!req->t_err)
227 req->t_err = err;
228 p9_client_cb(m->client, req, REQ_STATUS_ERROR);
8a0dc95f 229 }
9f476d7c 230 spin_unlock(&m->client->lock);
8a0dc95f
EVH
231}
232
7594bf37
AV
233static __poll_t
234p9_fd_poll(struct p9_client *client, struct poll_table_struct *pt, int *err)
8a0dc95f 235{
9965ed17 236 __poll_t ret;
5503ac56 237 struct p9_trans_fd *ts = NULL;
8a0dc95f 238
5503ac56
EVH
239 if (client && client->status == Connected)
240 ts = client->trans;
7dc5d24b 241
7594bf37
AV
242 if (!ts) {
243 if (err)
244 *err = -EREMOTEIO;
a9a08845 245 return EPOLLERR;
7594bf37 246 }
7dc5d24b 247
9965ed17
CH
248 ret = vfs_poll(ts->rd, pt);
249 if (ts->rd != ts->wr)
250 ret = (ret & ~EPOLLOUT) | (vfs_poll(ts->wr, pt) & ~EPOLLIN);
5503ac56 251 return ret;
992b3f1d
TH
252}
253
8a0dc95f 254/**
5503ac56
EVH
255 * p9_fd_read- read from a fd
256 * @client: client instance
257 * @v: buffer to receive data into
258 * @len: size of receive buffer
ee443996 259 *
8a0dc95f 260 */
ee443996 261
5503ac56 262static int p9_fd_read(struct p9_client *client, void *v, int len)
8a0dc95f 263{
5503ac56
EVH
264 int ret;
265 struct p9_trans_fd *ts = NULL;
bdd1d2d3 266 loff_t pos;
8a0dc95f 267
5503ac56
EVH
268 if (client && client->status != Disconnected)
269 ts = client->trans;
8a0dc95f 270
5503ac56
EVH
271 if (!ts)
272 return -EREMOTEIO;
8a0dc95f 273
5503ac56 274 if (!(ts->rd->f_flags & O_NONBLOCK))
5d385153 275 p9_debug(P9_DEBUG_ERROR, "blocking read ...\n");
8a0dc95f 276
bdd1d2d3
CH
277 pos = ts->rd->f_pos;
278 ret = kernel_read(ts->rd, v, len, &pos);
5503ac56
EVH
279 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
280 client->status = Disconnected;
281 return ret;
8a0dc95f
EVH
282}
283
284/**
5503ac56
EVH
285 * p9_read_work - called when there is some data to be read from a transport
286 * @work: container of work to be done
ee443996 287 *
8a0dc95f 288 */
ee443996 289
5503ac56 290static void p9_read_work(struct work_struct *work)
8a0dc95f 291{
7594bf37
AV
292 __poll_t n;
293 int err;
5503ac56 294 struct p9_conn *m;
5503ac56
EVH
295
296 m = container_of(work, struct p9_conn, rq);
8a0dc95f
EVH
297
298 if (m->err < 0)
299 return;
300
947867aa 301 p9_debug(P9_DEBUG_TRANS, "start mux %p pos %zd\n", m, m->rc.offset);
8a0dc95f 302
947867aa
DM
303 if (!m->rc.sdata) {
304 m->rc.sdata = m->tmp_buf;
305 m->rc.offset = 0;
306 m->rc.capacity = 7; /* start by reading header */
8a0dc95f
EVH
307 }
308
5503ac56 309 clear_bit(Rpending, &m->wsched);
947867aa
DM
310 p9_debug(P9_DEBUG_TRANS, "read mux %p pos %zd size: %zd = %zd\n",
311 m, m->rc.offset, m->rc.capacity,
312 m->rc.capacity - m->rc.offset);
313 err = p9_fd_read(m->client, m->rc.sdata + m->rc.offset,
314 m->rc.capacity - m->rc.offset);
5d385153 315 p9_debug(P9_DEBUG_TRANS, "mux %p got %d bytes\n", m, err);
947867aa 316 if (err == -EAGAIN)
0462194d 317 goto end_clear;
8a0dc95f 318
5503ac56
EVH
319 if (err <= 0)
320 goto error;
321
947867aa 322 m->rc.offset += err;
1b0a763b 323
947867aa 324 /* header read in */
6d35190f 325 if ((!m->rreq) && (m->rc.offset == m->rc.capacity)) {
5d385153 326 p9_debug(P9_DEBUG_TRANS, "got new header\n");
1b0a763b 327
f984579a
TB
328 /* Header size */
329 m->rc.size = 7;
330 err = p9_parse_header(&m->rc, &m->rc.size, NULL, NULL, 0);
947867aa
DM
331 if (err) {
332 p9_debug(P9_DEBUG_ERROR,
333 "error parsing header: %d\n", err);
334 goto error;
335 }
336
337 if (m->rc.size >= m->client->msize) {
5d385153 338 p9_debug(P9_DEBUG_ERROR,
947867aa
DM
339 "requested packet size too big: %d\n",
340 m->rc.size);
5503ac56
EVH
341 err = -EIO;
342 goto error;
343 }
344
5d385153 345 p9_debug(P9_DEBUG_TRANS,
947867aa
DM
346 "mux %p pkt: size: %d bytes tag: %d\n",
347 m, m->rc.size, m->rc.tag);
1b0a763b 348
6d35190f
TB
349 m->rreq = p9_tag_lookup(m->client, m->rc.tag);
350 if (!m->rreq || (m->rreq->status != REQ_STATUS_SENT)) {
5d385153 351 p9_debug(P9_DEBUG_ERROR, "Unexpected packet tag %d\n",
947867aa 352 m->rc.tag);
1b0a763b
EVH
353 err = -EIO;
354 goto error;
355 }
356
6d35190f 357 if (!m->rreq->rc.sdata) {
3053600e
DM
358 p9_debug(P9_DEBUG_ERROR,
359 "No recv fcall for tag %d (req %p), disconnecting!\n",
6d35190f
TB
360 m->rc.tag, m->rreq);
361 m->rreq = NULL;
3053600e
DM
362 err = -EIO;
363 goto error;
1b0a763b 364 }
6d35190f 365 m->rc.sdata = m->rreq->rc.sdata;
947867aa
DM
366 memcpy(m->rc.sdata, m->tmp_buf, m->rc.capacity);
367 m->rc.capacity = m->rc.size;
1b0a763b 368 }
5503ac56 369
947867aa
DM
370 /* packet is read in
371 * not an else because some packets (like clunk) have no payload
372 */
6d35190f 373 if ((m->rreq) && (m->rc.offset == m->rc.capacity)) {
5d385153 374 p9_debug(P9_DEBUG_TRANS, "got new packet\n");
6d35190f 375 m->rreq->rc.size = m->rc.offset;
7eb923b8 376 spin_lock(&m->client->lock);
e4ca13f7
DM
377 if (m->rreq->status == REQ_STATUS_SENT) {
378 list_del(&m->rreq->req_list);
379 p9_client_cb(m->client, m->rreq, REQ_STATUS_RCVD);
380 } else {
381 spin_unlock(&m->client->lock);
382 p9_debug(P9_DEBUG_ERROR,
383 "Request tag %d errored out while we were reading the reply\n",
384 m->rc.tag);
385 err = -EIO;
386 goto error;
387 }
9f476d7c 388 spin_unlock(&m->client->lock);
947867aa
DM
389 m->rc.sdata = NULL;
390 m->rc.offset = 0;
391 m->rc.capacity = 0;
6d35190f
TB
392 p9_req_put(m->rreq);
393 m->rreq = NULL;
5503ac56
EVH
394 }
395
0462194d
SD
396end_clear:
397 clear_bit(Rworksched, &m->wsched);
398
5503ac56
EVH
399 if (!list_empty(&m->req_list)) {
400 if (test_and_clear_bit(Rpending, &m->wsched))
a9a08845 401 n = EPOLLIN;
5503ac56 402 else
7594bf37 403 n = p9_fd_poll(m->client, NULL, NULL);
5503ac56 404
a9a08845 405 if ((n & EPOLLIN) && !test_and_set_bit(Rworksched, &m->wsched)) {
5d385153 406 p9_debug(P9_DEBUG_TRANS, "sched read work %p\n", m);
61edeeed 407 schedule_work(&m->rq);
0462194d
SD
408 }
409 }
5503ac56
EVH
410
411 return;
5503ac56
EVH
412error:
413 p9_conn_cancel(m, err);
414 clear_bit(Rworksched, &m->wsched);
415}
416
417/**
418 * p9_fd_write - write to a socket
419 * @client: client instance
420 * @v: buffer to send data from
421 * @len: size of send buffer
ee443996 422 *
8a0dc95f 423 */
ee443996 424
5503ac56 425static int p9_fd_write(struct p9_client *client, void *v, int len)
8a0dc95f 426{
670986ec 427 ssize_t ret;
5503ac56 428 struct p9_trans_fd *ts = NULL;
8a0dc95f 429
5503ac56
EVH
430 if (client && client->status != Disconnected)
431 ts = client->trans;
8a0dc95f 432
5503ac56
EVH
433 if (!ts)
434 return -EREMOTEIO;
8a0dc95f 435
5503ac56 436 if (!(ts->wr->f_flags & O_NONBLOCK))
5d385153 437 p9_debug(P9_DEBUG_ERROR, "blocking write ...\n");
992b3f1d 438
670986ec 439 ret = kernel_write(ts->wr, v, len, &ts->wr->f_pos);
5503ac56
EVH
440 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
441 client->status = Disconnected;
442 return ret;
8a0dc95f
EVH
443}
444
445/**
446 * p9_write_work - called when a transport can send some data
ee443996
EVH
447 * @work: container for work to be done
448 *
8a0dc95f 449 */
ee443996 450
8a0dc95f
EVH
451static void p9_write_work(struct work_struct *work)
452{
7594bf37
AV
453 __poll_t n;
454 int err;
8a0dc95f 455 struct p9_conn *m;
673d62cd 456 struct p9_req_t *req;
8a0dc95f
EVH
457
458 m = container_of(work, struct p9_conn, wq);
459
460 if (m->err < 0) {
461 clear_bit(Wworksched, &m->wsched);
462 return;
463 }
464
465 if (!m->wsize) {
759f4298 466 spin_lock(&m->client->lock);
8a0dc95f
EVH
467 if (list_empty(&m->unsent_req_list)) {
468 clear_bit(Wworksched, &m->wsched);
759f4298 469 spin_unlock(&m->client->lock);
8a0dc95f
EVH
470 return;
471 }
472
673d62cd 473 req = list_entry(m->unsent_req_list.next, struct p9_req_t,
8a0dc95f 474 req_list);
673d62cd 475 req->status = REQ_STATUS_SENT;
5d385153 476 p9_debug(P9_DEBUG_TRANS, "move req %p\n", req);
8a0dc95f 477 list_move_tail(&req->req_list, &m->req_list);
8a0dc95f 478
523adb6c
DM
479 m->wbuf = req->tc.sdata;
480 m->wsize = req->tc.size;
8a0dc95f 481 m->wpos = 0;
728356de
TB
482 p9_req_get(req);
483 m->wreq = req;
673d62cd 484 spin_unlock(&m->client->lock);
8a0dc95f
EVH
485 }
486
5d385153
JP
487 p9_debug(P9_DEBUG_TRANS, "mux %p pos %d size %d\n",
488 m, m->wpos, m->wsize);
8a0dc95f 489 clear_bit(Wpending, &m->wsched);
8b81ef58 490 err = p9_fd_write(m->client, m->wbuf + m->wpos, m->wsize - m->wpos);
5d385153 491 p9_debug(P9_DEBUG_TRANS, "mux %p sent %d bytes\n", m, err);
584a8c13
SD
492 if (err == -EAGAIN)
493 goto end_clear;
494
8a0dc95f
EVH
495
496 if (err < 0)
497 goto error;
498 else if (err == 0) {
499 err = -EREMOTEIO;
500 goto error;
501 }
502
503 m->wpos += err;
728356de 504 if (m->wpos == m->wsize) {
8a0dc95f 505 m->wpos = m->wsize = 0;
728356de
TB
506 p9_req_put(m->wreq);
507 m->wreq = NULL;
508 }
8a0dc95f 509
584a8c13
SD
510end_clear:
511 clear_bit(Wworksched, &m->wsched);
512
1957b3a8 513 if (m->wsize || !list_empty(&m->unsent_req_list)) {
8a0dc95f 514 if (test_and_clear_bit(Wpending, &m->wsched))
a9a08845 515 n = EPOLLOUT;
8a0dc95f 516 else
7594bf37 517 n = p9_fd_poll(m->client, NULL, NULL);
8a0dc95f 518
a9a08845 519 if ((n & EPOLLOUT) &&
584a8c13 520 !test_and_set_bit(Wworksched, &m->wsched)) {
5d385153 521 p9_debug(P9_DEBUG_TRANS, "sched write work %p\n", m);
61edeeed 522 schedule_work(&m->wq);
584a8c13
SD
523 }
524 }
8a0dc95f
EVH
525
526 return;
527
528error:
529 p9_conn_cancel(m, err);
530 clear_bit(Wworksched, &m->wsched);
531}
532
ac6424b9 533static int p9_pollwake(wait_queue_entry_t *wait, unsigned int mode, int sync, void *key)
8a0dc95f 534{
5503ac56
EVH
535 struct p9_poll_wait *pwait =
536 container_of(wait, struct p9_poll_wait, wait);
537 struct p9_conn *m = pwait->conn;
538 unsigned long flags;
8a0dc95f 539
5503ac56
EVH
540 spin_lock_irqsave(&p9_poll_lock, flags);
541 if (list_empty(&m->poll_pending_link))
542 list_add_tail(&m->poll_pending_link, &p9_poll_pending_list);
543 spin_unlock_irqrestore(&p9_poll_lock, flags);
8a0dc95f 544
aa70c585
TH
545 schedule_work(&p9_poll_work);
546 return 1;
8a0dc95f
EVH
547}
548
549/**
5503ac56
EVH
550 * p9_pollwait - add poll task to the wait queue
551 * @filp: file pointer being polled
552 * @wait_address: wait_q to block on
553 * @p: poll state
ee443996 554 *
5503ac56 555 * called by files poll operation to add v9fs-poll task to files wait queue
8a0dc95f 556 */
ee443996 557
5503ac56
EVH
558static void
559p9_pollwait(struct file *filp, wait_queue_head_t *wait_address, poll_table *p)
8a0dc95f 560{
5503ac56
EVH
561 struct p9_conn *m = container_of(p, struct p9_conn, pt);
562 struct p9_poll_wait *pwait = NULL;
563 int i;
8a0dc95f 564
5503ac56
EVH
565 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
566 if (m->poll_wait[i].wait_addr == NULL) {
567 pwait = &m->poll_wait[i];
568 break;
8a0dc95f 569 }
8a0dc95f
EVH
570 }
571
5503ac56 572 if (!pwait) {
5d385153 573 p9_debug(P9_DEBUG_ERROR, "not enough wait_address slots\n");
8a0dc95f
EVH
574 return;
575 }
576
5503ac56
EVH
577 pwait->conn = m;
578 pwait->wait_addr = wait_address;
579 init_waitqueue_func_entry(&pwait->wait, p9_pollwake);
580 add_wait_queue(wait_address, &pwait->wait);
581}
8a0dc95f 582
5503ac56 583/**
263c5828 584 * p9_conn_create - initialize the per-session mux data
5503ac56
EVH
585 * @client: client instance
586 *
587 * Note: Creates the polling task if this is the first session.
588 */
8a0dc95f 589
263c5828 590static void p9_conn_create(struct p9_client *client)
5503ac56 591{
7594bf37 592 __poll_t n;
263c5828
SD
593 struct p9_trans_fd *ts = client->trans;
594 struct p9_conn *m = &ts->conn;
8a0dc95f 595
5d385153 596 p9_debug(P9_DEBUG_TRANS, "client %p msize %d\n", client, client->msize);
8a0dc95f 597
5503ac56
EVH
598 INIT_LIST_HEAD(&m->mux_list);
599 m->client = client;
8a0dc95f 600
5503ac56
EVH
601 INIT_LIST_HEAD(&m->req_list);
602 INIT_LIST_HEAD(&m->unsent_req_list);
603 INIT_WORK(&m->rq, p9_read_work);
604 INIT_WORK(&m->wq, p9_write_work);
605 INIT_LIST_HEAD(&m->poll_pending_link);
606 init_poll_funcptr(&m->pt, p9_pollwait);
8a0dc95f 607
7594bf37 608 n = p9_fd_poll(client, &m->pt, NULL);
a9a08845 609 if (n & EPOLLIN) {
5d385153 610 p9_debug(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56
EVH
611 set_bit(Rpending, &m->wsched);
612 }
8a0dc95f 613
a9a08845 614 if (n & EPOLLOUT) {
5d385153 615 p9_debug(P9_DEBUG_TRANS, "mux %p can write\n", m);
5503ac56
EVH
616 set_bit(Wpending, &m->wsched);
617 }
5503ac56 618}
8a0dc95f 619
5503ac56
EVH
620/**
621 * p9_poll_mux - polls a mux and schedules read or write works if necessary
622 * @m: connection to poll
623 *
624 */
625
626static void p9_poll_mux(struct p9_conn *m)
627{
7594bf37
AV
628 __poll_t n;
629 int err = -ECONNRESET;
5503ac56
EVH
630
631 if (m->err < 0)
632 return;
633
7594bf37 634 n = p9_fd_poll(m->client, NULL, &err);
a9a08845 635 if (n & (EPOLLERR | EPOLLHUP | EPOLLNVAL)) {
5d385153 636 p9_debug(P9_DEBUG_TRANS, "error mux %p err %d\n", m, n);
7594bf37 637 p9_conn_cancel(m, err);
5503ac56
EVH
638 }
639
a9a08845 640 if (n & EPOLLIN) {
5503ac56 641 set_bit(Rpending, &m->wsched);
5d385153 642 p9_debug(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56 643 if (!test_and_set_bit(Rworksched, &m->wsched)) {
5d385153 644 p9_debug(P9_DEBUG_TRANS, "sched read work %p\n", m);
61edeeed 645 schedule_work(&m->rq);
5503ac56
EVH
646 }
647 }
8a0dc95f 648
a9a08845 649 if (n & EPOLLOUT) {
5503ac56 650 set_bit(Wpending, &m->wsched);
5d385153 651 p9_debug(P9_DEBUG_TRANS, "mux %p can write\n", m);
f64f9e71
JP
652 if ((m->wsize || !list_empty(&m->unsent_req_list)) &&
653 !test_and_set_bit(Wworksched, &m->wsched)) {
5d385153 654 p9_debug(P9_DEBUG_TRANS, "sched write work %p\n", m);
61edeeed 655 schedule_work(&m->wq);
5503ac56
EVH
656 }
657 }
8a0dc95f
EVH
658}
659
660/**
91b8534f 661 * p9_fd_request - send 9P request
8a0dc95f
EVH
662 * The function can sleep until the request is scheduled for sending.
663 * The function can be interrupted. Return from the function is not
91b8534f 664 * a guarantee that the request is sent successfully.
8a0dc95f 665 *
91b8534f
EVH
666 * @client: client instance
667 * @req: request to be sent
ee443996 668 *
8a0dc95f 669 */
ee443996 670
91b8534f 671static int p9_fd_request(struct p9_client *client, struct p9_req_t *req)
8a0dc95f 672{
7594bf37 673 __poll_t n;
91b8534f 674 struct p9_trans_fd *ts = client->trans;
263c5828 675 struct p9_conn *m = &ts->conn;
8a0dc95f 676
5d385153 677 p9_debug(P9_DEBUG_TRANS, "mux %p task %p tcall %p id %d\n",
523adb6c 678 m, current, &req->tc, req->tc.id);
8a0dc95f 679 if (m->err < 0)
91b8534f 680 return m->err;
8a0dc95f 681
91b8534f 682 spin_lock(&client->lock);
7eb923b8 683 req->status = REQ_STATUS_UNSENT;
8a0dc95f 684 list_add_tail(&req->req_list, &m->unsent_req_list);
91b8534f 685 spin_unlock(&client->lock);
8a0dc95f
EVH
686
687 if (test_and_clear_bit(Wpending, &m->wsched))
a9a08845 688 n = EPOLLOUT;
8a0dc95f 689 else
7594bf37 690 n = p9_fd_poll(m->client, NULL, NULL);
8a0dc95f 691
a9a08845 692 if (n & EPOLLOUT && !test_and_set_bit(Wworksched, &m->wsched))
61edeeed 693 schedule_work(&m->wq);
8a0dc95f 694
91b8534f 695 return 0;
8a0dc95f
EVH
696}
697
91b8534f 698static int p9_fd_cancel(struct p9_client *client, struct p9_req_t *req)
8a0dc95f 699{
7eb923b8 700 int ret = 1;
8a0dc95f 701
5d385153 702 p9_debug(P9_DEBUG_TRANS, "client %p req %p\n", client, req);
8a0dc95f 703
91b8534f 704 spin_lock(&client->lock);
91b8534f 705
91b8534f 706 if (req->status == REQ_STATUS_UNSENT) {
1bab88b2 707 list_del(&req->req_list);
91b8534f 708 req->status = REQ_STATUS_FLSHD;
728356de 709 p9_req_put(req);
7eb923b8 710 ret = 0;
0bfd6845 711 }
7eb923b8
EVH
712 spin_unlock(&client->lock);
713
714 return ret;
8a0dc95f
EVH
715}
716
afd8d654
SD
717static int p9_fd_cancelled(struct p9_client *client, struct p9_req_t *req)
718{
719 p9_debug(P9_DEBUG_TRANS, "client %p req %p\n", client, req);
720
721 /* we haven't received a response for oldreq,
722 * remove it from the list.
723 */
724 spin_lock(&client->lock);
725 list_del(&req->req_list);
726 spin_unlock(&client->lock);
728356de 727 p9_req_put(req);
afd8d654
SD
728
729 return 0;
730}
731
c4fac910
DH
732static int p9_fd_show_options(struct seq_file *m, struct p9_client *clnt)
733{
734 if (clnt->trans_mod == &p9_tcp_trans) {
735 if (clnt->trans_opts.tcp.port != P9_PORT)
61b272c3 736 seq_printf(m, ",port=%u", clnt->trans_opts.tcp.port);
c4fac910
DH
737 } else if (clnt->trans_mod == &p9_fd_trans) {
738 if (clnt->trans_opts.fd.rfd != ~0)
61b272c3 739 seq_printf(m, ",rfd=%u", clnt->trans_opts.fd.rfd);
c4fac910 740 if (clnt->trans_opts.fd.wfd != ~0)
61b272c3 741 seq_printf(m, ",wfd=%u", clnt->trans_opts.fd.wfd);
c4fac910
DH
742 }
743 return 0;
744}
745
a80d923e 746/**
0e15597e
AK
747 * parse_opts - parse mount options into p9_fd_opts structure
748 * @params: options string passed from mount
749 * @opts: fd transport-specific structure to parse options into
a80d923e 750 *
bb8ffdfc 751 * Returns 0 upon success, -ERRNO upon failure
a80d923e 752 */
bd238fb4 753
bb8ffdfc 754static int parse_opts(char *params, struct p9_fd_opts *opts)
bd238fb4 755{
a80d923e
EVH
756 char *p;
757 substring_t args[MAX_OPT_ARGS];
758 int option;
d8c8a9e3 759 char *options, *tmp_options;
bd238fb4 760
a80d923e
EVH
761 opts->port = P9_PORT;
762 opts->rfd = ~0;
763 opts->wfd = ~0;
c4fac910 764 opts->privport = false;
bd238fb4 765
bb8ffdfc
EVH
766 if (!params)
767 return 0;
768
d8c8a9e3
EVH
769 tmp_options = kstrdup(params, GFP_KERNEL);
770 if (!tmp_options) {
5d385153
JP
771 p9_debug(P9_DEBUG_ERROR,
772 "failed to allocate copy of option string\n");
bb8ffdfc
EVH
773 return -ENOMEM;
774 }
d8c8a9e3 775 options = tmp_options;
bd238fb4 776
a80d923e
EVH
777 while ((p = strsep(&options, ",")) != NULL) {
778 int token;
bb8ffdfc 779 int r;
a80d923e
EVH
780 if (!*p)
781 continue;
782 token = match_token(p, tokens, args);
2f28c8b3 783 if ((token != Opt_err) && (token != Opt_privport)) {
15da4b16
AK
784 r = match_int(&args[0], &option);
785 if (r < 0) {
5d385153
JP
786 p9_debug(P9_DEBUG_ERROR,
787 "integer field, but no integer?\n");
15da4b16
AK
788 continue;
789 }
a80d923e
EVH
790 }
791 switch (token) {
792 case Opt_port:
793 opts->port = option;
794 break;
795 case Opt_rfdno:
796 opts->rfd = option;
797 break;
798 case Opt_wfdno:
799 opts->wfd = option;
800 break;
2f28c8b3 801 case Opt_privport:
c4fac910 802 opts->privport = true;
2f28c8b3 803 break;
a80d923e
EVH
804 default:
805 continue;
806 }
bd238fb4 807 }
d8c8a9e3
EVH
808
809 kfree(tmp_options);
bb8ffdfc 810 return 0;
bd238fb4 811}
bd238fb4 812
8b81ef58 813static int p9_fd_open(struct p9_client *client, int rfd, int wfd)
bd238fb4 814{
263c5828 815 struct p9_trans_fd *ts = kzalloc(sizeof(struct p9_trans_fd),
a80d923e
EVH
816 GFP_KERNEL);
817 if (!ts)
818 return -ENOMEM;
bd238fb4 819
a80d923e
EVH
820 ts->rd = fget(rfd);
821 ts->wr = fget(wfd);
822 if (!ts->rd || !ts->wr) {
823 if (ts->rd)
824 fput(ts->rd);
825 if (ts->wr)
826 fput(ts->wr);
827 kfree(ts);
828 return -EIO;
bd238fb4
LI
829 }
830
8b81ef58
EVH
831 client->trans = ts;
832 client->status = Connected;
bd238fb4 833
a80d923e 834 return 0;
bd238fb4 835}
bd238fb4 836
8b81ef58 837static int p9_socket_open(struct p9_client *client, struct socket *csocket)
bd238fb4 838{
6b18662e 839 struct p9_trans_fd *p;
56b31d1c 840 struct file *file;
6b18662e 841
263c5828 842 p = kzalloc(sizeof(struct p9_trans_fd), GFP_KERNEL);
6b18662e
AV
843 if (!p)
844 return -ENOMEM;
bd238fb4
LI
845
846 csocket->sk->sk_allocation = GFP_NOIO;
aab174f0 847 file = sock_alloc_file(csocket, 0, NULL);
56b31d1c 848 if (IS_ERR(file)) {
5d385153
JP
849 pr_err("%s (%d): failed to map fd\n",
850 __func__, task_pid_nr(current));
6b18662e 851 kfree(p);
56b31d1c 852 return PTR_ERR(file);
bd238fb4
LI
853 }
854
56b31d1c
AV
855 get_file(file);
856 p->wr = p->rd = file;
6b18662e
AV
857 client->trans = p;
858 client->status = Connected;
859
6b18662e
AV
860 p->rd->f_flags |= O_NONBLOCK;
861
263c5828 862 p9_conn_create(client);
bd238fb4
LI
863 return 0;
864}
865
bd238fb4 866/**
263c5828 867 * p9_mux_destroy - cancels all pending requests of mux
5503ac56 868 * @m: mux to destroy
bd238fb4
LI
869 *
870 */
ee443996 871
5503ac56 872static void p9_conn_destroy(struct p9_conn *m)
bd238fb4 873{
5d385153
JP
874 p9_debug(P9_DEBUG_TRANS, "mux %p prev %p next %p\n",
875 m, m->mux_list.prev, m->mux_list.next);
bd238fb4 876
5503ac56
EVH
877 p9_mux_poll_stop(m);
878 cancel_work_sync(&m->rq);
fb488fc1
DM
879 if (m->rreq) {
880 p9_req_put(m->rreq);
881 m->rreq = NULL;
882 }
5503ac56 883 cancel_work_sync(&m->wq);
fb488fc1
DM
884 if (m->wreq) {
885 p9_req_put(m->wreq);
886 m->wreq = NULL;
887 }
bd238fb4 888
5503ac56 889 p9_conn_cancel(m, -ECONNRESET);
bd238fb4 890
5503ac56 891 m->client = NULL;
bd238fb4
LI
892}
893
894/**
8b81ef58
EVH
895 * p9_fd_close - shutdown file descriptor transport
896 * @client: client instance
bd238fb4
LI
897 *
898 */
ee443996 899
8b81ef58 900static void p9_fd_close(struct p9_client *client)
bd238fb4
LI
901{
902 struct p9_trans_fd *ts;
903
8b81ef58 904 if (!client)
bd238fb4
LI
905 return;
906
8b81ef58 907 ts = client->trans;
bd238fb4
LI
908 if (!ts)
909 return;
910
8b81ef58
EVH
911 client->status = Disconnected;
912
263c5828 913 p9_conn_destroy(&ts->conn);
8a0dc95f 914
bd238fb4
LI
915 if (ts->rd)
916 fput(ts->rd);
917 if (ts->wr)
918 fput(ts->wr);
8b81ef58 919
bd238fb4
LI
920 kfree(ts);
921}
922
887b3ece
EVH
/*
 * stolen from NFS - maybe should be made a generic function?
 *
 * Checks that @buf starts with four decimal fields separated by dots and
 * that every field lies in the range 0..255.  Returns 0 if so, -EINVAL
 * otherwise.  Text following the fourth field is not examined.
 */
static inline int valid_ipaddr4(const char *buf)
{
	int rc, count, in[4];

	rc = sscanf(buf, "%d.%d.%d.%d", &in[0], &in[1], &in[2], &in[3]);
	if (rc != 4)
		return -EINVAL;
	for (count = 0; count < 4; count++) {
		/* %d also accepts a sign, so reject negative octets too */
		if (in[count] < 0 || in[count] > 255)
			return -EINVAL;
	}
	return 0;
}
939
2f28c8b3
JG
940static int p9_bind_privport(struct socket *sock)
941{
942 struct sockaddr_in cl;
943 int port, err = -EINVAL;
944
945 memset(&cl, 0, sizeof(cl));
946 cl.sin_family = AF_INET;
947 cl.sin_addr.s_addr = INADDR_ANY;
948 for (port = p9_ipport_resv_max; port >= p9_ipport_resv_min; port--) {
949 cl.sin_port = htons((ushort)port);
950 err = kernel_bind(sock, (struct sockaddr *)&cl, sizeof(cl));
951 if (err != -EADDRINUSE)
952 break;
953 }
954 return err;
955}
956
957
8b81ef58
EVH
958static int
959p9_fd_create_tcp(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
960{
961 int err;
a80d923e
EVH
962 struct socket *csocket;
963 struct sockaddr_in sin_server;
964 struct p9_fd_opts opts;
965
bb8ffdfc
EVH
966 err = parse_opts(args, &opts);
967 if (err < 0)
8b81ef58 968 return err;
a80d923e 969
10aa1452 970 if (addr == NULL || valid_ipaddr4(addr) < 0)
8b81ef58 971 return -EINVAL;
887b3ece 972
a80d923e 973 csocket = NULL;
a80d923e 974
c4fac910
DH
975 client->trans_opts.tcp.port = opts.port;
976 client->trans_opts.tcp.privport = opts.privport;
a80d923e
EVH
977 sin_server.sin_family = AF_INET;
978 sin_server.sin_addr.s_addr = in_aton(addr);
979 sin_server.sin_port = htons(opts.port);
0c5c9fb5 980 err = __sock_create(current->nsproxy->net_ns, PF_INET,
e75762fd 981 SOCK_STREAM, IPPROTO_TCP, &csocket, 1);
6b18662e 982 if (err) {
5d385153
JP
983 pr_err("%s (%d): problem creating socket\n",
984 __func__, task_pid_nr(current));
6b18662e 985 return err;
a80d923e
EVH
986 }
987
2f28c8b3
JG
988 if (opts.privport) {
989 err = p9_bind_privport(csocket);
990 if (err < 0) {
991 pr_err("%s (%d): problem binding to privport\n",
992 __func__, task_pid_nr(current));
993 sock_release(csocket);
994 return err;
995 }
996 }
997
a80d923e
EVH
998 err = csocket->ops->connect(csocket,
999 (struct sockaddr *)&sin_server,
1000 sizeof(struct sockaddr_in), 0);
1001 if (err < 0) {
5d385153
JP
1002 pr_err("%s (%d): problem connecting socket to %s\n",
1003 __func__, task_pid_nr(current), addr);
a80d923e 1004 sock_release(csocket);
6b18662e
AV
1005 return err;
1006 }
a80d923e 1007
6b18662e 1008 return p9_socket_open(client, csocket);
a80d923e
EVH
1009}
1010
8b81ef58
EVH
1011static int
1012p9_fd_create_unix(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
1013{
1014 int err;
1015 struct socket *csocket;
1016 struct sockaddr_un sun_server;
a80d923e
EVH
1017
1018 csocket = NULL;
a80d923e 1019
10aa1452
TB
1020 if (addr == NULL)
1021 return -EINVAL;
1022
cff6b8a9 1023 if (strlen(addr) >= UNIX_PATH_MAX) {
5d385153
JP
1024 pr_err("%s (%d): address too long: %s\n",
1025 __func__, task_pid_nr(current), addr);
6b18662e 1026 return -ENAMETOOLONG;
a80d923e
EVH
1027 }
1028
1029 sun_server.sun_family = PF_UNIX;
1030 strcpy(sun_server.sun_path, addr);
0c5c9fb5 1031 err = __sock_create(current->nsproxy->net_ns, PF_UNIX,
e75762fd 1032 SOCK_STREAM, 0, &csocket, 1);
6b18662e 1033 if (err < 0) {
5d385153
JP
1034 pr_err("%s (%d): problem creating socket\n",
1035 __func__, task_pid_nr(current));
1036
6b18662e
AV
1037 return err;
1038 }
a80d923e
EVH
1039 err = csocket->ops->connect(csocket, (struct sockaddr *)&sun_server,
1040 sizeof(struct sockaddr_un) - 1, 0);
1041 if (err < 0) {
5d385153
JP
1042 pr_err("%s (%d): problem connecting socket: %s: %d\n",
1043 __func__, task_pid_nr(current), addr, err);
a80d923e 1044 sock_release(csocket);
6b18662e
AV
1045 return err;
1046 }
a80d923e 1047
6b18662e 1048 return p9_socket_open(client, csocket);
a80d923e
EVH
1049}
1050
8b81ef58
EVH
1051static int
1052p9_fd_create(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
1053{
1054 int err;
a80d923e
EVH
1055 struct p9_fd_opts opts;
1056
1057 parse_opts(args, &opts);
c4fac910
DH
1058 client->trans_opts.fd.rfd = opts.rfd;
1059 client->trans_opts.fd.wfd = opts.wfd;
a80d923e
EVH
1060
1061 if (opts.rfd == ~0 || opts.wfd == ~0) {
5d385153 1062 pr_err("Insufficient options for proto=fd\n");
8b81ef58 1063 return -ENOPROTOOPT;
a80d923e
EVH
1064 }
1065
8b81ef58 1066 err = p9_fd_open(client, opts.rfd, opts.wfd);
a80d923e 1067 if (err < 0)
6b18662e 1068 return err;
a80d923e 1069
263c5828 1070 p9_conn_create(client);
8a0dc95f 1071
8b81ef58 1072 return 0;
a80d923e
EVH
1073}
1074
1075static struct p9_trans_module p9_tcp_trans = {
1076 .name = "tcp",
1077 .maxsize = MAX_SOCK_BUF,
f94741fd 1078 .def = 0,
8b81ef58
EVH
1079 .create = p9_fd_create_tcp,
1080 .close = p9_fd_close,
91b8534f
EVH
1081 .request = p9_fd_request,
1082 .cancel = p9_fd_cancel,
afd8d654 1083 .cancelled = p9_fd_cancelled,
c4fac910 1084 .show_options = p9_fd_show_options,
72029fe8 1085 .owner = THIS_MODULE,
a80d923e
EVH
1086};
1087
1088static struct p9_trans_module p9_unix_trans = {
1089 .name = "unix",
1090 .maxsize = MAX_SOCK_BUF,
1091 .def = 0,
8b81ef58
EVH
1092 .create = p9_fd_create_unix,
1093 .close = p9_fd_close,
91b8534f
EVH
1094 .request = p9_fd_request,
1095 .cancel = p9_fd_cancel,
afd8d654 1096 .cancelled = p9_fd_cancelled,
c4fac910 1097 .show_options = p9_fd_show_options,
72029fe8 1098 .owner = THIS_MODULE,
a80d923e
EVH
1099};
1100
1101static struct p9_trans_module p9_fd_trans = {
1102 .name = "fd",
1103 .maxsize = MAX_SOCK_BUF,
1104 .def = 0,
8b81ef58
EVH
1105 .create = p9_fd_create,
1106 .close = p9_fd_close,
91b8534f
EVH
1107 .request = p9_fd_request,
1108 .cancel = p9_fd_cancel,
afd8d654 1109 .cancelled = p9_fd_cancelled,
c4fac910 1110 .show_options = p9_fd_show_options,
72029fe8 1111 .owner = THIS_MODULE,
a80d923e
EVH
1112};
1113
5503ac56 1114/**
4a026da9
SL
1115 * p9_poll_workfn - poll worker thread
1116 * @work: work queue
5503ac56
EVH
1117 *
1118 * polls all v9fs transports for new events and queues the appropriate
1119 * work to the work queue
1120 *
1121 */
1122
aa70c585 1123static void p9_poll_workfn(struct work_struct *work)
5503ac56
EVH
1124{
1125 unsigned long flags;
1126
5d385153 1127 p9_debug(P9_DEBUG_TRANS, "start %p\n", current);
aa70c585 1128
5503ac56
EVH
1129 spin_lock_irqsave(&p9_poll_lock, flags);
1130 while (!list_empty(&p9_poll_pending_list)) {
1131 struct p9_conn *conn = list_first_entry(&p9_poll_pending_list,
1132 struct p9_conn,
1133 poll_pending_link);
1134 list_del_init(&conn->poll_pending_link);
1135 spin_unlock_irqrestore(&p9_poll_lock, flags);
1136
1137 p9_poll_mux(conn);
1138
1139 spin_lock_irqsave(&p9_poll_lock, flags);
1140 }
1141 spin_unlock_irqrestore(&p9_poll_lock, flags);
1142
5d385153 1143 p9_debug(P9_DEBUG_TRANS, "finish\n");
5503ac56
EVH
1144}
1145
887b3ece 1146int p9_trans_fd_init(void)
a80d923e
EVH
1147{
1148 v9fs_register_trans(&p9_tcp_trans);
1149 v9fs_register_trans(&p9_unix_trans);
1150 v9fs_register_trans(&p9_fd_trans);
1151
3387b804 1152 return 0;
a80d923e 1153}
72029fe8
TH
1154
1155void p9_trans_fd_exit(void)
1156{
43829731 1157 flush_work(&p9_poll_work);
72029fe8
TH
1158 v9fs_unregister_trans(&p9_tcp_trans);
1159 v9fs_unregister_trans(&p9_unix_trans);
1160 v9fs_unregister_trans(&p9_fd_trans);
1161}