net/9p/trans_fd.c: fix race by holding the lock
[linux-block.git] / net / 9p / trans_fd.c
CommitLineData
bd238fb4
LI
1/*
2 * linux/fs/9p/trans_fd.c
3 *
4 * Fd transport layer. Includes deprecated socket layer.
5 *
6 * Copyright (C) 2006 by Russ Cox <rsc@swtch.com>
7 * Copyright (C) 2004-2005 by Latchesar Ionkov <lucho@ionkov.net>
8a0dc95f 8 * Copyright (C) 2004-2008 by Eric Van Hensbergen <ericvh@gmail.com>
bd238fb4
LI
9 * Copyright (C) 1997-2002 by Ron Minnich <rminnich@sarnoff.com>
10 *
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License version 2
13 * as published by the Free Software Foundation.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to:
22 * Free Software Foundation
23 * 51 Franklin Street, Fifth Floor
24 * Boston, MA 02111-1301 USA
25 *
26 */
27
5d385153
JP
28#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
29
bd238fb4
LI
30#include <linux/in.h>
31#include <linux/module.h>
32#include <linux/net.h>
33#include <linux/ipv6.h>
8a0dc95f 34#include <linux/kthread.h>
bd238fb4
LI
35#include <linux/errno.h>
36#include <linux/kernel.h>
37#include <linux/un.h>
38#include <linux/uaccess.h>
39#include <linux/inet.h>
40#include <linux/idr.h>
41#include <linux/file.h>
a80d923e 42#include <linux/parser.h>
5a0e3ad6 43#include <linux/slab.h>
c4fac910 44#include <linux/seq_file.h>
bd238fb4 45#include <net/9p/9p.h>
8b81ef58 46#include <net/9p/client.h>
bd238fb4
LI
47#include <net/9p/transport.h>
48
6b18662e
AV
49#include <linux/syscalls.h> /* killme */
50
bd238fb4 51#define P9_PORT 564
a80d923e 52#define MAX_SOCK_BUF (64*1024)
8a0dc95f 53#define MAXPOLLWADDR 2
a80d923e 54
c4fac910
DH
55static struct p9_trans_module p9_tcp_trans;
56static struct p9_trans_module p9_fd_trans;
57
ee443996
EVH
58/**
59 * struct p9_fd_opts - per-transport options
60 * @rfd: file descriptor for reading (trans=fd)
61 * @wfd: file descriptor for writing (trans=fd)
62 * @port: port to connect to (trans=tcp)
63 *
64 */
65
a80d923e
EVH
66struct p9_fd_opts {
67 int rfd;
68 int wfd;
69 u16 port;
c4fac910 70 bool privport;
a80d923e 71};
bd238fb4 72
a80d923e
EVH
73/*
74 * Option Parsing (code inspired by NFS code)
75 * - a little lazy - parse all fd-transport options
76 */
bd238fb4 77
a80d923e
EVH
enum {
	/* Options that take integer arguments */
	Opt_port,
	Opt_rfdno,
	Opt_wfdno,
	/* Paired with the NULL pattern that terminates the token table */
	Opt_err,
	/* Options that take no arguments */
	Opt_privport,
};
bd238fb4 84
a447c093 85static const match_table_t tokens = {
a80d923e
EVH
86 {Opt_port, "port=%u"},
87 {Opt_rfdno, "rfdno=%u"},
88 {Opt_wfdno, "wfdno=%u"},
2f28c8b3 89 {Opt_privport, "privport"},
55762690 90 {Opt_err, NULL},
a80d923e 91};
bd238fb4 92
8a0dc95f
EVH
/*
 * State flags kept in p9_conn.wsched.  Note that the values are passed to
 * set_bit()/clear_bit()/test_and_set_bit() and are therefore bit numbers,
 * not masks.
 */
enum {
	Rworksched = 1,		/* read work scheduled or running */
	Rpending = 2,		/* can read */
	Wworksched = 4,		/* write work scheduled or running */
	Wpending = 8,		/* can write */
};
99
992b3f1d
TH
100struct p9_poll_wait {
101 struct p9_conn *conn;
ac6424b9 102 wait_queue_entry_t wait;
992b3f1d 103 wait_queue_head_t *wait_addr;
ee443996
EVH
104};
105
106/**
107 * struct p9_conn - fd mux connection state information
ee443996 108 * @mux_list: list link for mux to manage multiple connections (?)
8b81ef58 109 * @client: reference to client instance for this connection
ee443996 110 * @err: error state
ee443996
EVH
111 * @req_list: accounting for requests which have been sent
112 * @unsent_req_list: accounting for requests that haven't been sent
1b0a763b
EVH
113 * @req: current request being processed (if any)
114 * @tmp_buf: temporary buffer to read in header
947867aa 115 * @rc: temporary fcall for reading current frame
ee443996
EVH
116 * @wpos: write position for current frame
117 * @wsize: amount of data to write for current frame
118 * @wbuf: current write buffer
0e15597e 119 * @poll_pending_link: pending links to be polled per conn
ee443996 120 * @poll_wait: array of wait_q's for various worker threads
ee443996
EVH
121 * @pt: poll state
122 * @rq: current read work
123 * @wq: current write work
124 * @wsched: ????
125 *
126 */
8a0dc95f
EVH
127
128struct p9_conn {
8a0dc95f 129 struct list_head mux_list;
8b81ef58 130 struct p9_client *client;
8a0dc95f 131 int err;
8a0dc95f
EVH
132 struct list_head req_list;
133 struct list_head unsent_req_list;
1b0a763b
EVH
134 struct p9_req_t *req;
135 char tmp_buf[7];
947867aa 136 struct p9_fcall rc;
8a0dc95f
EVH
137 int wpos;
138 int wsize;
139 char *wbuf;
992b3f1d
TH
140 struct list_head poll_pending_link;
141 struct p9_poll_wait poll_wait[MAXPOLLWADDR];
8a0dc95f
EVH
142 poll_table pt;
143 struct work_struct rq;
144 struct work_struct wq;
145 unsigned long wsched;
146};
147
263c5828
SD
148/**
149 * struct p9_trans_fd - transport state
150 * @rd: reference to file to read from
151 * @wr: reference of file to write to
152 * @conn: connection state reference
153 *
154 */
155
156struct p9_trans_fd {
157 struct file *rd;
158 struct file *wr;
159 struct p9_conn conn;
160};
161
aa70c585
TH
162static void p9_poll_workfn(struct work_struct *work);
163
992b3f1d
TH
164static DEFINE_SPINLOCK(p9_poll_lock);
165static LIST_HEAD(p9_poll_pending_list);
aa70c585 166static DECLARE_WORK(p9_poll_work, p9_poll_workfn);
8a0dc95f 167
2f28c8b3
JG
168static unsigned int p9_ipport_resv_min = P9_DEF_MIN_RESVPORT;
169static unsigned int p9_ipport_resv_max = P9_DEF_MAX_RESVPORT;
170
992b3f1d 171static void p9_mux_poll_stop(struct p9_conn *m)
8a0dc95f 172{
992b3f1d
TH
173 unsigned long flags;
174 int i;
8a0dc95f 175
992b3f1d
TH
176 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
177 struct p9_poll_wait *pwait = &m->poll_wait[i];
8a0dc95f 178
992b3f1d
TH
179 if (pwait->wait_addr) {
180 remove_wait_queue(pwait->wait_addr, &pwait->wait);
181 pwait->wait_addr = NULL;
8a0dc95f 182 }
8a0dc95f
EVH
183 }
184
992b3f1d
TH
185 spin_lock_irqsave(&p9_poll_lock, flags);
186 list_del_init(&m->poll_pending_link);
187 spin_unlock_irqrestore(&p9_poll_lock, flags);
430ac66e
TB
188
189 flush_work(&p9_poll_work);
8a0dc95f
EVH
190}
191
192/**
5503ac56
EVH
193 * p9_conn_cancel - cancel all pending requests with error
194 * @m: mux data
195 * @err: error code
8a0dc95f 196 *
8a0dc95f 197 */
ee443996 198
51a87c55 199static void p9_conn_cancel(struct p9_conn *m, int err)
8a0dc95f 200{
673d62cd 201 struct p9_req_t *req, *rtmp;
5503ac56 202 LIST_HEAD(cancel_list);
8a0dc95f 203
5d385153 204 p9_debug(P9_DEBUG_ERROR, "mux %p err %d\n", m, err);
7eb923b8 205
9f476d7c 206 spin_lock(&m->client->lock);
7eb923b8
EVH
207
208 if (m->err) {
9f476d7c 209 spin_unlock(&m->client->lock);
7eb923b8
EVH
210 return;
211 }
212
213 m->err = err;
214
5503ac56
EVH
215 list_for_each_entry_safe(req, rtmp, &m->req_list, req_list) {
216 list_move(&req->req_list, &cancel_list);
217 }
218 list_for_each_entry_safe(req, rtmp, &m->unsent_req_list, req_list) {
219 list_move(&req->req_list, &cancel_list);
8a0dc95f
EVH
220 }
221
5503ac56 222 list_for_each_entry_safe(req, rtmp, &cancel_list, req_list) {
5d385153 223 p9_debug(P9_DEBUG_ERROR, "call back req %p\n", req);
1bab88b2 224 list_del(&req->req_list);
2b6e72ed
DM
225 if (!req->t_err)
226 req->t_err = err;
227 p9_client_cb(m->client, req, REQ_STATUS_ERROR);
8a0dc95f 228 }
9f476d7c 229 spin_unlock(&m->client->lock);
8a0dc95f
EVH
230}
231
7594bf37
AV
232static __poll_t
233p9_fd_poll(struct p9_client *client, struct poll_table_struct *pt, int *err)
8a0dc95f 234{
9965ed17 235 __poll_t ret;
5503ac56 236 struct p9_trans_fd *ts = NULL;
8a0dc95f 237
5503ac56
EVH
238 if (client && client->status == Connected)
239 ts = client->trans;
7dc5d24b 240
7594bf37
AV
241 if (!ts) {
242 if (err)
243 *err = -EREMOTEIO;
a9a08845 244 return EPOLLERR;
7594bf37 245 }
7dc5d24b 246
9965ed17
CH
247 ret = vfs_poll(ts->rd, pt);
248 if (ts->rd != ts->wr)
249 ret = (ret & ~EPOLLOUT) | (vfs_poll(ts->wr, pt) & ~EPOLLIN);
5503ac56 250 return ret;
992b3f1d
TH
251}
252
8a0dc95f 253/**
5503ac56
EVH
254 * p9_fd_read- read from a fd
255 * @client: client instance
256 * @v: buffer to receive data into
257 * @len: size of receive buffer
ee443996 258 *
8a0dc95f 259 */
ee443996 260
5503ac56 261static int p9_fd_read(struct p9_client *client, void *v, int len)
8a0dc95f 262{
5503ac56
EVH
263 int ret;
264 struct p9_trans_fd *ts = NULL;
bdd1d2d3 265 loff_t pos;
8a0dc95f 266
5503ac56
EVH
267 if (client && client->status != Disconnected)
268 ts = client->trans;
8a0dc95f 269
5503ac56
EVH
270 if (!ts)
271 return -EREMOTEIO;
8a0dc95f 272
5503ac56 273 if (!(ts->rd->f_flags & O_NONBLOCK))
5d385153 274 p9_debug(P9_DEBUG_ERROR, "blocking read ...\n");
8a0dc95f 275
bdd1d2d3
CH
276 pos = ts->rd->f_pos;
277 ret = kernel_read(ts->rd, v, len, &pos);
5503ac56
EVH
278 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
279 client->status = Disconnected;
280 return ret;
8a0dc95f
EVH
281}
282
283/**
5503ac56
EVH
284 * p9_read_work - called when there is some data to be read from a transport
285 * @work: container of work to be done
ee443996 286 *
8a0dc95f 287 */
ee443996 288
5503ac56 289static void p9_read_work(struct work_struct *work)
8a0dc95f 290{
7594bf37
AV
291 __poll_t n;
292 int err;
5503ac56 293 struct p9_conn *m;
2b6e72ed 294 int status = REQ_STATUS_ERROR;
5503ac56
EVH
295
296 m = container_of(work, struct p9_conn, rq);
8a0dc95f
EVH
297
298 if (m->err < 0)
299 return;
300
947867aa 301 p9_debug(P9_DEBUG_TRANS, "start mux %p pos %zd\n", m, m->rc.offset);
8a0dc95f 302
947867aa
DM
303 if (!m->rc.sdata) {
304 m->rc.sdata = m->tmp_buf;
305 m->rc.offset = 0;
306 m->rc.capacity = 7; /* start by reading header */
8a0dc95f
EVH
307 }
308
5503ac56 309 clear_bit(Rpending, &m->wsched);
947867aa
DM
310 p9_debug(P9_DEBUG_TRANS, "read mux %p pos %zd size: %zd = %zd\n",
311 m, m->rc.offset, m->rc.capacity,
312 m->rc.capacity - m->rc.offset);
313 err = p9_fd_read(m->client, m->rc.sdata + m->rc.offset,
314 m->rc.capacity - m->rc.offset);
5d385153 315 p9_debug(P9_DEBUG_TRANS, "mux %p got %d bytes\n", m, err);
947867aa 316 if (err == -EAGAIN)
0462194d 317 goto end_clear;
8a0dc95f 318
5503ac56
EVH
319 if (err <= 0)
320 goto error;
321
947867aa 322 m->rc.offset += err;
1b0a763b 323
947867aa
DM
324 /* header read in */
325 if ((!m->req) && (m->rc.offset == m->rc.capacity)) {
5d385153 326 p9_debug(P9_DEBUG_TRANS, "got new header\n");
1b0a763b 327
947867aa
DM
328 err = p9_parse_header(&m->rc, NULL, NULL, NULL, 0);
329 if (err) {
330 p9_debug(P9_DEBUG_ERROR,
331 "error parsing header: %d\n", err);
332 goto error;
333 }
334
335 if (m->rc.size >= m->client->msize) {
5d385153 336 p9_debug(P9_DEBUG_ERROR,
947867aa
DM
337 "requested packet size too big: %d\n",
338 m->rc.size);
5503ac56
EVH
339 err = -EIO;
340 goto error;
341 }
342
5d385153 343 p9_debug(P9_DEBUG_TRANS,
947867aa
DM
344 "mux %p pkt: size: %d bytes tag: %d\n",
345 m, m->rc.size, m->rc.tag);
1b0a763b 346
947867aa 347 m->req = p9_tag_lookup(m->client, m->rc.tag);
0bfd6845 348 if (!m->req || (m->req->status != REQ_STATUS_SENT)) {
5d385153 349 p9_debug(P9_DEBUG_ERROR, "Unexpected packet tag %d\n",
947867aa 350 m->rc.tag);
1b0a763b
EVH
351 err = -EIO;
352 goto error;
353 }
354
355 if (m->req->rc == NULL) {
3053600e
DM
356 p9_debug(P9_DEBUG_ERROR,
357 "No recv fcall for tag %d (req %p), disconnecting!\n",
358 m->rc.tag, m->req);
359 m->req = NULL;
360 err = -EIO;
361 goto error;
1b0a763b 362 }
947867aa
DM
363 m->rc.sdata = (char *)m->req->rc + sizeof(struct p9_fcall);
364 memcpy(m->rc.sdata, m->tmp_buf, m->rc.capacity);
365 m->rc.capacity = m->rc.size;
1b0a763b 366 }
5503ac56 367
947867aa
DM
368 /* packet is read in
369 * not an else because some packets (like clunk) have no payload
370 */
371 if ((m->req) && (m->rc.offset == m->rc.capacity)) {
5d385153 372 p9_debug(P9_DEBUG_TRANS, "got new packet\n");
7eb923b8 373 spin_lock(&m->client->lock);
1bab88b2 374 if (m->req->status != REQ_STATUS_ERROR)
2b6e72ed 375 status = REQ_STATUS_RCVD;
91b8534f 376 list_del(&m->req->req_list);
9f476d7c 377 /* update req->status while holding client->lock */
2b6e72ed 378 p9_client_cb(m->client, m->req, status);
9f476d7c 379 spin_unlock(&m->client->lock);
947867aa
DM
380 m->rc.sdata = NULL;
381 m->rc.offset = 0;
382 m->rc.capacity = 0;
1b0a763b 383 m->req = NULL;
5503ac56
EVH
384 }
385
0462194d
SD
386end_clear:
387 clear_bit(Rworksched, &m->wsched);
388
5503ac56
EVH
389 if (!list_empty(&m->req_list)) {
390 if (test_and_clear_bit(Rpending, &m->wsched))
a9a08845 391 n = EPOLLIN;
5503ac56 392 else
7594bf37 393 n = p9_fd_poll(m->client, NULL, NULL);
5503ac56 394
a9a08845 395 if ((n & EPOLLIN) && !test_and_set_bit(Rworksched, &m->wsched)) {
5d385153 396 p9_debug(P9_DEBUG_TRANS, "sched read work %p\n", m);
61edeeed 397 schedule_work(&m->rq);
0462194d
SD
398 }
399 }
5503ac56
EVH
400
401 return;
5503ac56
EVH
402error:
403 p9_conn_cancel(m, err);
404 clear_bit(Rworksched, &m->wsched);
405}
406
407/**
408 * p9_fd_write - write to a socket
409 * @client: client instance
410 * @v: buffer to send data from
411 * @len: size of send buffer
ee443996 412 *
8a0dc95f 413 */
ee443996 414
5503ac56 415static int p9_fd_write(struct p9_client *client, void *v, int len)
8a0dc95f 416{
670986ec 417 ssize_t ret;
5503ac56 418 struct p9_trans_fd *ts = NULL;
8a0dc95f 419
5503ac56
EVH
420 if (client && client->status != Disconnected)
421 ts = client->trans;
8a0dc95f 422
5503ac56
EVH
423 if (!ts)
424 return -EREMOTEIO;
8a0dc95f 425
5503ac56 426 if (!(ts->wr->f_flags & O_NONBLOCK))
5d385153 427 p9_debug(P9_DEBUG_ERROR, "blocking write ...\n");
992b3f1d 428
670986ec 429 ret = kernel_write(ts->wr, v, len, &ts->wr->f_pos);
5503ac56
EVH
430 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
431 client->status = Disconnected;
432 return ret;
8a0dc95f
EVH
433}
434
435/**
436 * p9_write_work - called when a transport can send some data
ee443996
EVH
437 * @work: container for work to be done
438 *
8a0dc95f 439 */
ee443996 440
8a0dc95f
EVH
441static void p9_write_work(struct work_struct *work)
442{
7594bf37
AV
443 __poll_t n;
444 int err;
8a0dc95f 445 struct p9_conn *m;
673d62cd 446 struct p9_req_t *req;
8a0dc95f
EVH
447
448 m = container_of(work, struct p9_conn, wq);
449
450 if (m->err < 0) {
451 clear_bit(Wworksched, &m->wsched);
452 return;
453 }
454
455 if (!m->wsize) {
759f4298 456 spin_lock(&m->client->lock);
8a0dc95f
EVH
457 if (list_empty(&m->unsent_req_list)) {
458 clear_bit(Wworksched, &m->wsched);
759f4298 459 spin_unlock(&m->client->lock);
8a0dc95f
EVH
460 return;
461 }
462
673d62cd 463 req = list_entry(m->unsent_req_list.next, struct p9_req_t,
8a0dc95f 464 req_list);
673d62cd 465 req->status = REQ_STATUS_SENT;
5d385153 466 p9_debug(P9_DEBUG_TRANS, "move req %p\n", req);
8a0dc95f 467 list_move_tail(&req->req_list, &m->req_list);
8a0dc95f 468
673d62cd
EVH
469 m->wbuf = req->tc->sdata;
470 m->wsize = req->tc->size;
8a0dc95f 471 m->wpos = 0;
673d62cd 472 spin_unlock(&m->client->lock);
8a0dc95f
EVH
473 }
474
5d385153
JP
475 p9_debug(P9_DEBUG_TRANS, "mux %p pos %d size %d\n",
476 m, m->wpos, m->wsize);
8a0dc95f 477 clear_bit(Wpending, &m->wsched);
8b81ef58 478 err = p9_fd_write(m->client, m->wbuf + m->wpos, m->wsize - m->wpos);
5d385153 479 p9_debug(P9_DEBUG_TRANS, "mux %p sent %d bytes\n", m, err);
584a8c13
SD
480 if (err == -EAGAIN)
481 goto end_clear;
482
8a0dc95f
EVH
483
484 if (err < 0)
485 goto error;
486 else if (err == 0) {
487 err = -EREMOTEIO;
488 goto error;
489 }
490
491 m->wpos += err;
492 if (m->wpos == m->wsize)
493 m->wpos = m->wsize = 0;
494
584a8c13
SD
495end_clear:
496 clear_bit(Wworksched, &m->wsched);
497
1957b3a8 498 if (m->wsize || !list_empty(&m->unsent_req_list)) {
8a0dc95f 499 if (test_and_clear_bit(Wpending, &m->wsched))
a9a08845 500 n = EPOLLOUT;
8a0dc95f 501 else
7594bf37 502 n = p9_fd_poll(m->client, NULL, NULL);
8a0dc95f 503
a9a08845 504 if ((n & EPOLLOUT) &&
584a8c13 505 !test_and_set_bit(Wworksched, &m->wsched)) {
5d385153 506 p9_debug(P9_DEBUG_TRANS, "sched write work %p\n", m);
61edeeed 507 schedule_work(&m->wq);
584a8c13
SD
508 }
509 }
8a0dc95f
EVH
510
511 return;
512
513error:
514 p9_conn_cancel(m, err);
515 clear_bit(Wworksched, &m->wsched);
516}
517
ac6424b9 518static int p9_pollwake(wait_queue_entry_t *wait, unsigned int mode, int sync, void *key)
8a0dc95f 519{
5503ac56
EVH
520 struct p9_poll_wait *pwait =
521 container_of(wait, struct p9_poll_wait, wait);
522 struct p9_conn *m = pwait->conn;
523 unsigned long flags;
8a0dc95f 524
5503ac56
EVH
525 spin_lock_irqsave(&p9_poll_lock, flags);
526 if (list_empty(&m->poll_pending_link))
527 list_add_tail(&m->poll_pending_link, &p9_poll_pending_list);
528 spin_unlock_irqrestore(&p9_poll_lock, flags);
8a0dc95f 529
aa70c585
TH
530 schedule_work(&p9_poll_work);
531 return 1;
8a0dc95f
EVH
532}
533
534/**
5503ac56
EVH
535 * p9_pollwait - add poll task to the wait queue
536 * @filp: file pointer being polled
537 * @wait_address: wait_q to block on
538 * @p: poll state
ee443996 539 *
5503ac56 540 * called by files poll operation to add v9fs-poll task to files wait queue
8a0dc95f 541 */
ee443996 542
5503ac56
EVH
543static void
544p9_pollwait(struct file *filp, wait_queue_head_t *wait_address, poll_table *p)
8a0dc95f 545{
5503ac56
EVH
546 struct p9_conn *m = container_of(p, struct p9_conn, pt);
547 struct p9_poll_wait *pwait = NULL;
548 int i;
8a0dc95f 549
5503ac56
EVH
550 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
551 if (m->poll_wait[i].wait_addr == NULL) {
552 pwait = &m->poll_wait[i];
553 break;
8a0dc95f 554 }
8a0dc95f
EVH
555 }
556
5503ac56 557 if (!pwait) {
5d385153 558 p9_debug(P9_DEBUG_ERROR, "not enough wait_address slots\n");
8a0dc95f
EVH
559 return;
560 }
561
5503ac56
EVH
562 pwait->conn = m;
563 pwait->wait_addr = wait_address;
564 init_waitqueue_func_entry(&pwait->wait, p9_pollwake);
565 add_wait_queue(wait_address, &pwait->wait);
566}
8a0dc95f 567
5503ac56 568/**
263c5828 569 * p9_conn_create - initialize the per-session mux data
5503ac56
EVH
570 * @client: client instance
571 *
572 * Note: Creates the polling task if this is the first session.
573 */
8a0dc95f 574
263c5828 575static void p9_conn_create(struct p9_client *client)
5503ac56 576{
7594bf37 577 __poll_t n;
263c5828
SD
578 struct p9_trans_fd *ts = client->trans;
579 struct p9_conn *m = &ts->conn;
8a0dc95f 580
5d385153 581 p9_debug(P9_DEBUG_TRANS, "client %p msize %d\n", client, client->msize);
8a0dc95f 582
5503ac56
EVH
583 INIT_LIST_HEAD(&m->mux_list);
584 m->client = client;
8a0dc95f 585
5503ac56
EVH
586 INIT_LIST_HEAD(&m->req_list);
587 INIT_LIST_HEAD(&m->unsent_req_list);
588 INIT_WORK(&m->rq, p9_read_work);
589 INIT_WORK(&m->wq, p9_write_work);
590 INIT_LIST_HEAD(&m->poll_pending_link);
591 init_poll_funcptr(&m->pt, p9_pollwait);
8a0dc95f 592
7594bf37 593 n = p9_fd_poll(client, &m->pt, NULL);
a9a08845 594 if (n & EPOLLIN) {
5d385153 595 p9_debug(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56
EVH
596 set_bit(Rpending, &m->wsched);
597 }
8a0dc95f 598
a9a08845 599 if (n & EPOLLOUT) {
5d385153 600 p9_debug(P9_DEBUG_TRANS, "mux %p can write\n", m);
5503ac56
EVH
601 set_bit(Wpending, &m->wsched);
602 }
5503ac56 603}
8a0dc95f 604
5503ac56
EVH
605/**
606 * p9_poll_mux - polls a mux and schedules read or write works if necessary
607 * @m: connection to poll
608 *
609 */
610
611static void p9_poll_mux(struct p9_conn *m)
612{
7594bf37
AV
613 __poll_t n;
614 int err = -ECONNRESET;
5503ac56
EVH
615
616 if (m->err < 0)
617 return;
618
7594bf37 619 n = p9_fd_poll(m->client, NULL, &err);
a9a08845 620 if (n & (EPOLLERR | EPOLLHUP | EPOLLNVAL)) {
5d385153 621 p9_debug(P9_DEBUG_TRANS, "error mux %p err %d\n", m, n);
7594bf37 622 p9_conn_cancel(m, err);
5503ac56
EVH
623 }
624
a9a08845 625 if (n & EPOLLIN) {
5503ac56 626 set_bit(Rpending, &m->wsched);
5d385153 627 p9_debug(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56 628 if (!test_and_set_bit(Rworksched, &m->wsched)) {
5d385153 629 p9_debug(P9_DEBUG_TRANS, "sched read work %p\n", m);
61edeeed 630 schedule_work(&m->rq);
5503ac56
EVH
631 }
632 }
8a0dc95f 633
a9a08845 634 if (n & EPOLLOUT) {
5503ac56 635 set_bit(Wpending, &m->wsched);
5d385153 636 p9_debug(P9_DEBUG_TRANS, "mux %p can write\n", m);
f64f9e71
JP
637 if ((m->wsize || !list_empty(&m->unsent_req_list)) &&
638 !test_and_set_bit(Wworksched, &m->wsched)) {
5d385153 639 p9_debug(P9_DEBUG_TRANS, "sched write work %p\n", m);
61edeeed 640 schedule_work(&m->wq);
5503ac56
EVH
641 }
642 }
8a0dc95f
EVH
643}
644
645/**
91b8534f 646 * p9_fd_request - send 9P request
8a0dc95f
EVH
647 * The function can sleep until the request is scheduled for sending.
648 * The function can be interrupted. Return from the function is not
91b8534f 649 * a guarantee that the request is sent successfully.
8a0dc95f 650 *
91b8534f
EVH
651 * @client: client instance
652 * @req: request to be sent
ee443996 653 *
8a0dc95f 654 */
ee443996 655
91b8534f 656static int p9_fd_request(struct p9_client *client, struct p9_req_t *req)
8a0dc95f 657{
7594bf37 658 __poll_t n;
91b8534f 659 struct p9_trans_fd *ts = client->trans;
263c5828 660 struct p9_conn *m = &ts->conn;
8a0dc95f 661
5d385153
JP
662 p9_debug(P9_DEBUG_TRANS, "mux %p task %p tcall %p id %d\n",
663 m, current, req->tc, req->tc->id);
8a0dc95f 664 if (m->err < 0)
91b8534f 665 return m->err;
8a0dc95f 666
91b8534f 667 spin_lock(&client->lock);
7eb923b8 668 req->status = REQ_STATUS_UNSENT;
8a0dc95f 669 list_add_tail(&req->req_list, &m->unsent_req_list);
91b8534f 670 spin_unlock(&client->lock);
8a0dc95f
EVH
671
672 if (test_and_clear_bit(Wpending, &m->wsched))
a9a08845 673 n = EPOLLOUT;
8a0dc95f 674 else
7594bf37 675 n = p9_fd_poll(m->client, NULL, NULL);
8a0dc95f 676
a9a08845 677 if (n & EPOLLOUT && !test_and_set_bit(Wworksched, &m->wsched))
61edeeed 678 schedule_work(&m->wq);
8a0dc95f 679
91b8534f 680 return 0;
8a0dc95f
EVH
681}
682
91b8534f 683static int p9_fd_cancel(struct p9_client *client, struct p9_req_t *req)
8a0dc95f 684{
7eb923b8 685 int ret = 1;
8a0dc95f 686
5d385153 687 p9_debug(P9_DEBUG_TRANS, "client %p req %p\n", client, req);
8a0dc95f 688
91b8534f 689 spin_lock(&client->lock);
91b8534f 690
91b8534f 691 if (req->status == REQ_STATUS_UNSENT) {
1bab88b2 692 list_del(&req->req_list);
91b8534f 693 req->status = REQ_STATUS_FLSHD;
7eb923b8 694 ret = 0;
0bfd6845 695 }
7eb923b8
EVH
696 spin_unlock(&client->lock);
697
698 return ret;
8a0dc95f
EVH
699}
700
afd8d654
SD
701static int p9_fd_cancelled(struct p9_client *client, struct p9_req_t *req)
702{
703 p9_debug(P9_DEBUG_TRANS, "client %p req %p\n", client, req);
704
705 /* we haven't received a response for oldreq,
706 * remove it from the list.
707 */
708 spin_lock(&client->lock);
709 list_del(&req->req_list);
710 spin_unlock(&client->lock);
711
712 return 0;
713}
714
c4fac910
DH
715static int p9_fd_show_options(struct seq_file *m, struct p9_client *clnt)
716{
717 if (clnt->trans_mod == &p9_tcp_trans) {
718 if (clnt->trans_opts.tcp.port != P9_PORT)
61b272c3 719 seq_printf(m, ",port=%u", clnt->trans_opts.tcp.port);
c4fac910
DH
720 } else if (clnt->trans_mod == &p9_fd_trans) {
721 if (clnt->trans_opts.fd.rfd != ~0)
61b272c3 722 seq_printf(m, ",rfd=%u", clnt->trans_opts.fd.rfd);
c4fac910 723 if (clnt->trans_opts.fd.wfd != ~0)
61b272c3 724 seq_printf(m, ",wfd=%u", clnt->trans_opts.fd.wfd);
c4fac910
DH
725 }
726 return 0;
727}
728
a80d923e 729/**
0e15597e
AK
730 * parse_opts - parse mount options into p9_fd_opts structure
731 * @params: options string passed from mount
732 * @opts: fd transport-specific structure to parse options into
a80d923e 733 *
bb8ffdfc 734 * Returns 0 upon success, -ERRNO upon failure
a80d923e 735 */
bd238fb4 736
bb8ffdfc 737static int parse_opts(char *params, struct p9_fd_opts *opts)
bd238fb4 738{
a80d923e
EVH
739 char *p;
740 substring_t args[MAX_OPT_ARGS];
741 int option;
d8c8a9e3 742 char *options, *tmp_options;
bd238fb4 743
a80d923e
EVH
744 opts->port = P9_PORT;
745 opts->rfd = ~0;
746 opts->wfd = ~0;
c4fac910 747 opts->privport = false;
bd238fb4 748
bb8ffdfc
EVH
749 if (!params)
750 return 0;
751
d8c8a9e3
EVH
752 tmp_options = kstrdup(params, GFP_KERNEL);
753 if (!tmp_options) {
5d385153
JP
754 p9_debug(P9_DEBUG_ERROR,
755 "failed to allocate copy of option string\n");
bb8ffdfc
EVH
756 return -ENOMEM;
757 }
d8c8a9e3 758 options = tmp_options;
bd238fb4 759
a80d923e
EVH
760 while ((p = strsep(&options, ",")) != NULL) {
761 int token;
bb8ffdfc 762 int r;
a80d923e
EVH
763 if (!*p)
764 continue;
765 token = match_token(p, tokens, args);
2f28c8b3 766 if ((token != Opt_err) && (token != Opt_privport)) {
15da4b16
AK
767 r = match_int(&args[0], &option);
768 if (r < 0) {
5d385153
JP
769 p9_debug(P9_DEBUG_ERROR,
770 "integer field, but no integer?\n");
15da4b16
AK
771 continue;
772 }
a80d923e
EVH
773 }
774 switch (token) {
775 case Opt_port:
776 opts->port = option;
777 break;
778 case Opt_rfdno:
779 opts->rfd = option;
780 break;
781 case Opt_wfdno:
782 opts->wfd = option;
783 break;
2f28c8b3 784 case Opt_privport:
c4fac910 785 opts->privport = true;
2f28c8b3 786 break;
a80d923e
EVH
787 default:
788 continue;
789 }
bd238fb4 790 }
d8c8a9e3
EVH
791
792 kfree(tmp_options);
bb8ffdfc 793 return 0;
bd238fb4 794}
bd238fb4 795
8b81ef58 796static int p9_fd_open(struct p9_client *client, int rfd, int wfd)
bd238fb4 797{
263c5828 798 struct p9_trans_fd *ts = kzalloc(sizeof(struct p9_trans_fd),
a80d923e
EVH
799 GFP_KERNEL);
800 if (!ts)
801 return -ENOMEM;
bd238fb4 802
a80d923e
EVH
803 ts->rd = fget(rfd);
804 ts->wr = fget(wfd);
805 if (!ts->rd || !ts->wr) {
806 if (ts->rd)
807 fput(ts->rd);
808 if (ts->wr)
809 fput(ts->wr);
810 kfree(ts);
811 return -EIO;
bd238fb4
LI
812 }
813
8b81ef58
EVH
814 client->trans = ts;
815 client->status = Connected;
bd238fb4 816
a80d923e 817 return 0;
bd238fb4 818}
bd238fb4 819
8b81ef58 820static int p9_socket_open(struct p9_client *client, struct socket *csocket)
bd238fb4 821{
6b18662e 822 struct p9_trans_fd *p;
56b31d1c 823 struct file *file;
6b18662e 824
263c5828 825 p = kzalloc(sizeof(struct p9_trans_fd), GFP_KERNEL);
6b18662e
AV
826 if (!p)
827 return -ENOMEM;
bd238fb4
LI
828
829 csocket->sk->sk_allocation = GFP_NOIO;
aab174f0 830 file = sock_alloc_file(csocket, 0, NULL);
56b31d1c 831 if (IS_ERR(file)) {
5d385153
JP
832 pr_err("%s (%d): failed to map fd\n",
833 __func__, task_pid_nr(current));
6b18662e 834 kfree(p);
56b31d1c 835 return PTR_ERR(file);
bd238fb4
LI
836 }
837
56b31d1c
AV
838 get_file(file);
839 p->wr = p->rd = file;
6b18662e
AV
840 client->trans = p;
841 client->status = Connected;
842
6b18662e
AV
843 p->rd->f_flags |= O_NONBLOCK;
844
263c5828 845 p9_conn_create(client);
bd238fb4
LI
846 return 0;
847}
848
bd238fb4 849/**
263c5828 850 * p9_mux_destroy - cancels all pending requests of mux
5503ac56 851 * @m: mux to destroy
bd238fb4
LI
852 *
853 */
ee443996 854
5503ac56 855static void p9_conn_destroy(struct p9_conn *m)
bd238fb4 856{
5d385153
JP
857 p9_debug(P9_DEBUG_TRANS, "mux %p prev %p next %p\n",
858 m, m->mux_list.prev, m->mux_list.next);
bd238fb4 859
5503ac56
EVH
860 p9_mux_poll_stop(m);
861 cancel_work_sync(&m->rq);
862 cancel_work_sync(&m->wq);
bd238fb4 863
5503ac56 864 p9_conn_cancel(m, -ECONNRESET);
bd238fb4 865
5503ac56 866 m->client = NULL;
bd238fb4
LI
867}
868
869/**
8b81ef58
EVH
870 * p9_fd_close - shutdown file descriptor transport
871 * @client: client instance
bd238fb4
LI
872 *
873 */
ee443996 874
8b81ef58 875static void p9_fd_close(struct p9_client *client)
bd238fb4
LI
876{
877 struct p9_trans_fd *ts;
878
8b81ef58 879 if (!client)
bd238fb4
LI
880 return;
881
8b81ef58 882 ts = client->trans;
bd238fb4
LI
883 if (!ts)
884 return;
885
8b81ef58
EVH
886 client->status = Disconnected;
887
263c5828 888 p9_conn_destroy(&ts->conn);
8a0dc95f 889
bd238fb4
LI
890 if (ts->rd)
891 fput(ts->rd);
892 if (ts->wr)
893 fput(ts->wr);
8b81ef58 894
bd238fb4
LI
895 kfree(ts);
896}
897
887b3ece
EVH
/*
 * valid_ipaddr4 - check that a string starts with a dotted-quad IPv4 address
 * @buf: string to check, may be NULL
 *
 * Returns 0 when four dot-separated integers in the range 0..255 can be
 * parsed from the start of @buf, -EINVAL otherwise (including a NULL @buf).
 * Characters following the fourth number are not examined.
 *
 * stolen from NFS - maybe should be made a generic function?
 */
static inline int valid_ipaddr4(const char *buf)
{
	int rc, count, in[4];

	if (!buf)
		return -EINVAL;

	rc = sscanf(buf, "%d.%d.%d.%d", &in[0], &in[1], &in[2], &in[3]);
	if (rc != 4)
		return -EINVAL;
	for (count = 0; count < 4; count++) {
		/* %d also accepts a sign, so the lower bound needs checking */
		if (in[count] < 0 || in[count] > 255)
			return -EINVAL;
	}
	return 0;
}
914
2f28c8b3
JG
915static int p9_bind_privport(struct socket *sock)
916{
917 struct sockaddr_in cl;
918 int port, err = -EINVAL;
919
920 memset(&cl, 0, sizeof(cl));
921 cl.sin_family = AF_INET;
922 cl.sin_addr.s_addr = INADDR_ANY;
923 for (port = p9_ipport_resv_max; port >= p9_ipport_resv_min; port--) {
924 cl.sin_port = htons((ushort)port);
925 err = kernel_bind(sock, (struct sockaddr *)&cl, sizeof(cl));
926 if (err != -EADDRINUSE)
927 break;
928 }
929 return err;
930}
931
932
8b81ef58
EVH
933static int
934p9_fd_create_tcp(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
935{
936 int err;
a80d923e
EVH
937 struct socket *csocket;
938 struct sockaddr_in sin_server;
939 struct p9_fd_opts opts;
940
bb8ffdfc
EVH
941 err = parse_opts(args, &opts);
942 if (err < 0)
8b81ef58 943 return err;
a80d923e 944
887b3ece 945 if (valid_ipaddr4(addr) < 0)
8b81ef58 946 return -EINVAL;
887b3ece 947
a80d923e 948 csocket = NULL;
a80d923e 949
c4fac910
DH
950 client->trans_opts.tcp.port = opts.port;
951 client->trans_opts.tcp.privport = opts.privport;
a80d923e
EVH
952 sin_server.sin_family = AF_INET;
953 sin_server.sin_addr.s_addr = in_aton(addr);
954 sin_server.sin_port = htons(opts.port);
0c5c9fb5 955 err = __sock_create(current->nsproxy->net_ns, PF_INET,
e75762fd 956 SOCK_STREAM, IPPROTO_TCP, &csocket, 1);
6b18662e 957 if (err) {
5d385153
JP
958 pr_err("%s (%d): problem creating socket\n",
959 __func__, task_pid_nr(current));
6b18662e 960 return err;
a80d923e
EVH
961 }
962
2f28c8b3
JG
963 if (opts.privport) {
964 err = p9_bind_privport(csocket);
965 if (err < 0) {
966 pr_err("%s (%d): problem binding to privport\n",
967 __func__, task_pid_nr(current));
968 sock_release(csocket);
969 return err;
970 }
971 }
972
a80d923e
EVH
973 err = csocket->ops->connect(csocket,
974 (struct sockaddr *)&sin_server,
975 sizeof(struct sockaddr_in), 0);
976 if (err < 0) {
5d385153
JP
977 pr_err("%s (%d): problem connecting socket to %s\n",
978 __func__, task_pid_nr(current), addr);
a80d923e 979 sock_release(csocket);
6b18662e
AV
980 return err;
981 }
a80d923e 982
6b18662e 983 return p9_socket_open(client, csocket);
a80d923e
EVH
984}
985
8b81ef58
EVH
986static int
987p9_fd_create_unix(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
988{
989 int err;
990 struct socket *csocket;
991 struct sockaddr_un sun_server;
a80d923e
EVH
992
993 csocket = NULL;
a80d923e 994
cff6b8a9 995 if (strlen(addr) >= UNIX_PATH_MAX) {
5d385153
JP
996 pr_err("%s (%d): address too long: %s\n",
997 __func__, task_pid_nr(current), addr);
6b18662e 998 return -ENAMETOOLONG;
a80d923e
EVH
999 }
1000
1001 sun_server.sun_family = PF_UNIX;
1002 strcpy(sun_server.sun_path, addr);
0c5c9fb5 1003 err = __sock_create(current->nsproxy->net_ns, PF_UNIX,
e75762fd 1004 SOCK_STREAM, 0, &csocket, 1);
6b18662e 1005 if (err < 0) {
5d385153
JP
1006 pr_err("%s (%d): problem creating socket\n",
1007 __func__, task_pid_nr(current));
1008
6b18662e
AV
1009 return err;
1010 }
a80d923e
EVH
1011 err = csocket->ops->connect(csocket, (struct sockaddr *)&sun_server,
1012 sizeof(struct sockaddr_un) - 1, 0);
1013 if (err < 0) {
5d385153
JP
1014 pr_err("%s (%d): problem connecting socket: %s: %d\n",
1015 __func__, task_pid_nr(current), addr, err);
a80d923e 1016 sock_release(csocket);
6b18662e
AV
1017 return err;
1018 }
a80d923e 1019
6b18662e 1020 return p9_socket_open(client, csocket);
a80d923e
EVH
1021}
1022
8b81ef58
EVH
1023static int
1024p9_fd_create(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
1025{
1026 int err;
a80d923e
EVH
1027 struct p9_fd_opts opts;
1028
1029 parse_opts(args, &opts);
c4fac910
DH
1030 client->trans_opts.fd.rfd = opts.rfd;
1031 client->trans_opts.fd.wfd = opts.wfd;
a80d923e
EVH
1032
1033 if (opts.rfd == ~0 || opts.wfd == ~0) {
5d385153 1034 pr_err("Insufficient options for proto=fd\n");
8b81ef58 1035 return -ENOPROTOOPT;
a80d923e
EVH
1036 }
1037
8b81ef58 1038 err = p9_fd_open(client, opts.rfd, opts.wfd);
a80d923e 1039 if (err < 0)
6b18662e 1040 return err;
a80d923e 1041
263c5828 1042 p9_conn_create(client);
8a0dc95f 1043
8b81ef58 1044 return 0;
a80d923e
EVH
1045}
1046
1047static struct p9_trans_module p9_tcp_trans = {
1048 .name = "tcp",
1049 .maxsize = MAX_SOCK_BUF,
f94741fd 1050 .def = 0,
8b81ef58
EVH
1051 .create = p9_fd_create_tcp,
1052 .close = p9_fd_close,
91b8534f
EVH
1053 .request = p9_fd_request,
1054 .cancel = p9_fd_cancel,
afd8d654 1055 .cancelled = p9_fd_cancelled,
c4fac910 1056 .show_options = p9_fd_show_options,
72029fe8 1057 .owner = THIS_MODULE,
a80d923e
EVH
1058};
1059
1060static struct p9_trans_module p9_unix_trans = {
1061 .name = "unix",
1062 .maxsize = MAX_SOCK_BUF,
1063 .def = 0,
8b81ef58
EVH
1064 .create = p9_fd_create_unix,
1065 .close = p9_fd_close,
91b8534f
EVH
1066 .request = p9_fd_request,
1067 .cancel = p9_fd_cancel,
afd8d654 1068 .cancelled = p9_fd_cancelled,
c4fac910 1069 .show_options = p9_fd_show_options,
72029fe8 1070 .owner = THIS_MODULE,
a80d923e
EVH
1071};
1072
1073static struct p9_trans_module p9_fd_trans = {
1074 .name = "fd",
1075 .maxsize = MAX_SOCK_BUF,
1076 .def = 0,
8b81ef58
EVH
1077 .create = p9_fd_create,
1078 .close = p9_fd_close,
91b8534f
EVH
1079 .request = p9_fd_request,
1080 .cancel = p9_fd_cancel,
afd8d654 1081 .cancelled = p9_fd_cancelled,
c4fac910 1082 .show_options = p9_fd_show_options,
72029fe8 1083 .owner = THIS_MODULE,
a80d923e
EVH
1084};
1085
5503ac56 1086/**
4a026da9
SL
1087 * p9_poll_workfn - poll worker thread
1088 * @work: work queue
5503ac56
EVH
1089 *
1090 * polls all v9fs transports for new events and queues the appropriate
1091 * work to the work queue
1092 *
1093 */
1094
aa70c585 1095static void p9_poll_workfn(struct work_struct *work)
5503ac56
EVH
1096{
1097 unsigned long flags;
1098
5d385153 1099 p9_debug(P9_DEBUG_TRANS, "start %p\n", current);
aa70c585 1100
5503ac56
EVH
1101 spin_lock_irqsave(&p9_poll_lock, flags);
1102 while (!list_empty(&p9_poll_pending_list)) {
1103 struct p9_conn *conn = list_first_entry(&p9_poll_pending_list,
1104 struct p9_conn,
1105 poll_pending_link);
1106 list_del_init(&conn->poll_pending_link);
1107 spin_unlock_irqrestore(&p9_poll_lock, flags);
1108
1109 p9_poll_mux(conn);
1110
1111 spin_lock_irqsave(&p9_poll_lock, flags);
1112 }
1113 spin_unlock_irqrestore(&p9_poll_lock, flags);
1114
5d385153 1115 p9_debug(P9_DEBUG_TRANS, "finish\n");
5503ac56
EVH
1116}
1117
887b3ece 1118int p9_trans_fd_init(void)
a80d923e
EVH
1119{
1120 v9fs_register_trans(&p9_tcp_trans);
1121 v9fs_register_trans(&p9_unix_trans);
1122 v9fs_register_trans(&p9_fd_trans);
1123
3387b804 1124 return 0;
a80d923e 1125}
72029fe8
TH
1126
1127void p9_trans_fd_exit(void)
1128{
43829731 1129 flush_work(&p9_poll_work);
72029fe8
TH
1130 v9fs_unregister_trans(&p9_tcp_trans);
1131 v9fs_unregister_trans(&p9_unix_trans);
1132 v9fs_unregister_trans(&p9_fd_trans);
1133}