Merge branch 'overlayfs-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/mszer...
[linux-2.6-block.git] / net / 9p / trans_fd.c
CommitLineData
bd238fb4
LI
1/*
2 * linux/net/9p/trans_fd.c
3 *
4 * Fd transport layer. Includes deprecated socket layer.
5 *
6 * Copyright (C) 2006 by Russ Cox <rsc@swtch.com>
7 * Copyright (C) 2004-2005 by Latchesar Ionkov <lucho@ionkov.net>
8a0dc95f 8 * Copyright (C) 2004-2008 by Eric Van Hensbergen <ericvh@gmail.com>
bd238fb4
LI
9 * Copyright (C) 1997-2002 by Ron Minnich <rminnich@sarnoff.com>
10 *
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License version 2
13 * as published by the Free Software Foundation.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to:
22 * Free Software Foundation
23 * 51 Franklin Street, Fifth Floor
24 * Boston, MA 02111-1301 USA
25 *
26 */
27
5d385153
JP
28#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
29
bd238fb4
LI
30#include <linux/in.h>
31#include <linux/module.h>
32#include <linux/net.h>
33#include <linux/ipv6.h>
8a0dc95f 34#include <linux/kthread.h>
bd238fb4
LI
35#include <linux/errno.h>
36#include <linux/kernel.h>
37#include <linux/un.h>
38#include <linux/uaccess.h>
39#include <linux/inet.h>
40#include <linux/idr.h>
41#include <linux/file.h>
a80d923e 42#include <linux/parser.h>
5a0e3ad6 43#include <linux/slab.h>
bd238fb4 44#include <net/9p/9p.h>
8b81ef58 45#include <net/9p/client.h>
bd238fb4
LI
46#include <net/9p/transport.h>
47
6b18662e
AV
48#include <linux/syscalls.h> /* killme */
49
bd238fb4 50#define P9_PORT 564
a80d923e 51#define MAX_SOCK_BUF (64*1024)
8a0dc95f 52#define MAXPOLLWADDR 2
a80d923e 53
ee443996
EVH
54/**
55 * struct p9_fd_opts - per-transport options
56 * @rfd: file descriptor for reading (trans=fd)
57 * @wfd: file descriptor for writing (trans=fd)
58 * @port: port to connect to (trans=tcp)
59 *
60 */
61
a80d923e
EVH
62struct p9_fd_opts {
63 int rfd;
64 int wfd;
65 u16 port;
2f28c8b3 66 int privport;
a80d923e 67};
bd238fb4 68
a80d923e
EVH
69/*
70 * Option Parsing (code inspired by NFS code)
71 * - a little lazy - parse all fd-transport options
72 */
bd238fb4 73
a80d923e
EVH
enum {
	/* Options that take integer arguments */
	Opt_port,
	Opt_rfdno,
	Opt_wfdno,
	/* Paired with the NULL pattern that ends the tokens[] table */
	Opt_err,
	/* Options that take no arguments */
	Opt_privport,
};
bd238fb4 80
a447c093 81static const match_table_t tokens = {
a80d923e
EVH
82 {Opt_port, "port=%u"},
83 {Opt_rfdno, "rfdno=%u"},
84 {Opt_wfdno, "wfdno=%u"},
2f28c8b3 85 {Opt_privport, "privport"},
55762690 86 {Opt_err, NULL},
a80d923e 87};
bd238fb4 88
8a0dc95f
EVH
/*
 * Bit numbers used with set_bit()/clear_bit()/test_and_set_bit() on
 * p9_conn.wsched.
 */
enum {
	Rworksched	= 1,	/* read work scheduled or running */
	Rpending	= 2,	/* can read */
	Wworksched	= 4,	/* write work scheduled or running */
	Wpending	= 8,	/* can write */
};
95
992b3f1d
TH
96struct p9_poll_wait {
97 struct p9_conn *conn;
98 wait_queue_t wait;
99 wait_queue_head_t *wait_addr;
ee443996
EVH
100};
101
102/**
103 * struct p9_conn - fd mux connection state information
ee443996 104 * @mux_list: list link for mux to manage multiple connections (?)
8b81ef58 105 * @client: reference to client instance for this connection
ee443996 106 * @err: error state
ee443996
EVH
107 * @req_list: accounting for requests which have been sent
108 * @unsent_req_list: accounting for requests that haven't been sent
1b0a763b
EVH
109 * @req: current request being processed (if any)
110 * @tmp_buf: temporary buffer to read in header
947867aa 111 * @rc: temporary fcall for reading current frame
ee443996
EVH
112 * @wpos: write position for current frame
113 * @wsize: amount of data to write for current frame
114 * @wbuf: current write buffer
0e15597e 115 * @poll_pending_link: pending links to be polled per conn
ee443996 116 * @poll_wait: array of wait_q's for various worker threads
ee443996
EVH
117 * @pt: poll state
118 * @rq: current read work
119 * @wq: current write work
120 * @wsched: ????
121 *
122 */
8a0dc95f
EVH
123
124struct p9_conn {
8a0dc95f 125 struct list_head mux_list;
8b81ef58 126 struct p9_client *client;
8a0dc95f 127 int err;
8a0dc95f
EVH
128 struct list_head req_list;
129 struct list_head unsent_req_list;
1b0a763b
EVH
130 struct p9_req_t *req;
131 char tmp_buf[7];
947867aa 132 struct p9_fcall rc;
8a0dc95f
EVH
133 int wpos;
134 int wsize;
135 char *wbuf;
992b3f1d
TH
136 struct list_head poll_pending_link;
137 struct p9_poll_wait poll_wait[MAXPOLLWADDR];
8a0dc95f
EVH
138 poll_table pt;
139 struct work_struct rq;
140 struct work_struct wq;
141 unsigned long wsched;
142};
143
263c5828
SD
144/**
145 * struct p9_trans_fd - transport state
146 * @rd: reference to file to read from
147 * @wr: reference of file to write to
148 * @conn: connection state reference
149 *
150 */
151
152struct p9_trans_fd {
153 struct file *rd;
154 struct file *wr;
155 struct p9_conn conn;
156};
157
aa70c585
TH
158static void p9_poll_workfn(struct work_struct *work);
159
992b3f1d
TH
160static DEFINE_SPINLOCK(p9_poll_lock);
161static LIST_HEAD(p9_poll_pending_list);
aa70c585 162static DECLARE_WORK(p9_poll_work, p9_poll_workfn);
8a0dc95f 163
2f28c8b3
JG
164static unsigned int p9_ipport_resv_min = P9_DEF_MIN_RESVPORT;
165static unsigned int p9_ipport_resv_max = P9_DEF_MAX_RESVPORT;
166
992b3f1d 167static void p9_mux_poll_stop(struct p9_conn *m)
8a0dc95f 168{
992b3f1d
TH
169 unsigned long flags;
170 int i;
8a0dc95f 171
992b3f1d
TH
172 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
173 struct p9_poll_wait *pwait = &m->poll_wait[i];
8a0dc95f 174
992b3f1d
TH
175 if (pwait->wait_addr) {
176 remove_wait_queue(pwait->wait_addr, &pwait->wait);
177 pwait->wait_addr = NULL;
8a0dc95f 178 }
8a0dc95f
EVH
179 }
180
992b3f1d
TH
181 spin_lock_irqsave(&p9_poll_lock, flags);
182 list_del_init(&m->poll_pending_link);
183 spin_unlock_irqrestore(&p9_poll_lock, flags);
8a0dc95f
EVH
184}
185
186/**
5503ac56
EVH
187 * p9_conn_cancel - cancel all pending requests with error
188 * @m: mux data
189 * @err: error code
8a0dc95f 190 *
8a0dc95f 191 */
ee443996 192
51a87c55 193static void p9_conn_cancel(struct p9_conn *m, int err)
8a0dc95f 194{
673d62cd 195 struct p9_req_t *req, *rtmp;
91b8534f 196 unsigned long flags;
5503ac56 197 LIST_HEAD(cancel_list);
8a0dc95f 198
5d385153 199 p9_debug(P9_DEBUG_ERROR, "mux %p err %d\n", m, err);
7eb923b8 200
91b8534f 201 spin_lock_irqsave(&m->client->lock, flags);
7eb923b8
EVH
202
203 if (m->err) {
204 spin_unlock_irqrestore(&m->client->lock, flags);
205 return;
206 }
207
208 m->err = err;
209
5503ac56
EVH
210 list_for_each_entry_safe(req, rtmp, &m->req_list, req_list) {
211 list_move(&req->req_list, &cancel_list);
212 }
213 list_for_each_entry_safe(req, rtmp, &m->unsent_req_list, req_list) {
214 list_move(&req->req_list, &cancel_list);
8a0dc95f 215 }
91b8534f 216 spin_unlock_irqrestore(&m->client->lock, flags);
8a0dc95f 217
5503ac56 218 list_for_each_entry_safe(req, rtmp, &cancel_list, req_list) {
5d385153 219 p9_debug(P9_DEBUG_ERROR, "call back req %p\n", req);
1bab88b2 220 list_del(&req->req_list);
2b6e72ed
DM
221 if (!req->t_err)
222 req->t_err = err;
223 p9_client_cb(m->client, req, REQ_STATUS_ERROR);
8a0dc95f 224 }
8a0dc95f
EVH
225}
226
29af9309 227static int
5503ac56 228p9_fd_poll(struct p9_client *client, struct poll_table_struct *pt)
8a0dc95f 229{
5503ac56
EVH
230 int ret, n;
231 struct p9_trans_fd *ts = NULL;
8a0dc95f 232
5503ac56
EVH
233 if (client && client->status == Connected)
234 ts = client->trans;
7dc5d24b 235
5503ac56
EVH
236 if (!ts)
237 return -EREMOTEIO;
7dc5d24b 238
72c2d531 239 if (!ts->rd->f_op->poll)
5503ac56 240 return -EIO;
8a0dc95f 241
72c2d531 242 if (!ts->wr->f_op->poll)
5503ac56 243 return -EIO;
992b3f1d 244
5503ac56
EVH
245 ret = ts->rd->f_op->poll(ts->rd, pt);
246 if (ret < 0)
247 return ret;
992b3f1d 248
5503ac56
EVH
249 if (ts->rd != ts->wr) {
250 n = ts->wr->f_op->poll(ts->wr, pt);
251 if (n < 0)
252 return n;
253 ret = (ret & ~POLLOUT) | (n & ~POLLIN);
254 }
255
256 return ret;
992b3f1d
TH
257}
258
8a0dc95f 259/**
5503ac56
EVH
260 * p9_fd_read- read from a fd
261 * @client: client instance
262 * @v: buffer to receive data into
263 * @len: size of receive buffer
ee443996 264 *
8a0dc95f 265 */
ee443996 266
5503ac56 267static int p9_fd_read(struct p9_client *client, void *v, int len)
8a0dc95f 268{
5503ac56
EVH
269 int ret;
270 struct p9_trans_fd *ts = NULL;
8a0dc95f 271
5503ac56
EVH
272 if (client && client->status != Disconnected)
273 ts = client->trans;
8a0dc95f 274
5503ac56
EVH
275 if (!ts)
276 return -EREMOTEIO;
8a0dc95f 277
5503ac56 278 if (!(ts->rd->f_flags & O_NONBLOCK))
5d385153 279 p9_debug(P9_DEBUG_ERROR, "blocking read ...\n");
8a0dc95f 280
5503ac56
EVH
281 ret = kernel_read(ts->rd, ts->rd->f_pos, v, len);
282 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
283 client->status = Disconnected;
284 return ret;
8a0dc95f
EVH
285}
286
287/**
5503ac56
EVH
288 * p9_read_work - called when there is some data to be read from a transport
289 * @work: container of work to be done
ee443996 290 *
8a0dc95f 291 */
ee443996 292
5503ac56 293static void p9_read_work(struct work_struct *work)
8a0dc95f 294{
5503ac56
EVH
295 int n, err;
296 struct p9_conn *m;
2b6e72ed 297 int status = REQ_STATUS_ERROR;
5503ac56
EVH
298
299 m = container_of(work, struct p9_conn, rq);
8a0dc95f
EVH
300
301 if (m->err < 0)
302 return;
303
947867aa 304 p9_debug(P9_DEBUG_TRANS, "start mux %p pos %zd\n", m, m->rc.offset);
8a0dc95f 305
947867aa
DM
306 if (!m->rc.sdata) {
307 m->rc.sdata = m->tmp_buf;
308 m->rc.offset = 0;
309 m->rc.capacity = 7; /* start by reading header */
8a0dc95f
EVH
310 }
311
5503ac56 312 clear_bit(Rpending, &m->wsched);
947867aa
DM
313 p9_debug(P9_DEBUG_TRANS, "read mux %p pos %zd size: %zd = %zd\n",
314 m, m->rc.offset, m->rc.capacity,
315 m->rc.capacity - m->rc.offset);
316 err = p9_fd_read(m->client, m->rc.sdata + m->rc.offset,
317 m->rc.capacity - m->rc.offset);
5d385153 318 p9_debug(P9_DEBUG_TRANS, "mux %p got %d bytes\n", m, err);
947867aa 319 if (err == -EAGAIN)
0462194d 320 goto end_clear;
8a0dc95f 321
5503ac56
EVH
322 if (err <= 0)
323 goto error;
324
947867aa 325 m->rc.offset += err;
1b0a763b 326
947867aa
DM
327 /* header read in */
328 if ((!m->req) && (m->rc.offset == m->rc.capacity)) {
5d385153 329 p9_debug(P9_DEBUG_TRANS, "got new header\n");
1b0a763b 330
947867aa
DM
331 err = p9_parse_header(&m->rc, NULL, NULL, NULL, 0);
332 if (err) {
333 p9_debug(P9_DEBUG_ERROR,
334 "error parsing header: %d\n", err);
335 goto error;
336 }
337
338 if (m->rc.size >= m->client->msize) {
5d385153 339 p9_debug(P9_DEBUG_ERROR,
947867aa
DM
340 "requested packet size too big: %d\n",
341 m->rc.size);
5503ac56
EVH
342 err = -EIO;
343 goto error;
344 }
345
5d385153 346 p9_debug(P9_DEBUG_TRANS,
947867aa
DM
347 "mux %p pkt: size: %d bytes tag: %d\n",
348 m, m->rc.size, m->rc.tag);
1b0a763b 349
947867aa 350 m->req = p9_tag_lookup(m->client, m->rc.tag);
0bfd6845 351 if (!m->req || (m->req->status != REQ_STATUS_SENT)) {
5d385153 352 p9_debug(P9_DEBUG_ERROR, "Unexpected packet tag %d\n",
947867aa 353 m->rc.tag);
1b0a763b
EVH
354 err = -EIO;
355 goto error;
356 }
357
358 if (m->req->rc == NULL) {
3053600e
DM
359 p9_debug(P9_DEBUG_ERROR,
360 "No recv fcall for tag %d (req %p), disconnecting!\n",
361 m->rc.tag, m->req);
362 m->req = NULL;
363 err = -EIO;
364 goto error;
1b0a763b 365 }
947867aa
DM
366 m->rc.sdata = (char *)m->req->rc + sizeof(struct p9_fcall);
367 memcpy(m->rc.sdata, m->tmp_buf, m->rc.capacity);
368 m->rc.capacity = m->rc.size;
1b0a763b 369 }
5503ac56 370
947867aa
DM
371 /* packet is read in
372 * not an else because some packets (like clunk) have no payload
373 */
374 if ((m->req) && (m->rc.offset == m->rc.capacity)) {
5d385153 375 p9_debug(P9_DEBUG_TRANS, "got new packet\n");
7eb923b8 376 spin_lock(&m->client->lock);
1bab88b2 377 if (m->req->status != REQ_STATUS_ERROR)
2b6e72ed 378 status = REQ_STATUS_RCVD;
91b8534f 379 list_del(&m->req->req_list);
7eb923b8 380 spin_unlock(&m->client->lock);
2b6e72ed 381 p9_client_cb(m->client, m->req, status);
947867aa
DM
382 m->rc.sdata = NULL;
383 m->rc.offset = 0;
384 m->rc.capacity = 0;
1b0a763b 385 m->req = NULL;
5503ac56
EVH
386 }
387
0462194d
SD
388end_clear:
389 clear_bit(Rworksched, &m->wsched);
390
5503ac56
EVH
391 if (!list_empty(&m->req_list)) {
392 if (test_and_clear_bit(Rpending, &m->wsched))
393 n = POLLIN;
394 else
395 n = p9_fd_poll(m->client, NULL);
396
0462194d 397 if ((n & POLLIN) && !test_and_set_bit(Rworksched, &m->wsched)) {
5d385153 398 p9_debug(P9_DEBUG_TRANS, "sched read work %p\n", m);
61edeeed 399 schedule_work(&m->rq);
0462194d
SD
400 }
401 }
5503ac56
EVH
402
403 return;
5503ac56
EVH
404error:
405 p9_conn_cancel(m, err);
406 clear_bit(Rworksched, &m->wsched);
407}
408
409/**
410 * p9_fd_write - write to a socket
411 * @client: client instance
412 * @v: buffer to send data from
413 * @len: size of send buffer
ee443996 414 *
8a0dc95f 415 */
ee443996 416
5503ac56 417static int p9_fd_write(struct p9_client *client, void *v, int len)
8a0dc95f 418{
5503ac56
EVH
419 int ret;
420 mm_segment_t oldfs;
421 struct p9_trans_fd *ts = NULL;
8a0dc95f 422
5503ac56
EVH
423 if (client && client->status != Disconnected)
424 ts = client->trans;
8a0dc95f 425
5503ac56
EVH
426 if (!ts)
427 return -EREMOTEIO;
8a0dc95f 428
5503ac56 429 if (!(ts->wr->f_flags & O_NONBLOCK))
5d385153 430 p9_debug(P9_DEBUG_ERROR, "blocking write ...\n");
992b3f1d 431
5503ac56
EVH
432 oldfs = get_fs();
433 set_fs(get_ds());
434 /* The cast to a user pointer is valid due to the set_fs() */
e3db6cb4 435 ret = vfs_write(ts->wr, (__force void __user *)v, len, &ts->wr->f_pos);
5503ac56 436 set_fs(oldfs);
992b3f1d 437
5503ac56
EVH
438 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
439 client->status = Disconnected;
440 return ret;
8a0dc95f
EVH
441}
442
443/**
444 * p9_write_work - called when a transport can send some data
ee443996
EVH
445 * @work: container for work to be done
446 *
8a0dc95f 447 */
ee443996 448
8a0dc95f
EVH
449static void p9_write_work(struct work_struct *work)
450{
451 int n, err;
452 struct p9_conn *m;
673d62cd 453 struct p9_req_t *req;
8a0dc95f
EVH
454
455 m = container_of(work, struct p9_conn, wq);
456
457 if (m->err < 0) {
458 clear_bit(Wworksched, &m->wsched);
459 return;
460 }
461
462 if (!m->wsize) {
759f4298 463 spin_lock(&m->client->lock);
8a0dc95f
EVH
464 if (list_empty(&m->unsent_req_list)) {
465 clear_bit(Wworksched, &m->wsched);
759f4298 466 spin_unlock(&m->client->lock);
8a0dc95f
EVH
467 return;
468 }
469
673d62cd 470 req = list_entry(m->unsent_req_list.next, struct p9_req_t,
8a0dc95f 471 req_list);
673d62cd 472 req->status = REQ_STATUS_SENT;
5d385153 473 p9_debug(P9_DEBUG_TRANS, "move req %p\n", req);
8a0dc95f 474 list_move_tail(&req->req_list, &m->req_list);
8a0dc95f 475
673d62cd
EVH
476 m->wbuf = req->tc->sdata;
477 m->wsize = req->tc->size;
8a0dc95f 478 m->wpos = 0;
673d62cd 479 spin_unlock(&m->client->lock);
8a0dc95f
EVH
480 }
481
5d385153
JP
482 p9_debug(P9_DEBUG_TRANS, "mux %p pos %d size %d\n",
483 m, m->wpos, m->wsize);
8a0dc95f 484 clear_bit(Wpending, &m->wsched);
8b81ef58 485 err = p9_fd_write(m->client, m->wbuf + m->wpos, m->wsize - m->wpos);
5d385153 486 p9_debug(P9_DEBUG_TRANS, "mux %p sent %d bytes\n", m, err);
584a8c13
SD
487 if (err == -EAGAIN)
488 goto end_clear;
489
8a0dc95f
EVH
490
491 if (err < 0)
492 goto error;
493 else if (err == 0) {
494 err = -EREMOTEIO;
495 goto error;
496 }
497
498 m->wpos += err;
499 if (m->wpos == m->wsize)
500 m->wpos = m->wsize = 0;
501
584a8c13
SD
502end_clear:
503 clear_bit(Wworksched, &m->wsched);
504
1957b3a8 505 if (m->wsize || !list_empty(&m->unsent_req_list)) {
8a0dc95f
EVH
506 if (test_and_clear_bit(Wpending, &m->wsched))
507 n = POLLOUT;
508 else
8b81ef58 509 n = p9_fd_poll(m->client, NULL);
8a0dc95f 510
584a8c13
SD
511 if ((n & POLLOUT) &&
512 !test_and_set_bit(Wworksched, &m->wsched)) {
5d385153 513 p9_debug(P9_DEBUG_TRANS, "sched write work %p\n", m);
61edeeed 514 schedule_work(&m->wq);
584a8c13
SD
515 }
516 }
8a0dc95f
EVH
517
518 return;
519
520error:
521 p9_conn_cancel(m, err);
522 clear_bit(Wworksched, &m->wsched);
523}
524
95c96174 525static int p9_pollwake(wait_queue_t *wait, unsigned int mode, int sync, void *key)
8a0dc95f 526{
5503ac56
EVH
527 struct p9_poll_wait *pwait =
528 container_of(wait, struct p9_poll_wait, wait);
529 struct p9_conn *m = pwait->conn;
530 unsigned long flags;
8a0dc95f 531
5503ac56
EVH
532 spin_lock_irqsave(&p9_poll_lock, flags);
533 if (list_empty(&m->poll_pending_link))
534 list_add_tail(&m->poll_pending_link, &p9_poll_pending_list);
535 spin_unlock_irqrestore(&p9_poll_lock, flags);
8a0dc95f 536
aa70c585
TH
537 schedule_work(&p9_poll_work);
538 return 1;
8a0dc95f
EVH
539}
540
541/**
5503ac56
EVH
542 * p9_pollwait - add poll task to the wait queue
543 * @filp: file pointer being polled
544 * @wait_address: wait_q to block on
545 * @p: poll state
ee443996 546 *
5503ac56 547 * called by files poll operation to add v9fs-poll task to files wait queue
8a0dc95f 548 */
ee443996 549
5503ac56
EVH
550static void
551p9_pollwait(struct file *filp, wait_queue_head_t *wait_address, poll_table *p)
8a0dc95f 552{
5503ac56
EVH
553 struct p9_conn *m = container_of(p, struct p9_conn, pt);
554 struct p9_poll_wait *pwait = NULL;
555 int i;
8a0dc95f 556
5503ac56
EVH
557 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
558 if (m->poll_wait[i].wait_addr == NULL) {
559 pwait = &m->poll_wait[i];
560 break;
8a0dc95f 561 }
8a0dc95f
EVH
562 }
563
5503ac56 564 if (!pwait) {
5d385153 565 p9_debug(P9_DEBUG_ERROR, "not enough wait_address slots\n");
8a0dc95f
EVH
566 return;
567 }
568
5503ac56
EVH
569 pwait->conn = m;
570 pwait->wait_addr = wait_address;
571 init_waitqueue_func_entry(&pwait->wait, p9_pollwake);
572 add_wait_queue(wait_address, &pwait->wait);
573}
8a0dc95f 574
5503ac56 575/**
263c5828 576 * p9_conn_create - initialize the per-session mux data
5503ac56
EVH
577 * @client: client instance
578 *
579 * Note: Creates the polling task if this is the first session.
580 */
8a0dc95f 581
263c5828 582static void p9_conn_create(struct p9_client *client)
5503ac56 583{
95820a36 584 int n;
263c5828
SD
585 struct p9_trans_fd *ts = client->trans;
586 struct p9_conn *m = &ts->conn;
8a0dc95f 587
5d385153 588 p9_debug(P9_DEBUG_TRANS, "client %p msize %d\n", client, client->msize);
8a0dc95f 589
5503ac56
EVH
590 INIT_LIST_HEAD(&m->mux_list);
591 m->client = client;
8a0dc95f 592
5503ac56
EVH
593 INIT_LIST_HEAD(&m->req_list);
594 INIT_LIST_HEAD(&m->unsent_req_list);
595 INIT_WORK(&m->rq, p9_read_work);
596 INIT_WORK(&m->wq, p9_write_work);
597 INIT_LIST_HEAD(&m->poll_pending_link);
598 init_poll_funcptr(&m->pt, p9_pollwait);
8a0dc95f 599
5503ac56
EVH
600 n = p9_fd_poll(client, &m->pt);
601 if (n & POLLIN) {
5d385153 602 p9_debug(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56
EVH
603 set_bit(Rpending, &m->wsched);
604 }
8a0dc95f 605
5503ac56 606 if (n & POLLOUT) {
5d385153 607 p9_debug(P9_DEBUG_TRANS, "mux %p can write\n", m);
5503ac56
EVH
608 set_bit(Wpending, &m->wsched);
609 }
5503ac56 610}
8a0dc95f 611
5503ac56
EVH
612/**
613 * p9_poll_mux - polls a mux and schedules read or write works if necessary
614 * @m: connection to poll
615 *
616 */
617
618static void p9_poll_mux(struct p9_conn *m)
619{
620 int n;
621
622 if (m->err < 0)
623 return;
624
625 n = p9_fd_poll(m->client, NULL);
626 if (n < 0 || n & (POLLERR | POLLHUP | POLLNVAL)) {
5d385153 627 p9_debug(P9_DEBUG_TRANS, "error mux %p err %d\n", m, n);
5503ac56
EVH
628 if (n >= 0)
629 n = -ECONNRESET;
630 p9_conn_cancel(m, n);
631 }
632
633 if (n & POLLIN) {
634 set_bit(Rpending, &m->wsched);
5d385153 635 p9_debug(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56 636 if (!test_and_set_bit(Rworksched, &m->wsched)) {
5d385153 637 p9_debug(P9_DEBUG_TRANS, "sched read work %p\n", m);
61edeeed 638 schedule_work(&m->rq);
5503ac56
EVH
639 }
640 }
8a0dc95f 641
5503ac56
EVH
642 if (n & POLLOUT) {
643 set_bit(Wpending, &m->wsched);
5d385153 644 p9_debug(P9_DEBUG_TRANS, "mux %p can write\n", m);
f64f9e71
JP
645 if ((m->wsize || !list_empty(&m->unsent_req_list)) &&
646 !test_and_set_bit(Wworksched, &m->wsched)) {
5d385153 647 p9_debug(P9_DEBUG_TRANS, "sched write work %p\n", m);
61edeeed 648 schedule_work(&m->wq);
5503ac56
EVH
649 }
650 }
8a0dc95f
EVH
651}
652
653/**
91b8534f 654 * p9_fd_request - send 9P request
8a0dc95f
EVH
655 * The function can sleep until the request is scheduled for sending.
656 * The function can be interrupted. Return from the function is not
91b8534f 657 * a guarantee that the request is sent successfully.
8a0dc95f 658 *
91b8534f
EVH
659 * @client: client instance
660 * @req: request to be sent
ee443996 661 *
8a0dc95f 662 */
ee443996 663
91b8534f 664static int p9_fd_request(struct p9_client *client, struct p9_req_t *req)
8a0dc95f
EVH
665{
666 int n;
91b8534f 667 struct p9_trans_fd *ts = client->trans;
263c5828 668 struct p9_conn *m = &ts->conn;
8a0dc95f 669
5d385153
JP
670 p9_debug(P9_DEBUG_TRANS, "mux %p task %p tcall %p id %d\n",
671 m, current, req->tc, req->tc->id);
8a0dc95f 672 if (m->err < 0)
91b8534f 673 return m->err;
8a0dc95f 674
91b8534f 675 spin_lock(&client->lock);
7eb923b8 676 req->status = REQ_STATUS_UNSENT;
8a0dc95f 677 list_add_tail(&req->req_list, &m->unsent_req_list);
91b8534f 678 spin_unlock(&client->lock);
8a0dc95f
EVH
679
680 if (test_and_clear_bit(Wpending, &m->wsched))
681 n = POLLOUT;
682 else
8b81ef58 683 n = p9_fd_poll(m->client, NULL);
8a0dc95f
EVH
684
685 if (n & POLLOUT && !test_and_set_bit(Wworksched, &m->wsched))
61edeeed 686 schedule_work(&m->wq);
8a0dc95f 687
91b8534f 688 return 0;
8a0dc95f
EVH
689}
690
91b8534f 691static int p9_fd_cancel(struct p9_client *client, struct p9_req_t *req)
8a0dc95f 692{
7eb923b8 693 int ret = 1;
8a0dc95f 694
5d385153 695 p9_debug(P9_DEBUG_TRANS, "client %p req %p\n", client, req);
8a0dc95f 696
91b8534f 697 spin_lock(&client->lock);
91b8534f 698
91b8534f 699 if (req->status == REQ_STATUS_UNSENT) {
1bab88b2 700 list_del(&req->req_list);
91b8534f 701 req->status = REQ_STATUS_FLSHD;
7eb923b8 702 ret = 0;
0bfd6845 703 }
7eb923b8
EVH
704 spin_unlock(&client->lock);
705
706 return ret;
8a0dc95f
EVH
707}
708
afd8d654
SD
709static int p9_fd_cancelled(struct p9_client *client, struct p9_req_t *req)
710{
711 p9_debug(P9_DEBUG_TRANS, "client %p req %p\n", client, req);
712
713 /* we haven't received a response for oldreq,
714 * remove it from the list.
715 */
716 spin_lock(&client->lock);
717 list_del(&req->req_list);
718 spin_unlock(&client->lock);
719
720 return 0;
721}
722
a80d923e 723/**
0e15597e
AK
724 * parse_opts - parse mount options into p9_fd_opts structure
725 * @params: options string passed from mount
726 * @opts: fd transport-specific structure to parse options into
a80d923e 727 *
bb8ffdfc 728 * Returns 0 upon success, -ERRNO upon failure
a80d923e 729 */
bd238fb4 730
bb8ffdfc 731static int parse_opts(char *params, struct p9_fd_opts *opts)
bd238fb4 732{
a80d923e
EVH
733 char *p;
734 substring_t args[MAX_OPT_ARGS];
735 int option;
d8c8a9e3 736 char *options, *tmp_options;
bd238fb4 737
a80d923e
EVH
738 opts->port = P9_PORT;
739 opts->rfd = ~0;
740 opts->wfd = ~0;
b99baa43 741 opts->privport = 0;
bd238fb4 742
bb8ffdfc
EVH
743 if (!params)
744 return 0;
745
d8c8a9e3
EVH
746 tmp_options = kstrdup(params, GFP_KERNEL);
747 if (!tmp_options) {
5d385153
JP
748 p9_debug(P9_DEBUG_ERROR,
749 "failed to allocate copy of option string\n");
bb8ffdfc
EVH
750 return -ENOMEM;
751 }
d8c8a9e3 752 options = tmp_options;
bd238fb4 753
a80d923e
EVH
754 while ((p = strsep(&options, ",")) != NULL) {
755 int token;
bb8ffdfc 756 int r;
a80d923e
EVH
757 if (!*p)
758 continue;
759 token = match_token(p, tokens, args);
2f28c8b3 760 if ((token != Opt_err) && (token != Opt_privport)) {
15da4b16
AK
761 r = match_int(&args[0], &option);
762 if (r < 0) {
5d385153
JP
763 p9_debug(P9_DEBUG_ERROR,
764 "integer field, but no integer?\n");
15da4b16
AK
765 continue;
766 }
a80d923e
EVH
767 }
768 switch (token) {
769 case Opt_port:
770 opts->port = option;
771 break;
772 case Opt_rfdno:
773 opts->rfd = option;
774 break;
775 case Opt_wfdno:
776 opts->wfd = option;
777 break;
2f28c8b3
JG
778 case Opt_privport:
779 opts->privport = 1;
780 break;
a80d923e
EVH
781 default:
782 continue;
783 }
bd238fb4 784 }
d8c8a9e3
EVH
785
786 kfree(tmp_options);
bb8ffdfc 787 return 0;
bd238fb4 788}
bd238fb4 789
8b81ef58 790static int p9_fd_open(struct p9_client *client, int rfd, int wfd)
bd238fb4 791{
263c5828 792 struct p9_trans_fd *ts = kzalloc(sizeof(struct p9_trans_fd),
a80d923e
EVH
793 GFP_KERNEL);
794 if (!ts)
795 return -ENOMEM;
bd238fb4 796
a80d923e
EVH
797 ts->rd = fget(rfd);
798 ts->wr = fget(wfd);
799 if (!ts->rd || !ts->wr) {
800 if (ts->rd)
801 fput(ts->rd);
802 if (ts->wr)
803 fput(ts->wr);
804 kfree(ts);
805 return -EIO;
bd238fb4
LI
806 }
807
8b81ef58
EVH
808 client->trans = ts;
809 client->status = Connected;
bd238fb4 810
a80d923e 811 return 0;
bd238fb4 812}
bd238fb4 813
8b81ef58 814static int p9_socket_open(struct p9_client *client, struct socket *csocket)
bd238fb4 815{
6b18662e 816 struct p9_trans_fd *p;
56b31d1c 817 struct file *file;
6b18662e 818
263c5828 819 p = kzalloc(sizeof(struct p9_trans_fd), GFP_KERNEL);
6b18662e
AV
820 if (!p)
821 return -ENOMEM;
bd238fb4
LI
822
823 csocket->sk->sk_allocation = GFP_NOIO;
aab174f0 824 file = sock_alloc_file(csocket, 0, NULL);
56b31d1c 825 if (IS_ERR(file)) {
5d385153
JP
826 pr_err("%s (%d): failed to map fd\n",
827 __func__, task_pid_nr(current));
6b18662e
AV
828 sock_release(csocket);
829 kfree(p);
56b31d1c 830 return PTR_ERR(file);
bd238fb4
LI
831 }
832
56b31d1c
AV
833 get_file(file);
834 p->wr = p->rd = file;
6b18662e
AV
835 client->trans = p;
836 client->status = Connected;
837
6b18662e
AV
838 p->rd->f_flags |= O_NONBLOCK;
839
263c5828 840 p9_conn_create(client);
bd238fb4
LI
841 return 0;
842}
843
bd238fb4 844/**
263c5828 845 * p9_mux_destroy - cancels all pending requests of mux
5503ac56 846 * @m: mux to destroy
bd238fb4
LI
847 *
848 */
ee443996 849
5503ac56 850static void p9_conn_destroy(struct p9_conn *m)
bd238fb4 851{
5d385153
JP
852 p9_debug(P9_DEBUG_TRANS, "mux %p prev %p next %p\n",
853 m, m->mux_list.prev, m->mux_list.next);
bd238fb4 854
5503ac56
EVH
855 p9_mux_poll_stop(m);
856 cancel_work_sync(&m->rq);
857 cancel_work_sync(&m->wq);
bd238fb4 858
5503ac56 859 p9_conn_cancel(m, -ECONNRESET);
bd238fb4 860
5503ac56 861 m->client = NULL;
bd238fb4
LI
862}
863
864/**
8b81ef58
EVH
865 * p9_fd_close - shutdown file descriptor transport
866 * @client: client instance
bd238fb4
LI
867 *
868 */
ee443996 869
8b81ef58 870static void p9_fd_close(struct p9_client *client)
bd238fb4
LI
871{
872 struct p9_trans_fd *ts;
873
8b81ef58 874 if (!client)
bd238fb4
LI
875 return;
876
8b81ef58 877 ts = client->trans;
bd238fb4
LI
878 if (!ts)
879 return;
880
8b81ef58
EVH
881 client->status = Disconnected;
882
263c5828 883 p9_conn_destroy(&ts->conn);
8a0dc95f 884
bd238fb4
LI
885 if (ts->rd)
886 fput(ts->rd);
887 if (ts->wr)
888 fput(ts->wr);
8b81ef58 889
bd238fb4
LI
890 kfree(ts);
891}
892
887b3ece
EVH
/*
 * stolen from NFS - maybe should be made a generic function?
 *
 * Returns 0 when @buf starts with four '.'-separated decimal fields,
 * each in the range 0..255, and -EINVAL otherwise.  "%d" also accepts
 * a leading sign, so negative fields are rejected explicitly.
 */
static inline int valid_ipaddr4(const char *buf)
{
	int rc, count, in[4];

	rc = sscanf(buf, "%d.%d.%d.%d", &in[0], &in[1], &in[2], &in[3]);
	if (rc != 4)
		return -EINVAL;
	for (count = 0; count < 4; count++) {
		if (in[count] < 0 || in[count] > 255)
			return -EINVAL;
	}
	return 0;
}
909
2f28c8b3
JG
910static int p9_bind_privport(struct socket *sock)
911{
912 struct sockaddr_in cl;
913 int port, err = -EINVAL;
914
915 memset(&cl, 0, sizeof(cl));
916 cl.sin_family = AF_INET;
917 cl.sin_addr.s_addr = INADDR_ANY;
918 for (port = p9_ipport_resv_max; port >= p9_ipport_resv_min; port--) {
919 cl.sin_port = htons((ushort)port);
920 err = kernel_bind(sock, (struct sockaddr *)&cl, sizeof(cl));
921 if (err != -EADDRINUSE)
922 break;
923 }
924 return err;
925}
926
927
8b81ef58
EVH
928static int
929p9_fd_create_tcp(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
930{
931 int err;
a80d923e
EVH
932 struct socket *csocket;
933 struct sockaddr_in sin_server;
934 struct p9_fd_opts opts;
935
bb8ffdfc
EVH
936 err = parse_opts(args, &opts);
937 if (err < 0)
8b81ef58 938 return err;
a80d923e 939
887b3ece 940 if (valid_ipaddr4(addr) < 0)
8b81ef58 941 return -EINVAL;
887b3ece 942
a80d923e 943 csocket = NULL;
a80d923e
EVH
944
945 sin_server.sin_family = AF_INET;
946 sin_server.sin_addr.s_addr = in_aton(addr);
947 sin_server.sin_port = htons(opts.port);
0c5c9fb5 948 err = __sock_create(current->nsproxy->net_ns, PF_INET,
e75762fd 949 SOCK_STREAM, IPPROTO_TCP, &csocket, 1);
6b18662e 950 if (err) {
5d385153
JP
951 pr_err("%s (%d): problem creating socket\n",
952 __func__, task_pid_nr(current));
6b18662e 953 return err;
a80d923e
EVH
954 }
955
2f28c8b3
JG
956 if (opts.privport) {
957 err = p9_bind_privport(csocket);
958 if (err < 0) {
959 pr_err("%s (%d): problem binding to privport\n",
960 __func__, task_pid_nr(current));
961 sock_release(csocket);
962 return err;
963 }
964 }
965
a80d923e
EVH
966 err = csocket->ops->connect(csocket,
967 (struct sockaddr *)&sin_server,
968 sizeof(struct sockaddr_in), 0);
969 if (err < 0) {
5d385153
JP
970 pr_err("%s (%d): problem connecting socket to %s\n",
971 __func__, task_pid_nr(current), addr);
a80d923e 972 sock_release(csocket);
6b18662e
AV
973 return err;
974 }
a80d923e 975
6b18662e 976 return p9_socket_open(client, csocket);
a80d923e
EVH
977}
978
8b81ef58
EVH
979static int
980p9_fd_create_unix(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
981{
982 int err;
983 struct socket *csocket;
984 struct sockaddr_un sun_server;
a80d923e
EVH
985
986 csocket = NULL;
a80d923e 987
cff6b8a9 988 if (strlen(addr) >= UNIX_PATH_MAX) {
5d385153
JP
989 pr_err("%s (%d): address too long: %s\n",
990 __func__, task_pid_nr(current), addr);
6b18662e 991 return -ENAMETOOLONG;
a80d923e
EVH
992 }
993
994 sun_server.sun_family = PF_UNIX;
995 strcpy(sun_server.sun_path, addr);
0c5c9fb5 996 err = __sock_create(current->nsproxy->net_ns, PF_UNIX,
e75762fd 997 SOCK_STREAM, 0, &csocket, 1);
6b18662e 998 if (err < 0) {
5d385153
JP
999 pr_err("%s (%d): problem creating socket\n",
1000 __func__, task_pid_nr(current));
1001
6b18662e
AV
1002 return err;
1003 }
a80d923e
EVH
1004 err = csocket->ops->connect(csocket, (struct sockaddr *)&sun_server,
1005 sizeof(struct sockaddr_un) - 1, 0);
1006 if (err < 0) {
5d385153
JP
1007 pr_err("%s (%d): problem connecting socket: %s: %d\n",
1008 __func__, task_pid_nr(current), addr, err);
a80d923e 1009 sock_release(csocket);
6b18662e
AV
1010 return err;
1011 }
a80d923e 1012
6b18662e 1013 return p9_socket_open(client, csocket);
a80d923e
EVH
1014}
1015
8b81ef58
EVH
1016static int
1017p9_fd_create(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
1018{
1019 int err;
a80d923e
EVH
1020 struct p9_fd_opts opts;
1021
1022 parse_opts(args, &opts);
1023
1024 if (opts.rfd == ~0 || opts.wfd == ~0) {
5d385153 1025 pr_err("Insufficient options for proto=fd\n");
8b81ef58 1026 return -ENOPROTOOPT;
a80d923e
EVH
1027 }
1028
8b81ef58 1029 err = p9_fd_open(client, opts.rfd, opts.wfd);
a80d923e 1030 if (err < 0)
6b18662e 1031 return err;
a80d923e 1032
263c5828 1033 p9_conn_create(client);
8a0dc95f 1034
8b81ef58 1035 return 0;
a80d923e
EVH
1036}
1037
1038static struct p9_trans_module p9_tcp_trans = {
1039 .name = "tcp",
1040 .maxsize = MAX_SOCK_BUF,
f94741fd 1041 .def = 0,
8b81ef58
EVH
1042 .create = p9_fd_create_tcp,
1043 .close = p9_fd_close,
91b8534f
EVH
1044 .request = p9_fd_request,
1045 .cancel = p9_fd_cancel,
afd8d654 1046 .cancelled = p9_fd_cancelled,
72029fe8 1047 .owner = THIS_MODULE,
a80d923e
EVH
1048};
1049
1050static struct p9_trans_module p9_unix_trans = {
1051 .name = "unix",
1052 .maxsize = MAX_SOCK_BUF,
1053 .def = 0,
8b81ef58
EVH
1054 .create = p9_fd_create_unix,
1055 .close = p9_fd_close,
91b8534f
EVH
1056 .request = p9_fd_request,
1057 .cancel = p9_fd_cancel,
afd8d654 1058 .cancelled = p9_fd_cancelled,
72029fe8 1059 .owner = THIS_MODULE,
a80d923e
EVH
1060};
1061
1062static struct p9_trans_module p9_fd_trans = {
1063 .name = "fd",
1064 .maxsize = MAX_SOCK_BUF,
1065 .def = 0,
8b81ef58
EVH
1066 .create = p9_fd_create,
1067 .close = p9_fd_close,
91b8534f
EVH
1068 .request = p9_fd_request,
1069 .cancel = p9_fd_cancel,
afd8d654 1070 .cancelled = p9_fd_cancelled,
72029fe8 1071 .owner = THIS_MODULE,
a80d923e
EVH
1072};
1073
5503ac56
EVH
1074/**
1075 * p9_poll_proc - poll worker thread
1076 * @a: thread state and arguments
1077 *
1078 * polls all v9fs transports for new events and queues the appropriate
1079 * work to the work queue
1080 *
1081 */
1082
aa70c585 1083static void p9_poll_workfn(struct work_struct *work)
5503ac56
EVH
1084{
1085 unsigned long flags;
1086
5d385153 1087 p9_debug(P9_DEBUG_TRANS, "start %p\n", current);
aa70c585 1088
5503ac56
EVH
1089 spin_lock_irqsave(&p9_poll_lock, flags);
1090 while (!list_empty(&p9_poll_pending_list)) {
1091 struct p9_conn *conn = list_first_entry(&p9_poll_pending_list,
1092 struct p9_conn,
1093 poll_pending_link);
1094 list_del_init(&conn->poll_pending_link);
1095 spin_unlock_irqrestore(&p9_poll_lock, flags);
1096
1097 p9_poll_mux(conn);
1098
1099 spin_lock_irqsave(&p9_poll_lock, flags);
1100 }
1101 spin_unlock_irqrestore(&p9_poll_lock, flags);
1102
5d385153 1103 p9_debug(P9_DEBUG_TRANS, "finish\n");
5503ac56
EVH
1104}
1105
887b3ece 1106int p9_trans_fd_init(void)
a80d923e
EVH
1107{
1108 v9fs_register_trans(&p9_tcp_trans);
1109 v9fs_register_trans(&p9_unix_trans);
1110 v9fs_register_trans(&p9_fd_trans);
1111
3387b804 1112 return 0;
a80d923e 1113}
72029fe8
TH
1114
1115void p9_trans_fd_exit(void)
1116{
43829731 1117 flush_work(&p9_poll_work);
72029fe8
TH
1118 v9fs_unregister_trans(&p9_tcp_trans);
1119 v9fs_unregister_trans(&p9_unix_trans);
1120 v9fs_unregister_trans(&p9_fd_trans);
1121}