9P: Add memory barriers to protect request fields over cb/rpc threads handoff
[linux-2.6-block.git] / net / 9p / trans_fd.c
CommitLineData
bd238fb4
LI
1/*
2 * linux/fs/9p/trans_fd.c
3 *
4 * Fd transport layer. Includes deprecated socket layer.
5 *
6 * Copyright (C) 2006 by Russ Cox <rsc@swtch.com>
7 * Copyright (C) 2004-2005 by Latchesar Ionkov <lucho@ionkov.net>
8a0dc95f 8 * Copyright (C) 2004-2008 by Eric Van Hensbergen <ericvh@gmail.com>
bd238fb4
LI
9 * Copyright (C) 1997-2002 by Ron Minnich <rminnich@sarnoff.com>
10 *
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License version 2
13 * as published by the Free Software Foundation.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to:
22 * Free Software Foundation
23 * 51 Franklin Street, Fifth Floor
24 * Boston, MA 02111-1301 USA
25 *
26 */
27
5d385153
JP
28#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
29
bd238fb4
LI
30#include <linux/in.h>
31#include <linux/module.h>
32#include <linux/net.h>
33#include <linux/ipv6.h>
8a0dc95f 34#include <linux/kthread.h>
bd238fb4
LI
35#include <linux/errno.h>
36#include <linux/kernel.h>
37#include <linux/un.h>
38#include <linux/uaccess.h>
39#include <linux/inet.h>
40#include <linux/idr.h>
41#include <linux/file.h>
a80d923e 42#include <linux/parser.h>
5a0e3ad6 43#include <linux/slab.h>
bd238fb4 44#include <net/9p/9p.h>
8b81ef58 45#include <net/9p/client.h>
bd238fb4
LI
46#include <net/9p/transport.h>
47
6b18662e
AV
48#include <linux/syscalls.h> /* killme */
49
bd238fb4 50#define P9_PORT 564
a80d923e 51#define MAX_SOCK_BUF (64*1024)
8a0dc95f 52#define MAXPOLLWADDR 2
a80d923e 53
ee443996
EVH
54/**
55 * struct p9_fd_opts - per-transport options
56 * @rfd: file descriptor for reading (trans=fd)
57 * @wfd: file descriptor for writing (trans=fd)
58 * @port: port to connect to (trans=tcp)
59 *
60 */
61
a80d923e
EVH
62struct p9_fd_opts {
63 int rfd;
64 int wfd;
65 u16 port;
2f28c8b3 66 int privport;
a80d923e 67};
bd238fb4 68
ee443996
EVH
/**
 * struct p9_trans_fd - transport state
 * @rd: reference to file to read from
 * @wr: reference to file to write to (the same file as @rd for sockets)
 * @conn: connection (mux) state created by p9_conn_create()
 *
 */

struct p9_trans_fd {
	struct file *rd;
	struct file *wr;
	struct p9_conn *conn;
};
82
a80d923e
EVH
83/*
84 * Option Parsing (code inspired by NFS code)
85 * - a little lazy - parse all fd-transport options
86 */
bd238fb4 87
a80d923e
EVH
/* Token identifiers returned by match_token() in parse_opts(). */
enum {
	/* Options that take integer arguments */
	Opt_port, Opt_rfdno, Opt_wfdno, Opt_err,
	/* Options that take no arguments */
	Opt_privport,
};
bd238fb4 94
a447c093 95static const match_table_t tokens = {
a80d923e
EVH
96 {Opt_port, "port=%u"},
97 {Opt_rfdno, "rfdno=%u"},
98 {Opt_wfdno, "wfdno=%u"},
2f28c8b3 99 {Opt_privport, "privport"},
55762690 100 {Opt_err, NULL},
a80d923e 101};
bd238fb4 102
8a0dc95f
EVH
/*
 * State bits kept in p9_conn.wsched.
 *
 * NOTE: these values are handed to set_bit()/clear_bit()/test_and_set_bit()
 * as bit *numbers*, not as masks, so they only need to be distinct.
 */
enum {
	Rworksched = 1,		/* read work scheduled or running */
	Rpending = 2,		/* can read */
	Wworksched = 4,		/* write work scheduled or running */
	Wpending = 8,		/* can write */
};
109
992b3f1d
TH
110struct p9_poll_wait {
111 struct p9_conn *conn;
112 wait_queue_t wait;
113 wait_queue_head_t *wait_addr;
ee443996
EVH
114};
115
116/**
117 * struct p9_conn - fd mux connection state information
ee443996 118 * @mux_list: list link for mux to manage multiple connections (?)
8b81ef58 119 * @client: reference to client instance for this connection
ee443996 120 * @err: error state
ee443996
EVH
121 * @req_list: accounting for requests which have been sent
122 * @unsent_req_list: accounting for requests that haven't been sent
1b0a763b
EVH
123 * @req: current request being processed (if any)
124 * @tmp_buf: temporary buffer to read in header
125 * @rsize: amount to read for current frame
ee443996
EVH
126 * @rpos: read position in current frame
127 * @rbuf: current read buffer
128 * @wpos: write position for current frame
129 * @wsize: amount of data to write for current frame
130 * @wbuf: current write buffer
0e15597e 131 * @poll_pending_link: pending links to be polled per conn
ee443996 132 * @poll_wait: array of wait_q's for various worker threads
ee443996
EVH
133 * @pt: poll state
134 * @rq: current read work
135 * @wq: current write work
136 * @wsched: ????
137 *
138 */
8a0dc95f
EVH
139
140struct p9_conn {
8a0dc95f 141 struct list_head mux_list;
8b81ef58 142 struct p9_client *client;
8a0dc95f 143 int err;
8a0dc95f
EVH
144 struct list_head req_list;
145 struct list_head unsent_req_list;
1b0a763b
EVH
146 struct p9_req_t *req;
147 char tmp_buf[7];
148 int rsize;
8a0dc95f
EVH
149 int rpos;
150 char *rbuf;
151 int wpos;
152 int wsize;
153 char *wbuf;
992b3f1d
TH
154 struct list_head poll_pending_link;
155 struct p9_poll_wait poll_wait[MAXPOLLWADDR];
8a0dc95f
EVH
156 poll_table pt;
157 struct work_struct rq;
158 struct work_struct wq;
159 unsigned long wsched;
160};
161
aa70c585
TH
162static void p9_poll_workfn(struct work_struct *work);
163
992b3f1d
TH
164static DEFINE_SPINLOCK(p9_poll_lock);
165static LIST_HEAD(p9_poll_pending_list);
aa70c585 166static DECLARE_WORK(p9_poll_work, p9_poll_workfn);
8a0dc95f 167
2f28c8b3
JG
168static unsigned int p9_ipport_resv_min = P9_DEF_MIN_RESVPORT;
169static unsigned int p9_ipport_resv_max = P9_DEF_MAX_RESVPORT;
170
992b3f1d 171static void p9_mux_poll_stop(struct p9_conn *m)
8a0dc95f 172{
992b3f1d
TH
173 unsigned long flags;
174 int i;
8a0dc95f 175
992b3f1d
TH
176 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
177 struct p9_poll_wait *pwait = &m->poll_wait[i];
8a0dc95f 178
992b3f1d
TH
179 if (pwait->wait_addr) {
180 remove_wait_queue(pwait->wait_addr, &pwait->wait);
181 pwait->wait_addr = NULL;
8a0dc95f 182 }
8a0dc95f
EVH
183 }
184
992b3f1d
TH
185 spin_lock_irqsave(&p9_poll_lock, flags);
186 list_del_init(&m->poll_pending_link);
187 spin_unlock_irqrestore(&p9_poll_lock, flags);
8a0dc95f
EVH
188}
189
190/**
5503ac56
EVH
191 * p9_conn_cancel - cancel all pending requests with error
192 * @m: mux data
193 * @err: error code
8a0dc95f 194 *
8a0dc95f 195 */
ee443996 196
51a87c55 197static void p9_conn_cancel(struct p9_conn *m, int err)
8a0dc95f 198{
673d62cd 199 struct p9_req_t *req, *rtmp;
91b8534f 200 unsigned long flags;
5503ac56 201 LIST_HEAD(cancel_list);
8a0dc95f 202
5d385153 203 p9_debug(P9_DEBUG_ERROR, "mux %p err %d\n", m, err);
7eb923b8 204
91b8534f 205 spin_lock_irqsave(&m->client->lock, flags);
7eb923b8
EVH
206
207 if (m->err) {
208 spin_unlock_irqrestore(&m->client->lock, flags);
209 return;
210 }
211
212 m->err = err;
213
5503ac56
EVH
214 list_for_each_entry_safe(req, rtmp, &m->req_list, req_list) {
215 list_move(&req->req_list, &cancel_list);
216 }
217 list_for_each_entry_safe(req, rtmp, &m->unsent_req_list, req_list) {
218 list_move(&req->req_list, &cancel_list);
8a0dc95f 219 }
91b8534f 220 spin_unlock_irqrestore(&m->client->lock, flags);
8a0dc95f 221
5503ac56 222 list_for_each_entry_safe(req, rtmp, &cancel_list, req_list) {
5d385153 223 p9_debug(P9_DEBUG_ERROR, "call back req %p\n", req);
1bab88b2 224 list_del(&req->req_list);
2b6e72ed
DM
225 if (!req->t_err)
226 req->t_err = err;
227 p9_client_cb(m->client, req, REQ_STATUS_ERROR);
8a0dc95f 228 }
8a0dc95f
EVH
229}
230
29af9309 231static int
5503ac56 232p9_fd_poll(struct p9_client *client, struct poll_table_struct *pt)
8a0dc95f 233{
5503ac56
EVH
234 int ret, n;
235 struct p9_trans_fd *ts = NULL;
8a0dc95f 236
5503ac56
EVH
237 if (client && client->status == Connected)
238 ts = client->trans;
7dc5d24b 239
5503ac56
EVH
240 if (!ts)
241 return -EREMOTEIO;
7dc5d24b 242
72c2d531 243 if (!ts->rd->f_op->poll)
5503ac56 244 return -EIO;
8a0dc95f 245
72c2d531 246 if (!ts->wr->f_op->poll)
5503ac56 247 return -EIO;
992b3f1d 248
5503ac56
EVH
249 ret = ts->rd->f_op->poll(ts->rd, pt);
250 if (ret < 0)
251 return ret;
992b3f1d 252
5503ac56
EVH
253 if (ts->rd != ts->wr) {
254 n = ts->wr->f_op->poll(ts->wr, pt);
255 if (n < 0)
256 return n;
257 ret = (ret & ~POLLOUT) | (n & ~POLLIN);
258 }
259
260 return ret;
992b3f1d
TH
261}
262
8a0dc95f 263/**
5503ac56
EVH
264 * p9_fd_read- read from a fd
265 * @client: client instance
266 * @v: buffer to receive data into
267 * @len: size of receive buffer
ee443996 268 *
8a0dc95f 269 */
ee443996 270
5503ac56 271static int p9_fd_read(struct p9_client *client, void *v, int len)
8a0dc95f 272{
5503ac56
EVH
273 int ret;
274 struct p9_trans_fd *ts = NULL;
8a0dc95f 275
5503ac56
EVH
276 if (client && client->status != Disconnected)
277 ts = client->trans;
8a0dc95f 278
5503ac56
EVH
279 if (!ts)
280 return -EREMOTEIO;
8a0dc95f 281
5503ac56 282 if (!(ts->rd->f_flags & O_NONBLOCK))
5d385153 283 p9_debug(P9_DEBUG_ERROR, "blocking read ...\n");
8a0dc95f 284
5503ac56
EVH
285 ret = kernel_read(ts->rd, ts->rd->f_pos, v, len);
286 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
287 client->status = Disconnected;
288 return ret;
8a0dc95f
EVH
289}
290
291/**
5503ac56
EVH
292 * p9_read_work - called when there is some data to be read from a transport
293 * @work: container of work to be done
ee443996 294 *
8a0dc95f 295 */
ee443996 296
5503ac56 297static void p9_read_work(struct work_struct *work)
8a0dc95f 298{
5503ac56
EVH
299 int n, err;
300 struct p9_conn *m;
2b6e72ed 301 int status = REQ_STATUS_ERROR;
5503ac56
EVH
302
303 m = container_of(work, struct p9_conn, rq);
8a0dc95f
EVH
304
305 if (m->err < 0)
306 return;
307
5d385153 308 p9_debug(P9_DEBUG_TRANS, "start mux %p pos %d\n", m, m->rpos);
8a0dc95f 309
1b0a763b
EVH
310 if (!m->rbuf) {
311 m->rbuf = m->tmp_buf;
5503ac56 312 m->rpos = 0;
1b0a763b 313 m->rsize = 7; /* start by reading header */
8a0dc95f
EVH
314 }
315
5503ac56 316 clear_bit(Rpending, &m->wsched);
5d385153
JP
317 p9_debug(P9_DEBUG_TRANS, "read mux %p pos %d size: %d = %d\n",
318 m, m->rpos, m->rsize, m->rsize-m->rpos);
5503ac56 319 err = p9_fd_read(m->client, m->rbuf + m->rpos,
1b0a763b 320 m->rsize - m->rpos);
5d385153 321 p9_debug(P9_DEBUG_TRANS, "mux %p got %d bytes\n", m, err);
5503ac56 322 if (err == -EAGAIN) {
0462194d 323 goto end_clear;
8a0dc95f 324 }
8a0dc95f 325
5503ac56
EVH
326 if (err <= 0)
327 goto error;
328
329 m->rpos += err;
1b0a763b
EVH
330
331 if ((!m->req) && (m->rpos == m->rsize)) { /* header read in */
332 u16 tag;
5d385153 333 p9_debug(P9_DEBUG_TRANS, "got new header\n");
1b0a763b
EVH
334
335 n = le32_to_cpu(*(__le32 *) m->rbuf); /* read packet size */
5503ac56 336 if (n >= m->client->msize) {
5d385153
JP
337 p9_debug(P9_DEBUG_ERROR,
338 "requested packet size too big: %d\n", n);
5503ac56
EVH
339 err = -EIO;
340 goto error;
341 }
342
1b0a763b 343 tag = le16_to_cpu(*(__le16 *) (m->rbuf+5)); /* read tag */
5d385153
JP
344 p9_debug(P9_DEBUG_TRANS,
345 "mux %p pkt: size: %d bytes tag: %d\n", m, n, tag);
1b0a763b
EVH
346
347 m->req = p9_tag_lookup(m->client, tag);
1bab88b2
LI
348 if (!m->req || (m->req->status != REQ_STATUS_SENT &&
349 m->req->status != REQ_STATUS_FLSH)) {
5d385153
JP
350 p9_debug(P9_DEBUG_ERROR, "Unexpected packet tag %d\n",
351 tag);
1b0a763b
EVH
352 err = -EIO;
353 goto error;
354 }
355
356 if (m->req->rc == NULL) {
357 m->req->rc = kmalloc(sizeof(struct p9_fcall) +
eeff66ef 358 m->client->msize, GFP_NOFS);
1b0a763b
EVH
359 if (!m->req->rc) {
360 m->req = NULL;
361 err = -ENOMEM;
362 goto error;
363 }
364 }
365 m->rbuf = (char *)m->req->rc + sizeof(struct p9_fcall);
366 memcpy(m->rbuf, m->tmp_buf, m->rsize);
367 m->rsize = n;
368 }
5503ac56 369
1b0a763b
EVH
370 /* not an else because some packets (like clunk) have no payload */
371 if ((m->req) && (m->rpos == m->rsize)) { /* packet is read in */
5d385153 372 p9_debug(P9_DEBUG_TRANS, "got new packet\n");
7eb923b8 373 spin_lock(&m->client->lock);
1bab88b2 374 if (m->req->status != REQ_STATUS_ERROR)
2b6e72ed 375 status = REQ_STATUS_RCVD;
91b8534f 376 list_del(&m->req->req_list);
7eb923b8 377 spin_unlock(&m->client->lock);
2b6e72ed 378 p9_client_cb(m->client, m->req, status);
1b0a763b
EVH
379 m->rbuf = NULL;
380 m->rpos = 0;
381 m->rsize = 0;
1b0a763b 382 m->req = NULL;
5503ac56
EVH
383 }
384
0462194d
SD
385end_clear:
386 clear_bit(Rworksched, &m->wsched);
387
5503ac56
EVH
388 if (!list_empty(&m->req_list)) {
389 if (test_and_clear_bit(Rpending, &m->wsched))
390 n = POLLIN;
391 else
392 n = p9_fd_poll(m->client, NULL);
393
0462194d 394 if ((n & POLLIN) && !test_and_set_bit(Rworksched, &m->wsched)) {
5d385153 395 p9_debug(P9_DEBUG_TRANS, "sched read work %p\n", m);
61edeeed 396 schedule_work(&m->rq);
0462194d
SD
397 }
398 }
5503ac56
EVH
399
400 return;
5503ac56
EVH
401error:
402 p9_conn_cancel(m, err);
403 clear_bit(Rworksched, &m->wsched);
404}
405
406/**
407 * p9_fd_write - write to a socket
408 * @client: client instance
409 * @v: buffer to send data from
410 * @len: size of send buffer
ee443996 411 *
8a0dc95f 412 */
ee443996 413
5503ac56 414static int p9_fd_write(struct p9_client *client, void *v, int len)
8a0dc95f 415{
5503ac56
EVH
416 int ret;
417 mm_segment_t oldfs;
418 struct p9_trans_fd *ts = NULL;
8a0dc95f 419
5503ac56
EVH
420 if (client && client->status != Disconnected)
421 ts = client->trans;
8a0dc95f 422
5503ac56
EVH
423 if (!ts)
424 return -EREMOTEIO;
8a0dc95f 425
5503ac56 426 if (!(ts->wr->f_flags & O_NONBLOCK))
5d385153 427 p9_debug(P9_DEBUG_ERROR, "blocking write ...\n");
992b3f1d 428
5503ac56
EVH
429 oldfs = get_fs();
430 set_fs(get_ds());
431 /* The cast to a user pointer is valid due to the set_fs() */
e3db6cb4 432 ret = vfs_write(ts->wr, (__force void __user *)v, len, &ts->wr->f_pos);
5503ac56 433 set_fs(oldfs);
992b3f1d 434
5503ac56
EVH
435 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
436 client->status = Disconnected;
437 return ret;
8a0dc95f
EVH
438}
439
440/**
441 * p9_write_work - called when a transport can send some data
ee443996
EVH
442 * @work: container for work to be done
443 *
8a0dc95f 444 */
ee443996 445
8a0dc95f
EVH
446static void p9_write_work(struct work_struct *work)
447{
448 int n, err;
449 struct p9_conn *m;
673d62cd 450 struct p9_req_t *req;
8a0dc95f
EVH
451
452 m = container_of(work, struct p9_conn, wq);
453
454 if (m->err < 0) {
455 clear_bit(Wworksched, &m->wsched);
456 return;
457 }
458
459 if (!m->wsize) {
759f4298 460 spin_lock(&m->client->lock);
8a0dc95f
EVH
461 if (list_empty(&m->unsent_req_list)) {
462 clear_bit(Wworksched, &m->wsched);
759f4298 463 spin_unlock(&m->client->lock);
8a0dc95f
EVH
464 return;
465 }
466
673d62cd 467 req = list_entry(m->unsent_req_list.next, struct p9_req_t,
8a0dc95f 468 req_list);
673d62cd 469 req->status = REQ_STATUS_SENT;
5d385153 470 p9_debug(P9_DEBUG_TRANS, "move req %p\n", req);
8a0dc95f 471 list_move_tail(&req->req_list, &m->req_list);
8a0dc95f 472
673d62cd
EVH
473 m->wbuf = req->tc->sdata;
474 m->wsize = req->tc->size;
8a0dc95f 475 m->wpos = 0;
673d62cd 476 spin_unlock(&m->client->lock);
8a0dc95f
EVH
477 }
478
5d385153
JP
479 p9_debug(P9_DEBUG_TRANS, "mux %p pos %d size %d\n",
480 m, m->wpos, m->wsize);
8a0dc95f 481 clear_bit(Wpending, &m->wsched);
8b81ef58 482 err = p9_fd_write(m->client, m->wbuf + m->wpos, m->wsize - m->wpos);
5d385153 483 p9_debug(P9_DEBUG_TRANS, "mux %p sent %d bytes\n", m, err);
584a8c13
SD
484 if (err == -EAGAIN)
485 goto end_clear;
486
8a0dc95f
EVH
487
488 if (err < 0)
489 goto error;
490 else if (err == 0) {
491 err = -EREMOTEIO;
492 goto error;
493 }
494
495 m->wpos += err;
496 if (m->wpos == m->wsize)
497 m->wpos = m->wsize = 0;
498
584a8c13
SD
499end_clear:
500 clear_bit(Wworksched, &m->wsched);
501
1957b3a8 502 if (m->wsize || !list_empty(&m->unsent_req_list)) {
8a0dc95f
EVH
503 if (test_and_clear_bit(Wpending, &m->wsched))
504 n = POLLOUT;
505 else
8b81ef58 506 n = p9_fd_poll(m->client, NULL);
8a0dc95f 507
584a8c13
SD
508 if ((n & POLLOUT) &&
509 !test_and_set_bit(Wworksched, &m->wsched)) {
5d385153 510 p9_debug(P9_DEBUG_TRANS, "sched write work %p\n", m);
61edeeed 511 schedule_work(&m->wq);
584a8c13
SD
512 }
513 }
8a0dc95f
EVH
514
515 return;
516
517error:
518 p9_conn_cancel(m, err);
519 clear_bit(Wworksched, &m->wsched);
520}
521
95c96174 522static int p9_pollwake(wait_queue_t *wait, unsigned int mode, int sync, void *key)
8a0dc95f 523{
5503ac56
EVH
524 struct p9_poll_wait *pwait =
525 container_of(wait, struct p9_poll_wait, wait);
526 struct p9_conn *m = pwait->conn;
527 unsigned long flags;
8a0dc95f 528
5503ac56
EVH
529 spin_lock_irqsave(&p9_poll_lock, flags);
530 if (list_empty(&m->poll_pending_link))
531 list_add_tail(&m->poll_pending_link, &p9_poll_pending_list);
532 spin_unlock_irqrestore(&p9_poll_lock, flags);
8a0dc95f 533
aa70c585
TH
534 schedule_work(&p9_poll_work);
535 return 1;
8a0dc95f
EVH
536}
537
538/**
5503ac56
EVH
539 * p9_pollwait - add poll task to the wait queue
540 * @filp: file pointer being polled
541 * @wait_address: wait_q to block on
542 * @p: poll state
ee443996 543 *
5503ac56 544 * called by files poll operation to add v9fs-poll task to files wait queue
8a0dc95f 545 */
ee443996 546
5503ac56
EVH
547static void
548p9_pollwait(struct file *filp, wait_queue_head_t *wait_address, poll_table *p)
8a0dc95f 549{
5503ac56
EVH
550 struct p9_conn *m = container_of(p, struct p9_conn, pt);
551 struct p9_poll_wait *pwait = NULL;
552 int i;
8a0dc95f 553
5503ac56
EVH
554 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
555 if (m->poll_wait[i].wait_addr == NULL) {
556 pwait = &m->poll_wait[i];
557 break;
8a0dc95f 558 }
8a0dc95f
EVH
559 }
560
5503ac56 561 if (!pwait) {
5d385153 562 p9_debug(P9_DEBUG_ERROR, "not enough wait_address slots\n");
8a0dc95f
EVH
563 return;
564 }
565
5503ac56
EVH
566 pwait->conn = m;
567 pwait->wait_addr = wait_address;
568 init_waitqueue_func_entry(&pwait->wait, p9_pollwake);
569 add_wait_queue(wait_address, &pwait->wait);
570}
8a0dc95f 571
5503ac56
EVH
572/**
573 * p9_conn_create - allocate and initialize the per-session mux data
574 * @client: client instance
575 *
576 * Note: Creates the polling task if this is the first session.
577 */
8a0dc95f 578
5503ac56
EVH
579static struct p9_conn *p9_conn_create(struct p9_client *client)
580{
95820a36 581 int n;
5503ac56 582 struct p9_conn *m;
8a0dc95f 583
5d385153 584 p9_debug(P9_DEBUG_TRANS, "client %p msize %d\n", client, client->msize);
5503ac56
EVH
585 m = kzalloc(sizeof(struct p9_conn), GFP_KERNEL);
586 if (!m)
587 return ERR_PTR(-ENOMEM);
8a0dc95f 588
5503ac56
EVH
589 INIT_LIST_HEAD(&m->mux_list);
590 m->client = client;
8a0dc95f 591
5503ac56
EVH
592 INIT_LIST_HEAD(&m->req_list);
593 INIT_LIST_HEAD(&m->unsent_req_list);
594 INIT_WORK(&m->rq, p9_read_work);
595 INIT_WORK(&m->wq, p9_write_work);
596 INIT_LIST_HEAD(&m->poll_pending_link);
597 init_poll_funcptr(&m->pt, p9_pollwait);
8a0dc95f 598
5503ac56
EVH
599 n = p9_fd_poll(client, &m->pt);
600 if (n & POLLIN) {
5d385153 601 p9_debug(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56
EVH
602 set_bit(Rpending, &m->wsched);
603 }
8a0dc95f 604
5503ac56 605 if (n & POLLOUT) {
5d385153 606 p9_debug(P9_DEBUG_TRANS, "mux %p can write\n", m);
5503ac56
EVH
607 set_bit(Wpending, &m->wsched);
608 }
609
5503ac56
EVH
610 return m;
611}
8a0dc95f 612
5503ac56
EVH
613/**
614 * p9_poll_mux - polls a mux and schedules read or write works if necessary
615 * @m: connection to poll
616 *
617 */
618
619static void p9_poll_mux(struct p9_conn *m)
620{
621 int n;
622
623 if (m->err < 0)
624 return;
625
626 n = p9_fd_poll(m->client, NULL);
627 if (n < 0 || n & (POLLERR | POLLHUP | POLLNVAL)) {
5d385153 628 p9_debug(P9_DEBUG_TRANS, "error mux %p err %d\n", m, n);
5503ac56
EVH
629 if (n >= 0)
630 n = -ECONNRESET;
631 p9_conn_cancel(m, n);
632 }
633
634 if (n & POLLIN) {
635 set_bit(Rpending, &m->wsched);
5d385153 636 p9_debug(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56 637 if (!test_and_set_bit(Rworksched, &m->wsched)) {
5d385153 638 p9_debug(P9_DEBUG_TRANS, "sched read work %p\n", m);
61edeeed 639 schedule_work(&m->rq);
5503ac56
EVH
640 }
641 }
8a0dc95f 642
5503ac56
EVH
643 if (n & POLLOUT) {
644 set_bit(Wpending, &m->wsched);
5d385153 645 p9_debug(P9_DEBUG_TRANS, "mux %p can write\n", m);
f64f9e71
JP
646 if ((m->wsize || !list_empty(&m->unsent_req_list)) &&
647 !test_and_set_bit(Wworksched, &m->wsched)) {
5d385153 648 p9_debug(P9_DEBUG_TRANS, "sched write work %p\n", m);
61edeeed 649 schedule_work(&m->wq);
5503ac56
EVH
650 }
651 }
8a0dc95f
EVH
652}
653
654/**
91b8534f 655 * p9_fd_request - send 9P request
8a0dc95f
EVH
656 * The function can sleep until the request is scheduled for sending.
657 * The function can be interrupted. Return from the function is not
91b8534f 658 * a guarantee that the request is sent successfully.
8a0dc95f 659 *
91b8534f
EVH
660 * @client: client instance
661 * @req: request to be sent
ee443996 662 *
8a0dc95f 663 */
ee443996 664
91b8534f 665static int p9_fd_request(struct p9_client *client, struct p9_req_t *req)
8a0dc95f
EVH
666{
667 int n;
91b8534f
EVH
668 struct p9_trans_fd *ts = client->trans;
669 struct p9_conn *m = ts->conn;
8a0dc95f 670
5d385153
JP
671 p9_debug(P9_DEBUG_TRANS, "mux %p task %p tcall %p id %d\n",
672 m, current, req->tc, req->tc->id);
8a0dc95f 673 if (m->err < 0)
91b8534f 674 return m->err;
8a0dc95f 675
91b8534f 676 spin_lock(&client->lock);
7eb923b8 677 req->status = REQ_STATUS_UNSENT;
8a0dc95f 678 list_add_tail(&req->req_list, &m->unsent_req_list);
91b8534f 679 spin_unlock(&client->lock);
8a0dc95f
EVH
680
681 if (test_and_clear_bit(Wpending, &m->wsched))
682 n = POLLOUT;
683 else
8b81ef58 684 n = p9_fd_poll(m->client, NULL);
8a0dc95f
EVH
685
686 if (n & POLLOUT && !test_and_set_bit(Wworksched, &m->wsched))
61edeeed 687 schedule_work(&m->wq);
8a0dc95f 688
91b8534f 689 return 0;
8a0dc95f
EVH
690}
691
91b8534f 692static int p9_fd_cancel(struct p9_client *client, struct p9_req_t *req)
8a0dc95f 693{
7eb923b8 694 int ret = 1;
8a0dc95f 695
5d385153 696 p9_debug(P9_DEBUG_TRANS, "client %p req %p\n", client, req);
8a0dc95f 697
91b8534f 698 spin_lock(&client->lock);
91b8534f 699
91b8534f 700 if (req->status == REQ_STATUS_UNSENT) {
1bab88b2 701 list_del(&req->req_list);
91b8534f 702 req->status = REQ_STATUS_FLSHD;
7eb923b8 703 ret = 0;
1bab88b2
LI
704 } else if (req->status == REQ_STATUS_SENT)
705 req->status = REQ_STATUS_FLSH;
8a0dc95f 706
7eb923b8
EVH
707 spin_unlock(&client->lock);
708
709 return ret;
8a0dc95f
EVH
710}
711
a80d923e 712/**
0e15597e
AK
713 * parse_opts - parse mount options into p9_fd_opts structure
714 * @params: options string passed from mount
715 * @opts: fd transport-specific structure to parse options into
a80d923e 716 *
bb8ffdfc 717 * Returns 0 upon success, -ERRNO upon failure
a80d923e 718 */
bd238fb4 719
bb8ffdfc 720static int parse_opts(char *params, struct p9_fd_opts *opts)
bd238fb4 721{
a80d923e
EVH
722 char *p;
723 substring_t args[MAX_OPT_ARGS];
724 int option;
d8c8a9e3 725 char *options, *tmp_options;
bd238fb4 726
a80d923e
EVH
727 opts->port = P9_PORT;
728 opts->rfd = ~0;
729 opts->wfd = ~0;
bd238fb4 730
bb8ffdfc
EVH
731 if (!params)
732 return 0;
733
d8c8a9e3
EVH
734 tmp_options = kstrdup(params, GFP_KERNEL);
735 if (!tmp_options) {
5d385153
JP
736 p9_debug(P9_DEBUG_ERROR,
737 "failed to allocate copy of option string\n");
bb8ffdfc
EVH
738 return -ENOMEM;
739 }
d8c8a9e3 740 options = tmp_options;
bd238fb4 741
a80d923e
EVH
742 while ((p = strsep(&options, ",")) != NULL) {
743 int token;
bb8ffdfc 744 int r;
a80d923e
EVH
745 if (!*p)
746 continue;
747 token = match_token(p, tokens, args);
2f28c8b3 748 if ((token != Opt_err) && (token != Opt_privport)) {
15da4b16
AK
749 r = match_int(&args[0], &option);
750 if (r < 0) {
5d385153
JP
751 p9_debug(P9_DEBUG_ERROR,
752 "integer field, but no integer?\n");
15da4b16
AK
753 continue;
754 }
a80d923e
EVH
755 }
756 switch (token) {
757 case Opt_port:
758 opts->port = option;
759 break;
760 case Opt_rfdno:
761 opts->rfd = option;
762 break;
763 case Opt_wfdno:
764 opts->wfd = option;
765 break;
2f28c8b3
JG
766 case Opt_privport:
767 opts->privport = 1;
768 break;
a80d923e
EVH
769 default:
770 continue;
771 }
bd238fb4 772 }
d8c8a9e3
EVH
773
774 kfree(tmp_options);
bb8ffdfc 775 return 0;
bd238fb4 776}
bd238fb4 777
8b81ef58 778static int p9_fd_open(struct p9_client *client, int rfd, int wfd)
bd238fb4 779{
a80d923e
EVH
780 struct p9_trans_fd *ts = kmalloc(sizeof(struct p9_trans_fd),
781 GFP_KERNEL);
782 if (!ts)
783 return -ENOMEM;
bd238fb4 784
a80d923e
EVH
785 ts->rd = fget(rfd);
786 ts->wr = fget(wfd);
787 if (!ts->rd || !ts->wr) {
788 if (ts->rd)
789 fput(ts->rd);
790 if (ts->wr)
791 fput(ts->wr);
792 kfree(ts);
793 return -EIO;
bd238fb4
LI
794 }
795
8b81ef58
EVH
796 client->trans = ts;
797 client->status = Connected;
bd238fb4 798
a80d923e 799 return 0;
bd238fb4 800}
bd238fb4 801
8b81ef58 802static int p9_socket_open(struct p9_client *client, struct socket *csocket)
bd238fb4 803{
6b18662e 804 struct p9_trans_fd *p;
56b31d1c
AV
805 struct file *file;
806 int ret;
6b18662e
AV
807
808 p = kmalloc(sizeof(struct p9_trans_fd), GFP_KERNEL);
809 if (!p)
810 return -ENOMEM;
bd238fb4
LI
811
812 csocket->sk->sk_allocation = GFP_NOIO;
aab174f0 813 file = sock_alloc_file(csocket, 0, NULL);
56b31d1c 814 if (IS_ERR(file)) {
5d385153
JP
815 pr_err("%s (%d): failed to map fd\n",
816 __func__, task_pid_nr(current));
6b18662e
AV
817 sock_release(csocket);
818 kfree(p);
56b31d1c 819 return PTR_ERR(file);
bd238fb4
LI
820 }
821
56b31d1c
AV
822 get_file(file);
823 p->wr = p->rd = file;
6b18662e
AV
824 client->trans = p;
825 client->status = Connected;
826
6b18662e
AV
827 p->rd->f_flags |= O_NONBLOCK;
828
829 p->conn = p9_conn_create(client);
830 if (IS_ERR(p->conn)) {
831 ret = PTR_ERR(p->conn);
832 p->conn = NULL;
833 kfree(p);
834 sockfd_put(csocket);
bd238fb4
LI
835 sockfd_put(csocket);
836 return ret;
837 }
bd238fb4
LI
838 return 0;
839}
840
bd238fb4 841/**
5503ac56
EVH
842 * p9_mux_destroy - cancels all pending requests and frees mux resources
843 * @m: mux to destroy
bd238fb4
LI
844 *
845 */
ee443996 846
5503ac56 847static void p9_conn_destroy(struct p9_conn *m)
bd238fb4 848{
5d385153
JP
849 p9_debug(P9_DEBUG_TRANS, "mux %p prev %p next %p\n",
850 m, m->mux_list.prev, m->mux_list.next);
bd238fb4 851
5503ac56
EVH
852 p9_mux_poll_stop(m);
853 cancel_work_sync(&m->rq);
854 cancel_work_sync(&m->wq);
bd238fb4 855
5503ac56 856 p9_conn_cancel(m, -ECONNRESET);
bd238fb4 857
5503ac56 858 m->client = NULL;
5503ac56 859 kfree(m);
bd238fb4
LI
860}
861
862/**
8b81ef58
EVH
863 * p9_fd_close - shutdown file descriptor transport
864 * @client: client instance
bd238fb4
LI
865 *
866 */
ee443996 867
8b81ef58 868static void p9_fd_close(struct p9_client *client)
bd238fb4
LI
869{
870 struct p9_trans_fd *ts;
871
8b81ef58 872 if (!client)
bd238fb4
LI
873 return;
874
8b81ef58 875 ts = client->trans;
bd238fb4
LI
876 if (!ts)
877 return;
878
8b81ef58
EVH
879 client->status = Disconnected;
880
8a0dc95f
EVH
881 p9_conn_destroy(ts->conn);
882
bd238fb4
LI
883 if (ts->rd)
884 fput(ts->rd);
885 if (ts->wr)
886 fput(ts->wr);
8b81ef58 887
bd238fb4
LI
888 kfree(ts);
889}
890
887b3ece
EVH
/*
 * valid_ipaddr4 - check that a string starts with a dotted-quad IPv4 address
 * @buf: NUL-terminated candidate string
 *
 * Each of the four fields must be in the range 0..255.  "%d" also accepts a
 * sign, so negative fields have to be rejected explicitly.
 *
 * Returns 0 when the address is acceptable, -EINVAL otherwise.
 *
 * stolen from NFS - maybe should be made a generic function?
 */
static inline int valid_ipaddr4(const char *buf)
{
	int rc, count, in[4];

	rc = sscanf(buf, "%d.%d.%d.%d", &in[0], &in[1], &in[2], &in[3]);
	if (rc != 4)
		return -EINVAL;
	for (count = 0; count < 4; count++) {
		if (in[count] < 0 || in[count] > 255)
			return -EINVAL;
	}
	return 0;
}
907
2f28c8b3
JG
908static int p9_bind_privport(struct socket *sock)
909{
910 struct sockaddr_in cl;
911 int port, err = -EINVAL;
912
913 memset(&cl, 0, sizeof(cl));
914 cl.sin_family = AF_INET;
915 cl.sin_addr.s_addr = INADDR_ANY;
916 for (port = p9_ipport_resv_max; port >= p9_ipport_resv_min; port--) {
917 cl.sin_port = htons((ushort)port);
918 err = kernel_bind(sock, (struct sockaddr *)&cl, sizeof(cl));
919 if (err != -EADDRINUSE)
920 break;
921 }
922 return err;
923}
924
925
8b81ef58
EVH
926static int
927p9_fd_create_tcp(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
928{
929 int err;
a80d923e
EVH
930 struct socket *csocket;
931 struct sockaddr_in sin_server;
932 struct p9_fd_opts opts;
933
bb8ffdfc
EVH
934 err = parse_opts(args, &opts);
935 if (err < 0)
8b81ef58 936 return err;
a80d923e 937
887b3ece 938 if (valid_ipaddr4(addr) < 0)
8b81ef58 939 return -EINVAL;
887b3ece 940
a80d923e 941 csocket = NULL;
a80d923e
EVH
942
943 sin_server.sin_family = AF_INET;
944 sin_server.sin_addr.s_addr = in_aton(addr);
945 sin_server.sin_port = htons(opts.port);
e75762fd
RL
946 err = __sock_create(read_pnet(&current->nsproxy->net_ns), PF_INET,
947 SOCK_STREAM, IPPROTO_TCP, &csocket, 1);
6b18662e 948 if (err) {
5d385153
JP
949 pr_err("%s (%d): problem creating socket\n",
950 __func__, task_pid_nr(current));
6b18662e 951 return err;
a80d923e
EVH
952 }
953
2f28c8b3
JG
954 if (opts.privport) {
955 err = p9_bind_privport(csocket);
956 if (err < 0) {
957 pr_err("%s (%d): problem binding to privport\n",
958 __func__, task_pid_nr(current));
959 sock_release(csocket);
960 return err;
961 }
962 }
963
a80d923e
EVH
964 err = csocket->ops->connect(csocket,
965 (struct sockaddr *)&sin_server,
966 sizeof(struct sockaddr_in), 0);
967 if (err < 0) {
5d385153
JP
968 pr_err("%s (%d): problem connecting socket to %s\n",
969 __func__, task_pid_nr(current), addr);
a80d923e 970 sock_release(csocket);
6b18662e
AV
971 return err;
972 }
a80d923e 973
6b18662e 974 return p9_socket_open(client, csocket);
a80d923e
EVH
975}
976
8b81ef58
EVH
977static int
978p9_fd_create_unix(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
979{
980 int err;
981 struct socket *csocket;
982 struct sockaddr_un sun_server;
a80d923e
EVH
983
984 csocket = NULL;
a80d923e 985
cff6b8a9 986 if (strlen(addr) >= UNIX_PATH_MAX) {
5d385153
JP
987 pr_err("%s (%d): address too long: %s\n",
988 __func__, task_pid_nr(current), addr);
6b18662e 989 return -ENAMETOOLONG;
a80d923e
EVH
990 }
991
992 sun_server.sun_family = PF_UNIX;
993 strcpy(sun_server.sun_path, addr);
e75762fd
RL
994 err = __sock_create(read_pnet(&current->nsproxy->net_ns), PF_UNIX,
995 SOCK_STREAM, 0, &csocket, 1);
6b18662e 996 if (err < 0) {
5d385153
JP
997 pr_err("%s (%d): problem creating socket\n",
998 __func__, task_pid_nr(current));
999
6b18662e
AV
1000 return err;
1001 }
a80d923e
EVH
1002 err = csocket->ops->connect(csocket, (struct sockaddr *)&sun_server,
1003 sizeof(struct sockaddr_un) - 1, 0);
1004 if (err < 0) {
5d385153
JP
1005 pr_err("%s (%d): problem connecting socket: %s: %d\n",
1006 __func__, task_pid_nr(current), addr, err);
a80d923e 1007 sock_release(csocket);
6b18662e
AV
1008 return err;
1009 }
a80d923e 1010
6b18662e 1011 return p9_socket_open(client, csocket);
a80d923e
EVH
1012}
1013
8b81ef58
EVH
1014static int
1015p9_fd_create(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
1016{
1017 int err;
a80d923e 1018 struct p9_fd_opts opts;
6b18662e 1019 struct p9_trans_fd *p;
a80d923e
EVH
1020
1021 parse_opts(args, &opts);
1022
1023 if (opts.rfd == ~0 || opts.wfd == ~0) {
5d385153 1024 pr_err("Insufficient options for proto=fd\n");
8b81ef58 1025 return -ENOPROTOOPT;
a80d923e
EVH
1026 }
1027
8b81ef58 1028 err = p9_fd_open(client, opts.rfd, opts.wfd);
a80d923e 1029 if (err < 0)
6b18662e 1030 return err;
a80d923e 1031
8b81ef58
EVH
1032 p = (struct p9_trans_fd *) client->trans;
1033 p->conn = p9_conn_create(client);
8a0dc95f
EVH
1034 if (IS_ERR(p->conn)) {
1035 err = PTR_ERR(p->conn);
1036 p->conn = NULL;
6b18662e
AV
1037 fput(p->rd);
1038 fput(p->wr);
1039 return err;
8a0dc95f
EVH
1040 }
1041
8b81ef58 1042 return 0;
a80d923e
EVH
1043}
1044
1045static struct p9_trans_module p9_tcp_trans = {
1046 .name = "tcp",
1047 .maxsize = MAX_SOCK_BUF,
f94741fd 1048 .def = 0,
8b81ef58
EVH
1049 .create = p9_fd_create_tcp,
1050 .close = p9_fd_close,
91b8534f
EVH
1051 .request = p9_fd_request,
1052 .cancel = p9_fd_cancel,
72029fe8 1053 .owner = THIS_MODULE,
a80d923e
EVH
1054};
1055
1056static struct p9_trans_module p9_unix_trans = {
1057 .name = "unix",
1058 .maxsize = MAX_SOCK_BUF,
1059 .def = 0,
8b81ef58
EVH
1060 .create = p9_fd_create_unix,
1061 .close = p9_fd_close,
91b8534f
EVH
1062 .request = p9_fd_request,
1063 .cancel = p9_fd_cancel,
72029fe8 1064 .owner = THIS_MODULE,
a80d923e
EVH
1065};
1066
1067static struct p9_trans_module p9_fd_trans = {
1068 .name = "fd",
1069 .maxsize = MAX_SOCK_BUF,
1070 .def = 0,
8b81ef58
EVH
1071 .create = p9_fd_create,
1072 .close = p9_fd_close,
91b8534f
EVH
1073 .request = p9_fd_request,
1074 .cancel = p9_fd_cancel,
72029fe8 1075 .owner = THIS_MODULE,
a80d923e
EVH
1076};
1077
5503ac56
EVH
1078/**
1079 * p9_poll_proc - poll worker thread
1080 * @a: thread state and arguments
1081 *
1082 * polls all v9fs transports for new events and queues the appropriate
1083 * work to the work queue
1084 *
1085 */
1086
aa70c585 1087static void p9_poll_workfn(struct work_struct *work)
5503ac56
EVH
1088{
1089 unsigned long flags;
1090
5d385153 1091 p9_debug(P9_DEBUG_TRANS, "start %p\n", current);
aa70c585 1092
5503ac56
EVH
1093 spin_lock_irqsave(&p9_poll_lock, flags);
1094 while (!list_empty(&p9_poll_pending_list)) {
1095 struct p9_conn *conn = list_first_entry(&p9_poll_pending_list,
1096 struct p9_conn,
1097 poll_pending_link);
1098 list_del_init(&conn->poll_pending_link);
1099 spin_unlock_irqrestore(&p9_poll_lock, flags);
1100
1101 p9_poll_mux(conn);
1102
1103 spin_lock_irqsave(&p9_poll_lock, flags);
1104 }
1105 spin_unlock_irqrestore(&p9_poll_lock, flags);
1106
5d385153 1107 p9_debug(P9_DEBUG_TRANS, "finish\n");
5503ac56
EVH
1108}
1109
887b3ece 1110int p9_trans_fd_init(void)
a80d923e
EVH
1111{
1112 v9fs_register_trans(&p9_tcp_trans);
1113 v9fs_register_trans(&p9_unix_trans);
1114 v9fs_register_trans(&p9_fd_trans);
1115
3387b804 1116 return 0;
a80d923e 1117}
72029fe8
TH
1118
1119void p9_trans_fd_exit(void)
1120{
43829731 1121 flush_work(&p9_poll_work);
72029fe8
TH
1122 v9fs_unregister_trans(&p9_tcp_trans);
1123 v9fs_unregister_trans(&p9_unix_trans);
1124 v9fs_unregister_trans(&p9_fd_trans);
1125}