]> bbs.cooldavid.org Git - net-next-2.6.git/blame - net/9p/trans_fd.c
merge sock_alloc_fd/sock_attach_fd into a new helper
[net-next-2.6.git] / net / 9p / trans_fd.c
CommitLineData
bd238fb4
LI
1/*
2 * linux/net/9p/trans_fd.c
3 *
4 * Fd transport layer. Includes deprecated socket layer.
5 *
6 * Copyright (C) 2006 by Russ Cox <rsc@swtch.com>
7 * Copyright (C) 2004-2005 by Latchesar Ionkov <lucho@ionkov.net>
8a0dc95f 8 * Copyright (C) 2004-2008 by Eric Van Hensbergen <ericvh@gmail.com>
bd238fb4
LI
9 * Copyright (C) 1997-2002 by Ron Minnich <rminnich@sarnoff.com>
10 *
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License version 2
13 * as published by the Free Software Foundation.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to:
22 * Free Software Foundation
23 * 51 Franklin Street, Fifth Floor
24 * Boston, MA 02111-1301 USA
25 *
26 */
27
28#include <linux/in.h>
29#include <linux/module.h>
30#include <linux/net.h>
31#include <linux/ipv6.h>
8a0dc95f 32#include <linux/kthread.h>
bd238fb4
LI
33#include <linux/errno.h>
34#include <linux/kernel.h>
35#include <linux/un.h>
36#include <linux/uaccess.h>
37#include <linux/inet.h>
38#include <linux/idr.h>
39#include <linux/file.h>
a80d923e 40#include <linux/parser.h>
bd238fb4 41#include <net/9p/9p.h>
8b81ef58 42#include <net/9p/client.h>
bd238fb4
LI
43#include <net/9p/transport.h>
44
/* Port used when the mount options do not carry a port= value */
#define P9_PORT 564
/* Value reported as .maxsize by every transport defined in this file */
#define MAX_SOCK_BUF (64 * 1024)
/* Number of poll wait-queue slots kept per connection */
#define MAXPOLLWADDR 2
a80d923e 48
ee443996
EVH
49/**
50 * struct p9_fd_opts - per-transport options
51 * @rfd: file descriptor for reading (trans=fd)
52 * @wfd: file descriptor for writing (trans=fd)
53 * @port: port to connect to (trans=tcp)
54 *
55 */
56
a80d923e
EVH
57struct p9_fd_opts {
58 int rfd;
59 int wfd;
60 u16 port;
61};
bd238fb4 62
ee443996
EVH
/**
 * struct p9_trans_fd - per-client transport state
 * @rd: file the transport reads from
 * @wr: file the transport writes to (the same file as @rd for sockets)
 * @conn: mux/connection state created by p9_conn_create()
 *
 */

struct p9_trans_fd {
	struct file *rd;
	struct file *wr;
	struct p9_conn *conn;
};
76
a80d923e
EVH
/*
 * Option parsing (code inspired by the NFS code).
 * Slightly lazy: every fd-transport option is parsed, whichever transport
 * is actually being set up.
 */

enum {
	/* Options that take integer arguments */
	Opt_port,
	Opt_rfdno,
	Opt_wfdno,
	/* Terminator of the token table below */
	Opt_err,
};
bd238fb4 86
a447c093 87static const match_table_t tokens = {
a80d923e
EVH
88 {Opt_port, "port=%u"},
89 {Opt_rfdno, "rfdno=%u"},
90 {Opt_wfdno, "wfdno=%u"},
55762690 91 {Opt_err, NULL},
a80d923e 92};
bd238fb4 93
8a0dc95f
EVH
/*
 * Scheduling state kept in p9_conn.wsched.  The values are passed to
 * set_bit()/clear_bit()/test_and_set_bit() as bit numbers.
 */
enum {
	Rworksched = 1,		/* read work scheduled or running */
	Rpending   = 2,		/* can read */
	Wworksched = 4,		/* write work scheduled or running */
	Wpending   = 8,		/* can write */
};
100
992b3f1d
TH
101struct p9_poll_wait {
102 struct p9_conn *conn;
103 wait_queue_t wait;
104 wait_queue_head_t *wait_addr;
ee443996
EVH
105};
106
107/**
108 * struct p9_conn - fd mux connection state information
ee443996 109 * @mux_list: list link for mux to manage multiple connections (?)
8b81ef58 110 * @client: reference to client instance for this connection
ee443996 111 * @err: error state
ee443996
EVH
112 * @req_list: accounting for requests which have been sent
113 * @unsent_req_list: accounting for requests that haven't been sent
1b0a763b
EVH
114 * @req: current request being processed (if any)
115 * @tmp_buf: temporary buffer to read in header
116 * @rsize: amount to read for current frame
ee443996
EVH
117 * @rpos: read position in current frame
118 * @rbuf: current read buffer
119 * @wpos: write position for current frame
120 * @wsize: amount of data to write for current frame
121 * @wbuf: current write buffer
0e15597e 122 * @poll_pending_link: pending links to be polled per conn
ee443996 123 * @poll_wait: array of wait_q's for various worker threads
ee443996
EVH
124 * @pt: poll state
125 * @rq: current read work
126 * @wq: current write work
127 * @wsched: ????
128 *
129 */
8a0dc95f
EVH
130
131struct p9_conn {
8a0dc95f 132 struct list_head mux_list;
8b81ef58 133 struct p9_client *client;
8a0dc95f 134 int err;
8a0dc95f
EVH
135 struct list_head req_list;
136 struct list_head unsent_req_list;
1b0a763b
EVH
137 struct p9_req_t *req;
138 char tmp_buf[7];
139 int rsize;
8a0dc95f
EVH
140 int rpos;
141 char *rbuf;
142 int wpos;
143 int wsize;
144 char *wbuf;
992b3f1d
TH
145 struct list_head poll_pending_link;
146 struct p9_poll_wait poll_wait[MAXPOLLWADDR];
8a0dc95f
EVH
147 poll_table pt;
148 struct work_struct rq;
149 struct work_struct wq;
150 unsigned long wsched;
151};
152
992b3f1d
TH
/* Protects p9_poll_pending_list and each connection's poll_pending_link */
static DEFINE_SPINLOCK(p9_poll_lock);
/* Connections that were woken up and still have to be polled */
static LIST_HEAD(p9_poll_pending_list);
/* Workqueue the read and write work items are queued on */
static struct workqueue_struct *p9_mux_wq;
/* Kernel thread running p9_poll_proc() */
static struct task_struct *p9_poll_task;
8a0dc95f 157
992b3f1d 158static void p9_mux_poll_stop(struct p9_conn *m)
8a0dc95f 159{
992b3f1d
TH
160 unsigned long flags;
161 int i;
8a0dc95f 162
992b3f1d
TH
163 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
164 struct p9_poll_wait *pwait = &m->poll_wait[i];
8a0dc95f 165
992b3f1d
TH
166 if (pwait->wait_addr) {
167 remove_wait_queue(pwait->wait_addr, &pwait->wait);
168 pwait->wait_addr = NULL;
8a0dc95f 169 }
8a0dc95f
EVH
170 }
171
992b3f1d
TH
172 spin_lock_irqsave(&p9_poll_lock, flags);
173 list_del_init(&m->poll_pending_link);
174 spin_unlock_irqrestore(&p9_poll_lock, flags);
8a0dc95f
EVH
175}
176
177/**
5503ac56
EVH
178 * p9_conn_cancel - cancel all pending requests with error
179 * @m: mux data
180 * @err: error code
8a0dc95f 181 *
8a0dc95f 182 */
ee443996 183
51a87c55 184static void p9_conn_cancel(struct p9_conn *m, int err)
8a0dc95f 185{
673d62cd 186 struct p9_req_t *req, *rtmp;
91b8534f 187 unsigned long flags;
5503ac56 188 LIST_HEAD(cancel_list);
8a0dc95f 189
5503ac56 190 P9_DPRINTK(P9_DEBUG_ERROR, "mux %p err %d\n", m, err);
7eb923b8 191
91b8534f 192 spin_lock_irqsave(&m->client->lock, flags);
7eb923b8
EVH
193
194 if (m->err) {
195 spin_unlock_irqrestore(&m->client->lock, flags);
196 return;
197 }
198
199 m->err = err;
200
5503ac56 201 list_for_each_entry_safe(req, rtmp, &m->req_list, req_list) {
673d62cd
EVH
202 req->status = REQ_STATUS_ERROR;
203 if (!req->t_err)
204 req->t_err = err;
5503ac56
EVH
205 list_move(&req->req_list, &cancel_list);
206 }
207 list_for_each_entry_safe(req, rtmp, &m->unsent_req_list, req_list) {
673d62cd
EVH
208 req->status = REQ_STATUS_ERROR;
209 if (!req->t_err)
210 req->t_err = err;
5503ac56 211 list_move(&req->req_list, &cancel_list);
8a0dc95f 212 }
91b8534f 213 spin_unlock_irqrestore(&m->client->lock, flags);
8a0dc95f 214
5503ac56 215 list_for_each_entry_safe(req, rtmp, &cancel_list, req_list) {
91b8534f 216 P9_DPRINTK(P9_DEBUG_ERROR, "call back req %p\n", req);
1bab88b2 217 list_del(&req->req_list);
91b8534f 218 p9_client_cb(m->client, req);
8a0dc95f 219 }
8a0dc95f
EVH
220}
221
5503ac56
EVH
222static unsigned int
223p9_fd_poll(struct p9_client *client, struct poll_table_struct *pt)
8a0dc95f 224{
5503ac56
EVH
225 int ret, n;
226 struct p9_trans_fd *ts = NULL;
8a0dc95f 227
5503ac56
EVH
228 if (client && client->status == Connected)
229 ts = client->trans;
7dc5d24b 230
5503ac56
EVH
231 if (!ts)
232 return -EREMOTEIO;
7dc5d24b 233
5503ac56
EVH
234 if (!ts->rd->f_op || !ts->rd->f_op->poll)
235 return -EIO;
8a0dc95f 236
5503ac56
EVH
237 if (!ts->wr->f_op || !ts->wr->f_op->poll)
238 return -EIO;
992b3f1d 239
5503ac56
EVH
240 ret = ts->rd->f_op->poll(ts->rd, pt);
241 if (ret < 0)
242 return ret;
992b3f1d 243
5503ac56
EVH
244 if (ts->rd != ts->wr) {
245 n = ts->wr->f_op->poll(ts->wr, pt);
246 if (n < 0)
247 return n;
248 ret = (ret & ~POLLOUT) | (n & ~POLLIN);
249 }
250
251 return ret;
992b3f1d
TH
252}
253
8a0dc95f 254/**
5503ac56
EVH
255 * p9_fd_read- read from a fd
256 * @client: client instance
257 * @v: buffer to receive data into
258 * @len: size of receive buffer
ee443996 259 *
8a0dc95f 260 */
ee443996 261
5503ac56 262static int p9_fd_read(struct p9_client *client, void *v, int len)
8a0dc95f 263{
5503ac56
EVH
264 int ret;
265 struct p9_trans_fd *ts = NULL;
8a0dc95f 266
5503ac56
EVH
267 if (client && client->status != Disconnected)
268 ts = client->trans;
8a0dc95f 269
5503ac56
EVH
270 if (!ts)
271 return -EREMOTEIO;
8a0dc95f 272
5503ac56
EVH
273 if (!(ts->rd->f_flags & O_NONBLOCK))
274 P9_DPRINTK(P9_DEBUG_ERROR, "blocking read ...\n");
8a0dc95f 275
5503ac56
EVH
276 ret = kernel_read(ts->rd, ts->rd->f_pos, v, len);
277 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
278 client->status = Disconnected;
279 return ret;
8a0dc95f
EVH
280}
281
282/**
5503ac56
EVH
283 * p9_read_work - called when there is some data to be read from a transport
284 * @work: container of work to be done
ee443996 285 *
8a0dc95f 286 */
ee443996 287
5503ac56 288static void p9_read_work(struct work_struct *work)
8a0dc95f 289{
5503ac56
EVH
290 int n, err;
291 struct p9_conn *m;
5503ac56
EVH
292
293 m = container_of(work, struct p9_conn, rq);
8a0dc95f
EVH
294
295 if (m->err < 0)
296 return;
297
51a87c55 298 P9_DPRINTK(P9_DEBUG_TRANS, "start mux %p pos %d\n", m, m->rpos);
8a0dc95f 299
1b0a763b
EVH
300 if (!m->rbuf) {
301 m->rbuf = m->tmp_buf;
5503ac56 302 m->rpos = 0;
1b0a763b 303 m->rsize = 7; /* start by reading header */
8a0dc95f
EVH
304 }
305
5503ac56 306 clear_bit(Rpending, &m->wsched);
51a87c55 307 P9_DPRINTK(P9_DEBUG_TRANS, "read mux %p pos %d size: %d = %d\n", m,
1b0a763b 308 m->rpos, m->rsize, m->rsize-m->rpos);
5503ac56 309 err = p9_fd_read(m->client, m->rbuf + m->rpos,
1b0a763b 310 m->rsize - m->rpos);
51a87c55 311 P9_DPRINTK(P9_DEBUG_TRANS, "mux %p got %d bytes\n", m, err);
5503ac56
EVH
312 if (err == -EAGAIN) {
313 clear_bit(Rworksched, &m->wsched);
314 return;
8a0dc95f 315 }
8a0dc95f 316
5503ac56
EVH
317 if (err <= 0)
318 goto error;
319
320 m->rpos += err;
1b0a763b
EVH
321
322 if ((!m->req) && (m->rpos == m->rsize)) { /* header read in */
323 u16 tag;
51a87c55 324 P9_DPRINTK(P9_DEBUG_TRANS, "got new header\n");
1b0a763b
EVH
325
326 n = le32_to_cpu(*(__le32 *) m->rbuf); /* read packet size */
5503ac56
EVH
327 if (n >= m->client->msize) {
328 P9_DPRINTK(P9_DEBUG_ERROR,
329 "requested packet size too big: %d\n", n);
330 err = -EIO;
331 goto error;
332 }
333
1b0a763b 334 tag = le16_to_cpu(*(__le16 *) (m->rbuf+5)); /* read tag */
51a87c55
EVH
335 P9_DPRINTK(P9_DEBUG_TRANS,
336 "mux %p pkt: size: %d bytes tag: %d\n", m, n, tag);
1b0a763b
EVH
337
338 m->req = p9_tag_lookup(m->client, tag);
1bab88b2
LI
339 if (!m->req || (m->req->status != REQ_STATUS_SENT &&
340 m->req->status != REQ_STATUS_FLSH)) {
1b0a763b
EVH
341 P9_DPRINTK(P9_DEBUG_ERROR, "Unexpected packet tag %d\n",
342 tag);
343 err = -EIO;
344 goto error;
345 }
346
347 if (m->req->rc == NULL) {
348 m->req->rc = kmalloc(sizeof(struct p9_fcall) +
349 m->client->msize, GFP_KERNEL);
350 if (!m->req->rc) {
351 m->req = NULL;
352 err = -ENOMEM;
353 goto error;
354 }
355 }
356 m->rbuf = (char *)m->req->rc + sizeof(struct p9_fcall);
357 memcpy(m->rbuf, m->tmp_buf, m->rsize);
358 m->rsize = n;
359 }
5503ac56 360
1b0a763b
EVH
361 /* not an else because some packets (like clunk) have no payload */
362 if ((m->req) && (m->rpos == m->rsize)) { /* packet is read in */
51a87c55 363 P9_DPRINTK(P9_DEBUG_TRANS, "got new packet\n");
7eb923b8 364 spin_lock(&m->client->lock);
1bab88b2
LI
365 if (m->req->status != REQ_STATUS_ERROR)
366 m->req->status = REQ_STATUS_RCVD;
91b8534f 367 list_del(&m->req->req_list);
7eb923b8 368 spin_unlock(&m->client->lock);
91b8534f 369 p9_client_cb(m->client, m->req);
1b0a763b
EVH
370 m->rbuf = NULL;
371 m->rpos = 0;
372 m->rsize = 0;
1b0a763b 373 m->req = NULL;
5503ac56
EVH
374 }
375
376 if (!list_empty(&m->req_list)) {
377 if (test_and_clear_bit(Rpending, &m->wsched))
378 n = POLLIN;
379 else
380 n = p9_fd_poll(m->client, NULL);
381
382 if (n & POLLIN) {
51a87c55 383 P9_DPRINTK(P9_DEBUG_TRANS, "sched read work %p\n", m);
5503ac56
EVH
384 queue_work(p9_mux_wq, &m->rq);
385 } else
386 clear_bit(Rworksched, &m->wsched);
387 } else
388 clear_bit(Rworksched, &m->wsched);
389
390 return;
5503ac56
EVH
391error:
392 p9_conn_cancel(m, err);
393 clear_bit(Rworksched, &m->wsched);
394}
395
396/**
397 * p9_fd_write - write to a socket
398 * @client: client instance
399 * @v: buffer to send data from
400 * @len: size of send buffer
ee443996 401 *
8a0dc95f 402 */
ee443996 403
5503ac56 404static int p9_fd_write(struct p9_client *client, void *v, int len)
8a0dc95f 405{
5503ac56
EVH
406 int ret;
407 mm_segment_t oldfs;
408 struct p9_trans_fd *ts = NULL;
8a0dc95f 409
5503ac56
EVH
410 if (client && client->status != Disconnected)
411 ts = client->trans;
8a0dc95f 412
5503ac56
EVH
413 if (!ts)
414 return -EREMOTEIO;
8a0dc95f 415
5503ac56
EVH
416 if (!(ts->wr->f_flags & O_NONBLOCK))
417 P9_DPRINTK(P9_DEBUG_ERROR, "blocking write ...\n");
992b3f1d 418
5503ac56
EVH
419 oldfs = get_fs();
420 set_fs(get_ds());
421 /* The cast to a user pointer is valid due to the set_fs() */
e3db6cb4 422 ret = vfs_write(ts->wr, (__force void __user *)v, len, &ts->wr->f_pos);
5503ac56 423 set_fs(oldfs);
992b3f1d 424
5503ac56
EVH
425 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
426 client->status = Disconnected;
427 return ret;
8a0dc95f
EVH
428}
429
430/**
431 * p9_write_work - called when a transport can send some data
ee443996
EVH
432 * @work: container for work to be done
433 *
8a0dc95f 434 */
ee443996 435
8a0dc95f
EVH
436static void p9_write_work(struct work_struct *work)
437{
438 int n, err;
439 struct p9_conn *m;
673d62cd 440 struct p9_req_t *req;
8a0dc95f
EVH
441
442 m = container_of(work, struct p9_conn, wq);
443
444 if (m->err < 0) {
445 clear_bit(Wworksched, &m->wsched);
446 return;
447 }
448
449 if (!m->wsize) {
450 if (list_empty(&m->unsent_req_list)) {
451 clear_bit(Wworksched, &m->wsched);
452 return;
453 }
454
673d62cd
EVH
455 spin_lock(&m->client->lock);
456 req = list_entry(m->unsent_req_list.next, struct p9_req_t,
8a0dc95f 457 req_list);
673d62cd 458 req->status = REQ_STATUS_SENT;
1bab88b2 459 P9_DPRINTK(P9_DEBUG_TRANS, "move req %p\n", req);
8a0dc95f 460 list_move_tail(&req->req_list, &m->req_list);
8a0dc95f 461
673d62cd
EVH
462 m->wbuf = req->tc->sdata;
463 m->wsize = req->tc->size;
8a0dc95f 464 m->wpos = 0;
673d62cd 465 spin_unlock(&m->client->lock);
8a0dc95f
EVH
466 }
467
51a87c55 468 P9_DPRINTK(P9_DEBUG_TRANS, "mux %p pos %d size %d\n", m, m->wpos,
8a0dc95f
EVH
469 m->wsize);
470 clear_bit(Wpending, &m->wsched);
8b81ef58 471 err = p9_fd_write(m->client, m->wbuf + m->wpos, m->wsize - m->wpos);
51a87c55 472 P9_DPRINTK(P9_DEBUG_TRANS, "mux %p sent %d bytes\n", m, err);
8a0dc95f
EVH
473 if (err == -EAGAIN) {
474 clear_bit(Wworksched, &m->wsched);
475 return;
476 }
477
478 if (err < 0)
479 goto error;
480 else if (err == 0) {
481 err = -EREMOTEIO;
482 goto error;
483 }
484
485 m->wpos += err;
486 if (m->wpos == m->wsize)
487 m->wpos = m->wsize = 0;
488
489 if (m->wsize == 0 && !list_empty(&m->unsent_req_list)) {
490 if (test_and_clear_bit(Wpending, &m->wsched))
491 n = POLLOUT;
492 else
8b81ef58 493 n = p9_fd_poll(m->client, NULL);
8a0dc95f
EVH
494
495 if (n & POLLOUT) {
51a87c55 496 P9_DPRINTK(P9_DEBUG_TRANS, "sched write work %p\n", m);
8a0dc95f
EVH
497 queue_work(p9_mux_wq, &m->wq);
498 } else
499 clear_bit(Wworksched, &m->wsched);
500 } else
501 clear_bit(Wworksched, &m->wsched);
502
503 return;
504
505error:
506 p9_conn_cancel(m, err);
507 clear_bit(Wworksched, &m->wsched);
508}
509
5503ac56 510static int p9_pollwake(wait_queue_t *wait, unsigned mode, int sync, void *key)
8a0dc95f 511{
5503ac56
EVH
512 struct p9_poll_wait *pwait =
513 container_of(wait, struct p9_poll_wait, wait);
514 struct p9_conn *m = pwait->conn;
515 unsigned long flags;
516 DECLARE_WAITQUEUE(dummy_wait, p9_poll_task);
8a0dc95f 517
5503ac56
EVH
518 spin_lock_irqsave(&p9_poll_lock, flags);
519 if (list_empty(&m->poll_pending_link))
520 list_add_tail(&m->poll_pending_link, &p9_poll_pending_list);
521 spin_unlock_irqrestore(&p9_poll_lock, flags);
8a0dc95f 522
5503ac56
EVH
523 /* perform the default wake up operation */
524 return default_wake_function(&dummy_wait, mode, sync, key);
8a0dc95f
EVH
525}
526
527/**
5503ac56
EVH
528 * p9_pollwait - add poll task to the wait queue
529 * @filp: file pointer being polled
530 * @wait_address: wait_q to block on
531 * @p: poll state
ee443996 532 *
5503ac56 533 * called by files poll operation to add v9fs-poll task to files wait queue
8a0dc95f 534 */
ee443996 535
5503ac56
EVH
536static void
537p9_pollwait(struct file *filp, wait_queue_head_t *wait_address, poll_table *p)
8a0dc95f 538{
5503ac56
EVH
539 struct p9_conn *m = container_of(p, struct p9_conn, pt);
540 struct p9_poll_wait *pwait = NULL;
541 int i;
8a0dc95f 542
5503ac56
EVH
543 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
544 if (m->poll_wait[i].wait_addr == NULL) {
545 pwait = &m->poll_wait[i];
546 break;
8a0dc95f 547 }
8a0dc95f
EVH
548 }
549
5503ac56
EVH
550 if (!pwait) {
551 P9_DPRINTK(P9_DEBUG_ERROR, "not enough wait_address slots\n");
8a0dc95f
EVH
552 return;
553 }
554
5503ac56
EVH
555 pwait->conn = m;
556 pwait->wait_addr = wait_address;
557 init_waitqueue_func_entry(&pwait->wait, p9_pollwake);
558 add_wait_queue(wait_address, &pwait->wait);
559}
8a0dc95f 560
5503ac56
EVH
561/**
562 * p9_conn_create - allocate and initialize the per-session mux data
563 * @client: client instance
564 *
565 * Note: Creates the polling task if this is the first session.
566 */
8a0dc95f 567
5503ac56
EVH
568static struct p9_conn *p9_conn_create(struct p9_client *client)
569{
95820a36 570 int n;
5503ac56 571 struct p9_conn *m;
8a0dc95f 572
51a87c55
EVH
573 P9_DPRINTK(P9_DEBUG_TRANS, "client %p msize %d\n", client,
574 client->msize);
5503ac56
EVH
575 m = kzalloc(sizeof(struct p9_conn), GFP_KERNEL);
576 if (!m)
577 return ERR_PTR(-ENOMEM);
8a0dc95f 578
5503ac56
EVH
579 INIT_LIST_HEAD(&m->mux_list);
580 m->client = client;
8a0dc95f 581
5503ac56
EVH
582 INIT_LIST_HEAD(&m->req_list);
583 INIT_LIST_HEAD(&m->unsent_req_list);
584 INIT_WORK(&m->rq, p9_read_work);
585 INIT_WORK(&m->wq, p9_write_work);
586 INIT_LIST_HEAD(&m->poll_pending_link);
587 init_poll_funcptr(&m->pt, p9_pollwait);
8a0dc95f 588
5503ac56
EVH
589 n = p9_fd_poll(client, &m->pt);
590 if (n & POLLIN) {
51a87c55 591 P9_DPRINTK(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56
EVH
592 set_bit(Rpending, &m->wsched);
593 }
8a0dc95f 594
5503ac56 595 if (n & POLLOUT) {
51a87c55 596 P9_DPRINTK(P9_DEBUG_TRANS, "mux %p can write\n", m);
5503ac56
EVH
597 set_bit(Wpending, &m->wsched);
598 }
599
5503ac56
EVH
600 return m;
601}
8a0dc95f 602
5503ac56
EVH
603/**
604 * p9_poll_mux - polls a mux and schedules read or write works if necessary
605 * @m: connection to poll
606 *
607 */
608
609static void p9_poll_mux(struct p9_conn *m)
610{
611 int n;
612
613 if (m->err < 0)
614 return;
615
616 n = p9_fd_poll(m->client, NULL);
617 if (n < 0 || n & (POLLERR | POLLHUP | POLLNVAL)) {
51a87c55 618 P9_DPRINTK(P9_DEBUG_TRANS, "error mux %p err %d\n", m, n);
5503ac56
EVH
619 if (n >= 0)
620 n = -ECONNRESET;
621 p9_conn_cancel(m, n);
622 }
623
624 if (n & POLLIN) {
625 set_bit(Rpending, &m->wsched);
51a87c55 626 P9_DPRINTK(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56 627 if (!test_and_set_bit(Rworksched, &m->wsched)) {
51a87c55 628 P9_DPRINTK(P9_DEBUG_TRANS, "sched read work %p\n", m);
8a0dc95f 629 queue_work(p9_mux_wq, &m->rq);
5503ac56
EVH
630 }
631 }
8a0dc95f 632
5503ac56
EVH
633 if (n & POLLOUT) {
634 set_bit(Wpending, &m->wsched);
51a87c55 635 P9_DPRINTK(P9_DEBUG_TRANS, "mux %p can write\n", m);
f64f9e71
JP
636 if ((m->wsize || !list_empty(&m->unsent_req_list)) &&
637 !test_and_set_bit(Wworksched, &m->wsched)) {
51a87c55 638 P9_DPRINTK(P9_DEBUG_TRANS, "sched write work %p\n", m);
5503ac56
EVH
639 queue_work(p9_mux_wq, &m->wq);
640 }
641 }
8a0dc95f
EVH
642}
643
644/**
91b8534f 645 * p9_fd_request - send 9P request
8a0dc95f
EVH
646 * The function can sleep until the request is scheduled for sending.
647 * The function can be interrupted. Return from the function is not
91b8534f 648 * a guarantee that the request is sent successfully.
8a0dc95f 649 *
91b8534f
EVH
650 * @client: client instance
651 * @req: request to be sent
ee443996 652 *
8a0dc95f 653 */
ee443996 654
91b8534f 655static int p9_fd_request(struct p9_client *client, struct p9_req_t *req)
8a0dc95f
EVH
656{
657 int n;
91b8534f
EVH
658 struct p9_trans_fd *ts = client->trans;
659 struct p9_conn *m = ts->conn;
8a0dc95f 660
51a87c55
EVH
661 P9_DPRINTK(P9_DEBUG_TRANS, "mux %p task %p tcall %p id %d\n", m,
662 current, req->tc, req->tc->id);
8a0dc95f 663 if (m->err < 0)
91b8534f 664 return m->err;
8a0dc95f 665
91b8534f 666 spin_lock(&client->lock);
7eb923b8 667 req->status = REQ_STATUS_UNSENT;
8a0dc95f 668 list_add_tail(&req->req_list, &m->unsent_req_list);
91b8534f 669 spin_unlock(&client->lock);
8a0dc95f
EVH
670
671 if (test_and_clear_bit(Wpending, &m->wsched))
672 n = POLLOUT;
673 else
8b81ef58 674 n = p9_fd_poll(m->client, NULL);
8a0dc95f
EVH
675
676 if (n & POLLOUT && !test_and_set_bit(Wworksched, &m->wsched))
677 queue_work(p9_mux_wq, &m->wq);
678
91b8534f 679 return 0;
8a0dc95f
EVH
680}
681
91b8534f 682static int p9_fd_cancel(struct p9_client *client, struct p9_req_t *req)
8a0dc95f 683{
7eb923b8 684 int ret = 1;
8a0dc95f 685
0b15a3a5 686 P9_DPRINTK(P9_DEBUG_TRANS, "client %p req %p\n", client, req);
8a0dc95f 687
91b8534f 688 spin_lock(&client->lock);
91b8534f 689
91b8534f 690 if (req->status == REQ_STATUS_UNSENT) {
1bab88b2 691 list_del(&req->req_list);
91b8534f 692 req->status = REQ_STATUS_FLSHD;
7eb923b8 693 ret = 0;
1bab88b2
LI
694 } else if (req->status == REQ_STATUS_SENT)
695 req->status = REQ_STATUS_FLSH;
8a0dc95f 696
7eb923b8
EVH
697 spin_unlock(&client->lock);
698
699 return ret;
8a0dc95f
EVH
700}
701
a80d923e 702/**
0e15597e
AK
703 * parse_opts - parse mount options into p9_fd_opts structure
704 * @params: options string passed from mount
705 * @opts: fd transport-specific structure to parse options into
a80d923e 706 *
bb8ffdfc 707 * Returns 0 upon success, -ERRNO upon failure
a80d923e 708 */
bd238fb4 709
bb8ffdfc 710static int parse_opts(char *params, struct p9_fd_opts *opts)
bd238fb4 711{
a80d923e
EVH
712 char *p;
713 substring_t args[MAX_OPT_ARGS];
714 int option;
bb8ffdfc 715 char *options;
a80d923e 716 int ret;
bd238fb4 717
a80d923e
EVH
718 opts->port = P9_PORT;
719 opts->rfd = ~0;
720 opts->wfd = ~0;
bd238fb4 721
bb8ffdfc
EVH
722 if (!params)
723 return 0;
724
725 options = kstrdup(params, GFP_KERNEL);
726 if (!options) {
727 P9_DPRINTK(P9_DEBUG_ERROR,
728 "failed to allocate copy of option string\n");
729 return -ENOMEM;
730 }
bd238fb4 731
a80d923e
EVH
732 while ((p = strsep(&options, ",")) != NULL) {
733 int token;
bb8ffdfc 734 int r;
a80d923e
EVH
735 if (!*p)
736 continue;
737 token = match_token(p, tokens, args);
15da4b16
AK
738 if (token != Opt_err) {
739 r = match_int(&args[0], &option);
740 if (r < 0) {
741 P9_DPRINTK(P9_DEBUG_ERROR,
742 "integer field, but no integer?\n");
743 ret = r;
744 continue;
745 }
a80d923e
EVH
746 }
747 switch (token) {
748 case Opt_port:
749 opts->port = option;
750 break;
751 case Opt_rfdno:
752 opts->rfd = option;
753 break;
754 case Opt_wfdno:
755 opts->wfd = option;
756 break;
757 default:
758 continue;
759 }
bd238fb4 760 }
bb8ffdfc
EVH
761 kfree(options);
762 return 0;
bd238fb4 763}
bd238fb4 764
8b81ef58 765static int p9_fd_open(struct p9_client *client, int rfd, int wfd)
bd238fb4 766{
a80d923e
EVH
767 struct p9_trans_fd *ts = kmalloc(sizeof(struct p9_trans_fd),
768 GFP_KERNEL);
769 if (!ts)
770 return -ENOMEM;
bd238fb4 771
a80d923e
EVH
772 ts->rd = fget(rfd);
773 ts->wr = fget(wfd);
774 if (!ts->rd || !ts->wr) {
775 if (ts->rd)
776 fput(ts->rd);
777 if (ts->wr)
778 fput(ts->wr);
779 kfree(ts);
780 return -EIO;
bd238fb4
LI
781 }
782
8b81ef58
EVH
783 client->trans = ts;
784 client->status = Connected;
bd238fb4 785
a80d923e 786 return 0;
bd238fb4 787}
bd238fb4 788
8b81ef58 789static int p9_socket_open(struct p9_client *client, struct socket *csocket)
bd238fb4
LI
790{
791 int fd, ret;
792
793 csocket->sk->sk_allocation = GFP_NOIO;
a677a039 794 fd = sock_map_fd(csocket, 0);
bd238fb4
LI
795 if (fd < 0) {
796 P9_EPRINTK(KERN_ERR, "p9_socket_open: failed to map fd\n");
797 return fd;
798 }
799
8b81ef58 800 ret = p9_fd_open(client, fd, fd);
bd238fb4
LI
801 if (ret < 0) {
802 P9_EPRINTK(KERN_ERR, "p9_socket_open: failed to open fd\n");
803 sockfd_put(csocket);
804 return ret;
805 }
806
8b81ef58 807 ((struct p9_trans_fd *)client->trans)->rd->f_flags |= O_NONBLOCK;
bd238fb4
LI
808
809 return 0;
810}
811
bd238fb4 812/**
5503ac56
EVH
813 * p9_mux_destroy - cancels all pending requests and frees mux resources
814 * @m: mux to destroy
bd238fb4
LI
815 *
816 */
ee443996 817
5503ac56 818static void p9_conn_destroy(struct p9_conn *m)
bd238fb4 819{
51a87c55 820 P9_DPRINTK(P9_DEBUG_TRANS, "mux %p prev %p next %p\n", m,
5503ac56 821 m->mux_list.prev, m->mux_list.next);
bd238fb4 822
5503ac56
EVH
823 p9_mux_poll_stop(m);
824 cancel_work_sync(&m->rq);
825 cancel_work_sync(&m->wq);
bd238fb4 826
5503ac56 827 p9_conn_cancel(m, -ECONNRESET);
bd238fb4 828
5503ac56 829 m->client = NULL;
5503ac56 830 kfree(m);
bd238fb4
LI
831}
832
833/**
8b81ef58
EVH
834 * p9_fd_close - shutdown file descriptor transport
835 * @client: client instance
bd238fb4
LI
836 *
837 */
ee443996 838
8b81ef58 839static void p9_fd_close(struct p9_client *client)
bd238fb4
LI
840{
841 struct p9_trans_fd *ts;
842
8b81ef58 843 if (!client)
bd238fb4
LI
844 return;
845
8b81ef58 846 ts = client->trans;
bd238fb4
LI
847 if (!ts)
848 return;
849
8b81ef58
EVH
850 client->status = Disconnected;
851
8a0dc95f
EVH
852 p9_conn_destroy(ts->conn);
853
bd238fb4
LI
854 if (ts->rd)
855 fput(ts->rd);
856 if (ts->wr)
857 fput(ts->wr);
8b81ef58 858
bd238fb4
LI
859 kfree(ts);
860}
861
887b3ece
EVH
/*
 * stolen from NFS - maybe should be made a generic function?
 *
 * Checks that @buf starts with a dotted-quad IPv4 address whose four
 * components each lie in the range 0..255.
 *
 * Returns 0 if it does, -EINVAL otherwise.
 */
static inline int valid_ipaddr4(const char *buf)
{
	int rc, count, in[4];

	rc = sscanf(buf, "%d.%d.%d.%d", &in[0], &in[1], &in[2], &in[3]);
	if (rc != 4)
		return -EINVAL;
	for (count = 0; count < 4; count++) {
		/* %d also accepts a sign, so reject negative components */
		if (in[count] < 0 || in[count] > 255)
			return -EINVAL;
	}
	return 0;
}
878
8b81ef58
EVH
879static int
880p9_fd_create_tcp(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
881{
882 int err;
a80d923e
EVH
883 struct socket *csocket;
884 struct sockaddr_in sin_server;
885 struct p9_fd_opts opts;
8b81ef58 886 struct p9_trans_fd *p = NULL; /* this gets allocated in p9_fd_open */
a80d923e 887
bb8ffdfc
EVH
888 err = parse_opts(args, &opts);
889 if (err < 0)
8b81ef58 890 return err;
a80d923e 891
887b3ece 892 if (valid_ipaddr4(addr) < 0)
8b81ef58 893 return -EINVAL;
887b3ece 894
a80d923e 895 csocket = NULL;
a80d923e
EVH
896
897 sin_server.sin_family = AF_INET;
898 sin_server.sin_addr.s_addr = in_aton(addr);
899 sin_server.sin_port = htons(opts.port);
900 sock_create_kern(PF_INET, SOCK_STREAM, IPPROTO_TCP, &csocket);
901
902 if (!csocket) {
903 P9_EPRINTK(KERN_ERR, "p9_trans_tcp: problem creating socket\n");
904 err = -EIO;
905 goto error;
906 }
907
908 err = csocket->ops->connect(csocket,
909 (struct sockaddr *)&sin_server,
910 sizeof(struct sockaddr_in), 0);
911 if (err < 0) {
912 P9_EPRINTK(KERN_ERR,
913 "p9_trans_tcp: problem connecting socket to %s\n",
914 addr);
915 goto error;
916 }
917
8b81ef58 918 err = p9_socket_open(client, csocket);
a80d923e
EVH
919 if (err < 0)
920 goto error;
921
8b81ef58
EVH
922 p = (struct p9_trans_fd *) client->trans;
923 p->conn = p9_conn_create(client);
8a0dc95f
EVH
924 if (IS_ERR(p->conn)) {
925 err = PTR_ERR(p->conn);
926 p->conn = NULL;
927 goto error;
928 }
929
8b81ef58 930 return 0;
a80d923e
EVH
931
932error:
933 if (csocket)
934 sock_release(csocket);
935
8b81ef58
EVH
936 kfree(p);
937
938 return err;
a80d923e
EVH
939}
940
8b81ef58
EVH
941static int
942p9_fd_create_unix(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
943{
944 int err;
945 struct socket *csocket;
946 struct sockaddr_un sun_server;
8b81ef58 947 struct p9_trans_fd *p = NULL; /* this gets allocated in p9_fd_open */
a80d923e
EVH
948
949 csocket = NULL;
a80d923e
EVH
950
951 if (strlen(addr) > UNIX_PATH_MAX) {
952 P9_EPRINTK(KERN_ERR, "p9_trans_unix: address too long: %s\n",
953 addr);
954 err = -ENAMETOOLONG;
955 goto error;
956 }
957
958 sun_server.sun_family = PF_UNIX;
959 strcpy(sun_server.sun_path, addr);
960 sock_create_kern(PF_UNIX, SOCK_STREAM, 0, &csocket);
961 err = csocket->ops->connect(csocket, (struct sockaddr *)&sun_server,
962 sizeof(struct sockaddr_un) - 1, 0);
963 if (err < 0) {
964 P9_EPRINTK(KERN_ERR,
965 "p9_trans_unix: problem connecting socket: %s: %d\n",
966 addr, err);
967 goto error;
968 }
969
8b81ef58 970 err = p9_socket_open(client, csocket);
a80d923e
EVH
971 if (err < 0)
972 goto error;
973
8b81ef58
EVH
974 p = (struct p9_trans_fd *) client->trans;
975 p->conn = p9_conn_create(client);
8a0dc95f
EVH
976 if (IS_ERR(p->conn)) {
977 err = PTR_ERR(p->conn);
978 p->conn = NULL;
979 goto error;
980 }
981
8b81ef58 982 return 0;
a80d923e
EVH
983
984error:
985 if (csocket)
986 sock_release(csocket);
987
8b81ef58
EVH
988 kfree(p);
989 return err;
a80d923e
EVH
990}
991
8b81ef58
EVH
992static int
993p9_fd_create(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
994{
995 int err;
a80d923e 996 struct p9_fd_opts opts;
8b81ef58 997 struct p9_trans_fd *p = NULL; /* this get allocated in p9_fd_open */
a80d923e
EVH
998
999 parse_opts(args, &opts);
1000
1001 if (opts.rfd == ~0 || opts.wfd == ~0) {
1002 printk(KERN_ERR "v9fs: Insufficient options for proto=fd\n");
8b81ef58 1003 return -ENOPROTOOPT;
a80d923e
EVH
1004 }
1005
8b81ef58 1006 err = p9_fd_open(client, opts.rfd, opts.wfd);
a80d923e
EVH
1007 if (err < 0)
1008 goto error;
1009
8b81ef58
EVH
1010 p = (struct p9_trans_fd *) client->trans;
1011 p->conn = p9_conn_create(client);
8a0dc95f
EVH
1012 if (IS_ERR(p->conn)) {
1013 err = PTR_ERR(p->conn);
1014 p->conn = NULL;
1015 goto error;
1016 }
1017
8b81ef58 1018 return 0;
a80d923e
EVH
1019
1020error:
8b81ef58
EVH
1021 kfree(p);
1022 return err;
a80d923e
EVH
1023}
1024
1025static struct p9_trans_module p9_tcp_trans = {
1026 .name = "tcp",
1027 .maxsize = MAX_SOCK_BUF,
1028 .def = 1,
8b81ef58
EVH
1029 .create = p9_fd_create_tcp,
1030 .close = p9_fd_close,
91b8534f
EVH
1031 .request = p9_fd_request,
1032 .cancel = p9_fd_cancel,
72029fe8 1033 .owner = THIS_MODULE,
a80d923e
EVH
1034};
1035
1036static struct p9_trans_module p9_unix_trans = {
1037 .name = "unix",
1038 .maxsize = MAX_SOCK_BUF,
1039 .def = 0,
8b81ef58
EVH
1040 .create = p9_fd_create_unix,
1041 .close = p9_fd_close,
91b8534f
EVH
1042 .request = p9_fd_request,
1043 .cancel = p9_fd_cancel,
72029fe8 1044 .owner = THIS_MODULE,
a80d923e
EVH
1045};
1046
1047static struct p9_trans_module p9_fd_trans = {
1048 .name = "fd",
1049 .maxsize = MAX_SOCK_BUF,
1050 .def = 0,
8b81ef58
EVH
1051 .create = p9_fd_create,
1052 .close = p9_fd_close,
91b8534f
EVH
1053 .request = p9_fd_request,
1054 .cancel = p9_fd_cancel,
72029fe8 1055 .owner = THIS_MODULE,
a80d923e
EVH
1056};
1057
5503ac56
EVH
1058/**
1059 * p9_poll_proc - poll worker thread
1060 * @a: thread state and arguments
1061 *
1062 * polls all v9fs transports for new events and queues the appropriate
1063 * work to the work queue
1064 *
1065 */
1066
1067static int p9_poll_proc(void *a)
1068{
1069 unsigned long flags;
1070
51a87c55 1071 P9_DPRINTK(P9_DEBUG_TRANS, "start %p\n", current);
5503ac56
EVH
1072 repeat:
1073 spin_lock_irqsave(&p9_poll_lock, flags);
1074 while (!list_empty(&p9_poll_pending_list)) {
1075 struct p9_conn *conn = list_first_entry(&p9_poll_pending_list,
1076 struct p9_conn,
1077 poll_pending_link);
1078 list_del_init(&conn->poll_pending_link);
1079 spin_unlock_irqrestore(&p9_poll_lock, flags);
1080
1081 p9_poll_mux(conn);
1082
1083 spin_lock_irqsave(&p9_poll_lock, flags);
1084 }
1085 spin_unlock_irqrestore(&p9_poll_lock, flags);
1086
1087 set_current_state(TASK_INTERRUPTIBLE);
1088 if (list_empty(&p9_poll_pending_list)) {
51a87c55 1089 P9_DPRINTK(P9_DEBUG_TRANS, "sleeping...\n");
5503ac56
EVH
1090 schedule();
1091 }
1092 __set_current_state(TASK_RUNNING);
1093
1094 if (!kthread_should_stop())
1095 goto repeat;
1096
51a87c55 1097 P9_DPRINTK(P9_DEBUG_TRANS, "finish\n");
5503ac56
EVH
1098 return 0;
1099}
1100
887b3ece 1101int p9_trans_fd_init(void)
a80d923e 1102{
206ca50d
TH
1103 p9_mux_wq = create_workqueue("v9fs");
1104 if (!p9_mux_wq) {
1105 printk(KERN_WARNING "v9fs: mux: creating workqueue failed\n");
1106 return -ENOMEM;
8a0dc95f
EVH
1107 }
1108
992b3f1d
TH
1109 p9_poll_task = kthread_run(p9_poll_proc, NULL, "v9fs-poll");
1110 if (IS_ERR(p9_poll_task)) {
1111 destroy_workqueue(p9_mux_wq);
1112 printk(KERN_WARNING "v9fs: mux: creating poll task failed\n");
1113 return PTR_ERR(p9_poll_task);
1114 }
1115
a80d923e
EVH
1116 v9fs_register_trans(&p9_tcp_trans);
1117 v9fs_register_trans(&p9_unix_trans);
1118 v9fs_register_trans(&p9_fd_trans);
1119
3387b804 1120 return 0;
a80d923e 1121}
72029fe8
TH
1122
1123void p9_trans_fd_exit(void)
1124{
992b3f1d 1125 kthread_stop(p9_poll_task);
72029fe8
TH
1126 v9fs_unregister_trans(&p9_tcp_trans);
1127 v9fs_unregister_trans(&p9_unix_trans);
1128 v9fs_unregister_trans(&p9_fd_trans);
206ca50d
TH
1129
1130 destroy_workqueue(p9_mux_wq);
72029fe8 1131}