9P: Fix race in p9_write_work()
[deliverable/linux.git] / net / 9p / trans_fd.c
CommitLineData
bd238fb4
LI
1/*
2 * linux/fs/9p/trans_fd.c
3 *
4 * Fd transport layer. Includes deprecated socket layer.
5 *
6 * Copyright (C) 2006 by Russ Cox <rsc@swtch.com>
7 * Copyright (C) 2004-2005 by Latchesar Ionkov <lucho@ionkov.net>
8a0dc95f 8 * Copyright (C) 2004-2008 by Eric Van Hensbergen <ericvh@gmail.com>
bd238fb4
LI
9 * Copyright (C) 1997-2002 by Ron Minnich <rminnich@sarnoff.com>
10 *
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License version 2
13 * as published by the Free Software Foundation.
14 *
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
19 *
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to:
22 * Free Software Foundation
23 * 51 Franklin Street, Fifth Floor
24 * Boston, MA 02111-1301 USA
25 *
26 */
27
5d385153
JP
28#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
29
bd238fb4
LI
30#include <linux/in.h>
31#include <linux/module.h>
32#include <linux/net.h>
33#include <linux/ipv6.h>
8a0dc95f 34#include <linux/kthread.h>
bd238fb4
LI
35#include <linux/errno.h>
36#include <linux/kernel.h>
37#include <linux/un.h>
38#include <linux/uaccess.h>
39#include <linux/inet.h>
40#include <linux/idr.h>
41#include <linux/file.h>
a80d923e 42#include <linux/parser.h>
5a0e3ad6 43#include <linux/slab.h>
bd238fb4 44#include <net/9p/9p.h>
8b81ef58 45#include <net/9p/client.h>
bd238fb4
LI
46#include <net/9p/transport.h>
47
6b18662e
AV
48#include <linux/syscalls.h> /* killme */
49
bd238fb4 50#define P9_PORT 564
a80d923e 51#define MAX_SOCK_BUF (64*1024)
8a0dc95f 52#define MAXPOLLWADDR 2
a80d923e 53
ee443996
EVH
54/**
55 * struct p9_fd_opts - per-transport options
56 * @rfd: file descriptor for reading (trans=fd)
57 * @wfd: file descriptor for writing (trans=fd)
58 * @port: port to connect to (trans=tcp)
59 *
60 */
61
a80d923e
EVH
62struct p9_fd_opts {
63 int rfd;
64 int wfd;
65 u16 port;
66};
bd238fb4 67
ee443996
EVH
/**
 * struct p9_trans_fd - per-client state of an fd-based transport
 * @rd: file that replies are read from
 * @wr: file that requests are written to (may be the same file as @rd)
 * @conn: mux/connection state driving the read and write work items
 */
struct p9_trans_fd {
	struct file *rd;
	struct file *wr;
	struct p9_conn *conn;
};
81
a80d923e
EVH
82/*
83 * Option Parsing (code inspired by NFS code)
84 * - a little lazy - parse all fd-transport options
85 */
bd238fb4 86
a80d923e
EVH
/* Token ids returned by match_token() for the option table below. */
enum {
	/* Options that take integer arguments */
	Opt_port,
	Opt_rfdno,
	Opt_wfdno,
	/* Catch-all entry: the option matched none of the patterns */
	Opt_err,
};
bd238fb4 91
a447c093 92static const match_table_t tokens = {
a80d923e
EVH
93 {Opt_port, "port=%u"},
94 {Opt_rfdno, "rfdno=%u"},
95 {Opt_wfdno, "wfdno=%u"},
55762690 96 {Opt_err, NULL},
a80d923e 97};
bd238fb4 98
8a0dc95f
EVH
/*
 * State flags kept in p9_conn.wsched.  Note that these constants are passed
 * as bit *numbers* to set_bit()/clear_bit()/test_and_set_bit(), not OR-ed in
 * as masks; they only need to be distinct.
 */
enum {
	Rworksched = 1,		/* read work scheduled or running */
	Rpending   = 2,		/* can read */
	Wworksched = 4,		/* write work scheduled or running */
	Wpending   = 8,		/* can write */
};
105
992b3f1d
TH
106struct p9_poll_wait {
107 struct p9_conn *conn;
108 wait_queue_t wait;
109 wait_queue_head_t *wait_addr;
ee443996
EVH
110};
111
112/**
113 * struct p9_conn - fd mux connection state information
ee443996 114 * @mux_list: list link for mux to manage multiple connections (?)
8b81ef58 115 * @client: reference to client instance for this connection
ee443996 116 * @err: error state
ee443996
EVH
117 * @req_list: accounting for requests which have been sent
118 * @unsent_req_list: accounting for requests that haven't been sent
1b0a763b
EVH
119 * @req: current request being processed (if any)
120 * @tmp_buf: temporary buffer to read in header
121 * @rsize: amount to read for current frame
ee443996
EVH
122 * @rpos: read position in current frame
123 * @rbuf: current read buffer
124 * @wpos: write position for current frame
125 * @wsize: amount of data to write for current frame
126 * @wbuf: current write buffer
0e15597e 127 * @poll_pending_link: pending links to be polled per conn
ee443996 128 * @poll_wait: array of wait_q's for various worker threads
ee443996
EVH
129 * @pt: poll state
130 * @rq: current read work
131 * @wq: current write work
132 * @wsched: ????
133 *
134 */
8a0dc95f
EVH
135
136struct p9_conn {
8a0dc95f 137 struct list_head mux_list;
8b81ef58 138 struct p9_client *client;
8a0dc95f 139 int err;
8a0dc95f
EVH
140 struct list_head req_list;
141 struct list_head unsent_req_list;
1b0a763b
EVH
142 struct p9_req_t *req;
143 char tmp_buf[7];
144 int rsize;
8a0dc95f
EVH
145 int rpos;
146 char *rbuf;
147 int wpos;
148 int wsize;
149 char *wbuf;
992b3f1d
TH
150 struct list_head poll_pending_link;
151 struct p9_poll_wait poll_wait[MAXPOLLWADDR];
8a0dc95f
EVH
152 poll_table pt;
153 struct work_struct rq;
154 struct work_struct wq;
155 unsigned long wsched;
156};
157
aa70c585
TH
/* Handler of p9_poll_work; it drains p9_poll_pending_list. */
static void p9_poll_workfn(struct work_struct *work);

/*
 * Connections that were woken through p9_pollwake() and still have to be
 * polled.  The list and every conn's poll_pending_link are only touched
 * with p9_poll_lock held.
 */
static DEFINE_SPINLOCK(p9_poll_lock);
static LIST_HEAD(p9_poll_pending_list);
static DECLARE_WORK(p9_poll_work, p9_poll_workfn);
8a0dc95f 163
992b3f1d 164static void p9_mux_poll_stop(struct p9_conn *m)
8a0dc95f 165{
992b3f1d
TH
166 unsigned long flags;
167 int i;
8a0dc95f 168
992b3f1d
TH
169 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
170 struct p9_poll_wait *pwait = &m->poll_wait[i];
8a0dc95f 171
992b3f1d
TH
172 if (pwait->wait_addr) {
173 remove_wait_queue(pwait->wait_addr, &pwait->wait);
174 pwait->wait_addr = NULL;
8a0dc95f 175 }
8a0dc95f
EVH
176 }
177
992b3f1d
TH
178 spin_lock_irqsave(&p9_poll_lock, flags);
179 list_del_init(&m->poll_pending_link);
180 spin_unlock_irqrestore(&p9_poll_lock, flags);
8a0dc95f
EVH
181}
182
183/**
5503ac56
EVH
184 * p9_conn_cancel - cancel all pending requests with error
185 * @m: mux data
186 * @err: error code
8a0dc95f 187 *
8a0dc95f 188 */
ee443996 189
51a87c55 190static void p9_conn_cancel(struct p9_conn *m, int err)
8a0dc95f 191{
673d62cd 192 struct p9_req_t *req, *rtmp;
91b8534f 193 unsigned long flags;
5503ac56 194 LIST_HEAD(cancel_list);
8a0dc95f 195
5d385153 196 p9_debug(P9_DEBUG_ERROR, "mux %p err %d\n", m, err);
7eb923b8 197
91b8534f 198 spin_lock_irqsave(&m->client->lock, flags);
7eb923b8
EVH
199
200 if (m->err) {
201 spin_unlock_irqrestore(&m->client->lock, flags);
202 return;
203 }
204
205 m->err = err;
206
5503ac56 207 list_for_each_entry_safe(req, rtmp, &m->req_list, req_list) {
673d62cd
EVH
208 req->status = REQ_STATUS_ERROR;
209 if (!req->t_err)
210 req->t_err = err;
5503ac56
EVH
211 list_move(&req->req_list, &cancel_list);
212 }
213 list_for_each_entry_safe(req, rtmp, &m->unsent_req_list, req_list) {
673d62cd
EVH
214 req->status = REQ_STATUS_ERROR;
215 if (!req->t_err)
216 req->t_err = err;
5503ac56 217 list_move(&req->req_list, &cancel_list);
8a0dc95f 218 }
91b8534f 219 spin_unlock_irqrestore(&m->client->lock, flags);
8a0dc95f 220
5503ac56 221 list_for_each_entry_safe(req, rtmp, &cancel_list, req_list) {
5d385153 222 p9_debug(P9_DEBUG_ERROR, "call back req %p\n", req);
1bab88b2 223 list_del(&req->req_list);
91b8534f 224 p9_client_cb(m->client, req);
8a0dc95f 225 }
8a0dc95f
EVH
226}
227
29af9309 228static int
5503ac56 229p9_fd_poll(struct p9_client *client, struct poll_table_struct *pt)
8a0dc95f 230{
5503ac56
EVH
231 int ret, n;
232 struct p9_trans_fd *ts = NULL;
8a0dc95f 233
5503ac56
EVH
234 if (client && client->status == Connected)
235 ts = client->trans;
7dc5d24b 236
5503ac56
EVH
237 if (!ts)
238 return -EREMOTEIO;
7dc5d24b 239
5503ac56
EVH
240 if (!ts->rd->f_op || !ts->rd->f_op->poll)
241 return -EIO;
8a0dc95f 242
5503ac56
EVH
243 if (!ts->wr->f_op || !ts->wr->f_op->poll)
244 return -EIO;
992b3f1d 245
5503ac56
EVH
246 ret = ts->rd->f_op->poll(ts->rd, pt);
247 if (ret < 0)
248 return ret;
992b3f1d 249
5503ac56
EVH
250 if (ts->rd != ts->wr) {
251 n = ts->wr->f_op->poll(ts->wr, pt);
252 if (n < 0)
253 return n;
254 ret = (ret & ~POLLOUT) | (n & ~POLLIN);
255 }
256
257 return ret;
992b3f1d
TH
258}
259
8a0dc95f 260/**
5503ac56
EVH
261 * p9_fd_read- read from a fd
262 * @client: client instance
263 * @v: buffer to receive data into
264 * @len: size of receive buffer
ee443996 265 *
8a0dc95f 266 */
ee443996 267
5503ac56 268static int p9_fd_read(struct p9_client *client, void *v, int len)
8a0dc95f 269{
5503ac56
EVH
270 int ret;
271 struct p9_trans_fd *ts = NULL;
8a0dc95f 272
5503ac56
EVH
273 if (client && client->status != Disconnected)
274 ts = client->trans;
8a0dc95f 275
5503ac56
EVH
276 if (!ts)
277 return -EREMOTEIO;
8a0dc95f 278
5503ac56 279 if (!(ts->rd->f_flags & O_NONBLOCK))
5d385153 280 p9_debug(P9_DEBUG_ERROR, "blocking read ...\n");
8a0dc95f 281
5503ac56
EVH
282 ret = kernel_read(ts->rd, ts->rd->f_pos, v, len);
283 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
284 client->status = Disconnected;
285 return ret;
8a0dc95f
EVH
286}
287
288/**
5503ac56
EVH
289 * p9_read_work - called when there is some data to be read from a transport
290 * @work: container of work to be done
ee443996 291 *
8a0dc95f 292 */
ee443996 293
5503ac56 294static void p9_read_work(struct work_struct *work)
8a0dc95f 295{
5503ac56
EVH
296 int n, err;
297 struct p9_conn *m;
5503ac56
EVH
298
299 m = container_of(work, struct p9_conn, rq);
8a0dc95f
EVH
300
301 if (m->err < 0)
302 return;
303
5d385153 304 p9_debug(P9_DEBUG_TRANS, "start mux %p pos %d\n", m, m->rpos);
8a0dc95f 305
1b0a763b
EVH
306 if (!m->rbuf) {
307 m->rbuf = m->tmp_buf;
5503ac56 308 m->rpos = 0;
1b0a763b 309 m->rsize = 7; /* start by reading header */
8a0dc95f
EVH
310 }
311
5503ac56 312 clear_bit(Rpending, &m->wsched);
5d385153
JP
313 p9_debug(P9_DEBUG_TRANS, "read mux %p pos %d size: %d = %d\n",
314 m, m->rpos, m->rsize, m->rsize-m->rpos);
5503ac56 315 err = p9_fd_read(m->client, m->rbuf + m->rpos,
1b0a763b 316 m->rsize - m->rpos);
5d385153 317 p9_debug(P9_DEBUG_TRANS, "mux %p got %d bytes\n", m, err);
5503ac56 318 if (err == -EAGAIN) {
0462194d 319 goto end_clear;
8a0dc95f 320 }
8a0dc95f 321
5503ac56
EVH
322 if (err <= 0)
323 goto error;
324
325 m->rpos += err;
1b0a763b
EVH
326
327 if ((!m->req) && (m->rpos == m->rsize)) { /* header read in */
328 u16 tag;
5d385153 329 p9_debug(P9_DEBUG_TRANS, "got new header\n");
1b0a763b
EVH
330
331 n = le32_to_cpu(*(__le32 *) m->rbuf); /* read packet size */
5503ac56 332 if (n >= m->client->msize) {
5d385153
JP
333 p9_debug(P9_DEBUG_ERROR,
334 "requested packet size too big: %d\n", n);
5503ac56
EVH
335 err = -EIO;
336 goto error;
337 }
338
1b0a763b 339 tag = le16_to_cpu(*(__le16 *) (m->rbuf+5)); /* read tag */
5d385153
JP
340 p9_debug(P9_DEBUG_TRANS,
341 "mux %p pkt: size: %d bytes tag: %d\n", m, n, tag);
1b0a763b
EVH
342
343 m->req = p9_tag_lookup(m->client, tag);
1bab88b2
LI
344 if (!m->req || (m->req->status != REQ_STATUS_SENT &&
345 m->req->status != REQ_STATUS_FLSH)) {
5d385153
JP
346 p9_debug(P9_DEBUG_ERROR, "Unexpected packet tag %d\n",
347 tag);
1b0a763b
EVH
348 err = -EIO;
349 goto error;
350 }
351
352 if (m->req->rc == NULL) {
353 m->req->rc = kmalloc(sizeof(struct p9_fcall) +
eeff66ef 354 m->client->msize, GFP_NOFS);
1b0a763b
EVH
355 if (!m->req->rc) {
356 m->req = NULL;
357 err = -ENOMEM;
358 goto error;
359 }
360 }
361 m->rbuf = (char *)m->req->rc + sizeof(struct p9_fcall);
362 memcpy(m->rbuf, m->tmp_buf, m->rsize);
363 m->rsize = n;
364 }
5503ac56 365
1b0a763b
EVH
366 /* not an else because some packets (like clunk) have no payload */
367 if ((m->req) && (m->rpos == m->rsize)) { /* packet is read in */
5d385153 368 p9_debug(P9_DEBUG_TRANS, "got new packet\n");
7eb923b8 369 spin_lock(&m->client->lock);
1bab88b2
LI
370 if (m->req->status != REQ_STATUS_ERROR)
371 m->req->status = REQ_STATUS_RCVD;
91b8534f 372 list_del(&m->req->req_list);
7eb923b8 373 spin_unlock(&m->client->lock);
91b8534f 374 p9_client_cb(m->client, m->req);
1b0a763b
EVH
375 m->rbuf = NULL;
376 m->rpos = 0;
377 m->rsize = 0;
1b0a763b 378 m->req = NULL;
5503ac56
EVH
379 }
380
0462194d
SD
381end_clear:
382 clear_bit(Rworksched, &m->wsched);
383
5503ac56
EVH
384 if (!list_empty(&m->req_list)) {
385 if (test_and_clear_bit(Rpending, &m->wsched))
386 n = POLLIN;
387 else
388 n = p9_fd_poll(m->client, NULL);
389
0462194d 390 if ((n & POLLIN) && !test_and_set_bit(Rworksched, &m->wsched)) {
5d385153 391 p9_debug(P9_DEBUG_TRANS, "sched read work %p\n", m);
61edeeed 392 schedule_work(&m->rq);
0462194d
SD
393 }
394 }
5503ac56
EVH
395
396 return;
5503ac56
EVH
397error:
398 p9_conn_cancel(m, err);
399 clear_bit(Rworksched, &m->wsched);
400}
401
402/**
403 * p9_fd_write - write to a socket
404 * @client: client instance
405 * @v: buffer to send data from
406 * @len: size of send buffer
ee443996 407 *
8a0dc95f 408 */
ee443996 409
5503ac56 410static int p9_fd_write(struct p9_client *client, void *v, int len)
8a0dc95f 411{
5503ac56
EVH
412 int ret;
413 mm_segment_t oldfs;
414 struct p9_trans_fd *ts = NULL;
8a0dc95f 415
5503ac56
EVH
416 if (client && client->status != Disconnected)
417 ts = client->trans;
8a0dc95f 418
5503ac56
EVH
419 if (!ts)
420 return -EREMOTEIO;
8a0dc95f 421
5503ac56 422 if (!(ts->wr->f_flags & O_NONBLOCK))
5d385153 423 p9_debug(P9_DEBUG_ERROR, "blocking write ...\n");
992b3f1d 424
5503ac56
EVH
425 oldfs = get_fs();
426 set_fs(get_ds());
427 /* The cast to a user pointer is valid due to the set_fs() */
e3db6cb4 428 ret = vfs_write(ts->wr, (__force void __user *)v, len, &ts->wr->f_pos);
5503ac56 429 set_fs(oldfs);
992b3f1d 430
5503ac56
EVH
431 if (ret <= 0 && ret != -ERESTARTSYS && ret != -EAGAIN)
432 client->status = Disconnected;
433 return ret;
8a0dc95f
EVH
434}
435
436/**
437 * p9_write_work - called when a transport can send some data
ee443996
EVH
438 * @work: container for work to be done
439 *
8a0dc95f 440 */
ee443996 441
8a0dc95f
EVH
442static void p9_write_work(struct work_struct *work)
443{
444 int n, err;
445 struct p9_conn *m;
673d62cd 446 struct p9_req_t *req;
8a0dc95f
EVH
447
448 m = container_of(work, struct p9_conn, wq);
449
450 if (m->err < 0) {
451 clear_bit(Wworksched, &m->wsched);
452 return;
453 }
454
455 if (!m->wsize) {
456 if (list_empty(&m->unsent_req_list)) {
457 clear_bit(Wworksched, &m->wsched);
458 return;
459 }
460
673d62cd
EVH
461 spin_lock(&m->client->lock);
462 req = list_entry(m->unsent_req_list.next, struct p9_req_t,
8a0dc95f 463 req_list);
673d62cd 464 req->status = REQ_STATUS_SENT;
5d385153 465 p9_debug(P9_DEBUG_TRANS, "move req %p\n", req);
8a0dc95f 466 list_move_tail(&req->req_list, &m->req_list);
8a0dc95f 467
673d62cd
EVH
468 m->wbuf = req->tc->sdata;
469 m->wsize = req->tc->size;
8a0dc95f 470 m->wpos = 0;
673d62cd 471 spin_unlock(&m->client->lock);
8a0dc95f
EVH
472 }
473
5d385153
JP
474 p9_debug(P9_DEBUG_TRANS, "mux %p pos %d size %d\n",
475 m, m->wpos, m->wsize);
8a0dc95f 476 clear_bit(Wpending, &m->wsched);
8b81ef58 477 err = p9_fd_write(m->client, m->wbuf + m->wpos, m->wsize - m->wpos);
5d385153 478 p9_debug(P9_DEBUG_TRANS, "mux %p sent %d bytes\n", m, err);
584a8c13
SD
479 if (err == -EAGAIN)
480 goto end_clear;
481
8a0dc95f
EVH
482
483 if (err < 0)
484 goto error;
485 else if (err == 0) {
486 err = -EREMOTEIO;
487 goto error;
488 }
489
490 m->wpos += err;
491 if (m->wpos == m->wsize)
492 m->wpos = m->wsize = 0;
493
584a8c13
SD
494end_clear:
495 clear_bit(Wworksched, &m->wsched);
496
1957b3a8 497 if (m->wsize || !list_empty(&m->unsent_req_list)) {
8a0dc95f
EVH
498 if (test_and_clear_bit(Wpending, &m->wsched))
499 n = POLLOUT;
500 else
8b81ef58 501 n = p9_fd_poll(m->client, NULL);
8a0dc95f 502
584a8c13
SD
503 if ((n & POLLOUT) &&
504 !test_and_set_bit(Wworksched, &m->wsched)) {
5d385153 505 p9_debug(P9_DEBUG_TRANS, "sched write work %p\n", m);
61edeeed 506 schedule_work(&m->wq);
584a8c13
SD
507 }
508 }
8a0dc95f
EVH
509
510 return;
511
512error:
513 p9_conn_cancel(m, err);
514 clear_bit(Wworksched, &m->wsched);
515}
516
95c96174 517static int p9_pollwake(wait_queue_t *wait, unsigned int mode, int sync, void *key)
8a0dc95f 518{
5503ac56
EVH
519 struct p9_poll_wait *pwait =
520 container_of(wait, struct p9_poll_wait, wait);
521 struct p9_conn *m = pwait->conn;
522 unsigned long flags;
8a0dc95f 523
5503ac56
EVH
524 spin_lock_irqsave(&p9_poll_lock, flags);
525 if (list_empty(&m->poll_pending_link))
526 list_add_tail(&m->poll_pending_link, &p9_poll_pending_list);
527 spin_unlock_irqrestore(&p9_poll_lock, flags);
8a0dc95f 528
aa70c585
TH
529 schedule_work(&p9_poll_work);
530 return 1;
8a0dc95f
EVH
531}
532
533/**
5503ac56
EVH
534 * p9_pollwait - add poll task to the wait queue
535 * @filp: file pointer being polled
536 * @wait_address: wait_q to block on
537 * @p: poll state
ee443996 538 *
5503ac56 539 * called by files poll operation to add v9fs-poll task to files wait queue
8a0dc95f 540 */
ee443996 541
5503ac56
EVH
542static void
543p9_pollwait(struct file *filp, wait_queue_head_t *wait_address, poll_table *p)
8a0dc95f 544{
5503ac56
EVH
545 struct p9_conn *m = container_of(p, struct p9_conn, pt);
546 struct p9_poll_wait *pwait = NULL;
547 int i;
8a0dc95f 548
5503ac56
EVH
549 for (i = 0; i < ARRAY_SIZE(m->poll_wait); i++) {
550 if (m->poll_wait[i].wait_addr == NULL) {
551 pwait = &m->poll_wait[i];
552 break;
8a0dc95f 553 }
8a0dc95f
EVH
554 }
555
5503ac56 556 if (!pwait) {
5d385153 557 p9_debug(P9_DEBUG_ERROR, "not enough wait_address slots\n");
8a0dc95f
EVH
558 return;
559 }
560
5503ac56
EVH
561 pwait->conn = m;
562 pwait->wait_addr = wait_address;
563 init_waitqueue_func_entry(&pwait->wait, p9_pollwake);
564 add_wait_queue(wait_address, &pwait->wait);
565}
8a0dc95f 566
5503ac56
EVH
567/**
568 * p9_conn_create - allocate and initialize the per-session mux data
569 * @client: client instance
570 *
571 * Note: Creates the polling task if this is the first session.
572 */
8a0dc95f 573
5503ac56
EVH
574static struct p9_conn *p9_conn_create(struct p9_client *client)
575{
95820a36 576 int n;
5503ac56 577 struct p9_conn *m;
8a0dc95f 578
5d385153 579 p9_debug(P9_DEBUG_TRANS, "client %p msize %d\n", client, client->msize);
5503ac56
EVH
580 m = kzalloc(sizeof(struct p9_conn), GFP_KERNEL);
581 if (!m)
582 return ERR_PTR(-ENOMEM);
8a0dc95f 583
5503ac56
EVH
584 INIT_LIST_HEAD(&m->mux_list);
585 m->client = client;
8a0dc95f 586
5503ac56
EVH
587 INIT_LIST_HEAD(&m->req_list);
588 INIT_LIST_HEAD(&m->unsent_req_list);
589 INIT_WORK(&m->rq, p9_read_work);
590 INIT_WORK(&m->wq, p9_write_work);
591 INIT_LIST_HEAD(&m->poll_pending_link);
592 init_poll_funcptr(&m->pt, p9_pollwait);
8a0dc95f 593
5503ac56
EVH
594 n = p9_fd_poll(client, &m->pt);
595 if (n & POLLIN) {
5d385153 596 p9_debug(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56
EVH
597 set_bit(Rpending, &m->wsched);
598 }
8a0dc95f 599
5503ac56 600 if (n & POLLOUT) {
5d385153 601 p9_debug(P9_DEBUG_TRANS, "mux %p can write\n", m);
5503ac56
EVH
602 set_bit(Wpending, &m->wsched);
603 }
604
5503ac56
EVH
605 return m;
606}
8a0dc95f 607
5503ac56
EVH
608/**
609 * p9_poll_mux - polls a mux and schedules read or write works if necessary
610 * @m: connection to poll
611 *
612 */
613
614static void p9_poll_mux(struct p9_conn *m)
615{
616 int n;
617
618 if (m->err < 0)
619 return;
620
621 n = p9_fd_poll(m->client, NULL);
622 if (n < 0 || n & (POLLERR | POLLHUP | POLLNVAL)) {
5d385153 623 p9_debug(P9_DEBUG_TRANS, "error mux %p err %d\n", m, n);
5503ac56
EVH
624 if (n >= 0)
625 n = -ECONNRESET;
626 p9_conn_cancel(m, n);
627 }
628
629 if (n & POLLIN) {
630 set_bit(Rpending, &m->wsched);
5d385153 631 p9_debug(P9_DEBUG_TRANS, "mux %p can read\n", m);
5503ac56 632 if (!test_and_set_bit(Rworksched, &m->wsched)) {
5d385153 633 p9_debug(P9_DEBUG_TRANS, "sched read work %p\n", m);
61edeeed 634 schedule_work(&m->rq);
5503ac56
EVH
635 }
636 }
8a0dc95f 637
5503ac56
EVH
638 if (n & POLLOUT) {
639 set_bit(Wpending, &m->wsched);
5d385153 640 p9_debug(P9_DEBUG_TRANS, "mux %p can write\n", m);
f64f9e71
JP
641 if ((m->wsize || !list_empty(&m->unsent_req_list)) &&
642 !test_and_set_bit(Wworksched, &m->wsched)) {
5d385153 643 p9_debug(P9_DEBUG_TRANS, "sched write work %p\n", m);
61edeeed 644 schedule_work(&m->wq);
5503ac56
EVH
645 }
646 }
8a0dc95f
EVH
647}
648
649/**
91b8534f 650 * p9_fd_request - send 9P request
8a0dc95f
EVH
651 * The function can sleep until the request is scheduled for sending.
652 * The function can be interrupted. Return from the function is not
91b8534f 653 * a guarantee that the request is sent successfully.
8a0dc95f 654 *
91b8534f
EVH
655 * @client: client instance
656 * @req: request to be sent
ee443996 657 *
8a0dc95f 658 */
ee443996 659
91b8534f 660static int p9_fd_request(struct p9_client *client, struct p9_req_t *req)
8a0dc95f
EVH
661{
662 int n;
91b8534f
EVH
663 struct p9_trans_fd *ts = client->trans;
664 struct p9_conn *m = ts->conn;
8a0dc95f 665
5d385153
JP
666 p9_debug(P9_DEBUG_TRANS, "mux %p task %p tcall %p id %d\n",
667 m, current, req->tc, req->tc->id);
8a0dc95f 668 if (m->err < 0)
91b8534f 669 return m->err;
8a0dc95f 670
91b8534f 671 spin_lock(&client->lock);
7eb923b8 672 req->status = REQ_STATUS_UNSENT;
8a0dc95f 673 list_add_tail(&req->req_list, &m->unsent_req_list);
91b8534f 674 spin_unlock(&client->lock);
8a0dc95f
EVH
675
676 if (test_and_clear_bit(Wpending, &m->wsched))
677 n = POLLOUT;
678 else
8b81ef58 679 n = p9_fd_poll(m->client, NULL);
8a0dc95f
EVH
680
681 if (n & POLLOUT && !test_and_set_bit(Wworksched, &m->wsched))
61edeeed 682 schedule_work(&m->wq);
8a0dc95f 683
91b8534f 684 return 0;
8a0dc95f
EVH
685}
686
91b8534f 687static int p9_fd_cancel(struct p9_client *client, struct p9_req_t *req)
8a0dc95f 688{
7eb923b8 689 int ret = 1;
8a0dc95f 690
5d385153 691 p9_debug(P9_DEBUG_TRANS, "client %p req %p\n", client, req);
8a0dc95f 692
91b8534f 693 spin_lock(&client->lock);
91b8534f 694
91b8534f 695 if (req->status == REQ_STATUS_UNSENT) {
1bab88b2 696 list_del(&req->req_list);
91b8534f 697 req->status = REQ_STATUS_FLSHD;
7eb923b8 698 ret = 0;
1bab88b2
LI
699 } else if (req->status == REQ_STATUS_SENT)
700 req->status = REQ_STATUS_FLSH;
8a0dc95f 701
7eb923b8
EVH
702 spin_unlock(&client->lock);
703
704 return ret;
8a0dc95f
EVH
705}
706
a80d923e 707/**
0e15597e
AK
708 * parse_opts - parse mount options into p9_fd_opts structure
709 * @params: options string passed from mount
710 * @opts: fd transport-specific structure to parse options into
a80d923e 711 *
bb8ffdfc 712 * Returns 0 upon success, -ERRNO upon failure
a80d923e 713 */
bd238fb4 714
bb8ffdfc 715static int parse_opts(char *params, struct p9_fd_opts *opts)
bd238fb4 716{
a80d923e
EVH
717 char *p;
718 substring_t args[MAX_OPT_ARGS];
719 int option;
d8c8a9e3 720 char *options, *tmp_options;
bd238fb4 721
a80d923e
EVH
722 opts->port = P9_PORT;
723 opts->rfd = ~0;
724 opts->wfd = ~0;
bd238fb4 725
bb8ffdfc
EVH
726 if (!params)
727 return 0;
728
d8c8a9e3
EVH
729 tmp_options = kstrdup(params, GFP_KERNEL);
730 if (!tmp_options) {
5d385153
JP
731 p9_debug(P9_DEBUG_ERROR,
732 "failed to allocate copy of option string\n");
bb8ffdfc
EVH
733 return -ENOMEM;
734 }
d8c8a9e3 735 options = tmp_options;
bd238fb4 736
a80d923e
EVH
737 while ((p = strsep(&options, ",")) != NULL) {
738 int token;
bb8ffdfc 739 int r;
a80d923e
EVH
740 if (!*p)
741 continue;
742 token = match_token(p, tokens, args);
15da4b16
AK
743 if (token != Opt_err) {
744 r = match_int(&args[0], &option);
745 if (r < 0) {
5d385153
JP
746 p9_debug(P9_DEBUG_ERROR,
747 "integer field, but no integer?\n");
15da4b16
AK
748 continue;
749 }
a80d923e
EVH
750 }
751 switch (token) {
752 case Opt_port:
753 opts->port = option;
754 break;
755 case Opt_rfdno:
756 opts->rfd = option;
757 break;
758 case Opt_wfdno:
759 opts->wfd = option;
760 break;
761 default:
762 continue;
763 }
bd238fb4 764 }
d8c8a9e3
EVH
765
766 kfree(tmp_options);
bb8ffdfc 767 return 0;
bd238fb4 768}
bd238fb4 769
8b81ef58 770static int p9_fd_open(struct p9_client *client, int rfd, int wfd)
bd238fb4 771{
a80d923e
EVH
772 struct p9_trans_fd *ts = kmalloc(sizeof(struct p9_trans_fd),
773 GFP_KERNEL);
774 if (!ts)
775 return -ENOMEM;
bd238fb4 776
a80d923e
EVH
777 ts->rd = fget(rfd);
778 ts->wr = fget(wfd);
779 if (!ts->rd || !ts->wr) {
780 if (ts->rd)
781 fput(ts->rd);
782 if (ts->wr)
783 fput(ts->wr);
784 kfree(ts);
785 return -EIO;
bd238fb4
LI
786 }
787
8b81ef58
EVH
788 client->trans = ts;
789 client->status = Connected;
bd238fb4 790
a80d923e 791 return 0;
bd238fb4 792}
bd238fb4 793
8b81ef58 794static int p9_socket_open(struct p9_client *client, struct socket *csocket)
bd238fb4 795{
6b18662e
AV
796 struct p9_trans_fd *p;
797 int ret, fd;
798
799 p = kmalloc(sizeof(struct p9_trans_fd), GFP_KERNEL);
800 if (!p)
801 return -ENOMEM;
bd238fb4
LI
802
803 csocket->sk->sk_allocation = GFP_NOIO;
a677a039 804 fd = sock_map_fd(csocket, 0);
bd238fb4 805 if (fd < 0) {
5d385153
JP
806 pr_err("%s (%d): failed to map fd\n",
807 __func__, task_pid_nr(current));
6b18662e
AV
808 sock_release(csocket);
809 kfree(p);
bd238fb4
LI
810 return fd;
811 }
812
6b18662e
AV
813 get_file(csocket->file);
814 get_file(csocket->file);
815 p->wr = p->rd = csocket->file;
816 client->trans = p;
817 client->status = Connected;
818
819 sys_close(fd); /* still racy */
820
821 p->rd->f_flags |= O_NONBLOCK;
822
823 p->conn = p9_conn_create(client);
824 if (IS_ERR(p->conn)) {
825 ret = PTR_ERR(p->conn);
826 p->conn = NULL;
827 kfree(p);
828 sockfd_put(csocket);
bd238fb4
LI
829 sockfd_put(csocket);
830 return ret;
831 }
bd238fb4
LI
832 return 0;
833}
834
bd238fb4 835/**
5503ac56
EVH
836 * p9_mux_destroy - cancels all pending requests and frees mux resources
837 * @m: mux to destroy
bd238fb4
LI
838 *
839 */
ee443996 840
5503ac56 841static void p9_conn_destroy(struct p9_conn *m)
bd238fb4 842{
5d385153
JP
843 p9_debug(P9_DEBUG_TRANS, "mux %p prev %p next %p\n",
844 m, m->mux_list.prev, m->mux_list.next);
bd238fb4 845
5503ac56
EVH
846 p9_mux_poll_stop(m);
847 cancel_work_sync(&m->rq);
848 cancel_work_sync(&m->wq);
bd238fb4 849
5503ac56 850 p9_conn_cancel(m, -ECONNRESET);
bd238fb4 851
5503ac56 852 m->client = NULL;
5503ac56 853 kfree(m);
bd238fb4
LI
854}
855
856/**
8b81ef58
EVH
857 * p9_fd_close - shutdown file descriptor transport
858 * @client: client instance
bd238fb4
LI
859 *
860 */
ee443996 861
8b81ef58 862static void p9_fd_close(struct p9_client *client)
bd238fb4
LI
863{
864 struct p9_trans_fd *ts;
865
8b81ef58 866 if (!client)
bd238fb4
LI
867 return;
868
8b81ef58 869 ts = client->trans;
bd238fb4
LI
870 if (!ts)
871 return;
872
8b81ef58
EVH
873 client->status = Disconnected;
874
8a0dc95f
EVH
875 p9_conn_destroy(ts->conn);
876
bd238fb4
LI
877 if (ts->rd)
878 fput(ts->rd);
879 if (ts->wr)
880 fput(ts->wr);
8b81ef58 881
bd238fb4
LI
882 kfree(ts);
883}
884
887b3ece
EVH
/*
 * valid_ipaddr4 - check that a string starts with a dotted-quad IPv4 address
 * @buf: NUL-terminated string to check
 *
 * Each of the four components must parse as a decimal integer in the range
 * 0..255.  "%d" happily accepts a leading minus sign, so the lower bound has
 * to be checked explicitly.
 *
 * Returns 0 if the address is acceptable, -EINVAL otherwise.
 *
 * stolen from NFS - maybe should be made a generic function?
 */
static inline int valid_ipaddr4(const char *buf)
{
	int rc, count, in[4];

	rc = sscanf(buf, "%d.%d.%d.%d", &in[0], &in[1], &in[2], &in[3]);
	if (rc != 4)
		return -EINVAL;
	for (count = 0; count < 4; count++) {
		if (in[count] < 0 || in[count] > 255)
			return -EINVAL;
	}
	return 0;
}
901
8b81ef58
EVH
902static int
903p9_fd_create_tcp(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
904{
905 int err;
a80d923e
EVH
906 struct socket *csocket;
907 struct sockaddr_in sin_server;
908 struct p9_fd_opts opts;
909
bb8ffdfc
EVH
910 err = parse_opts(args, &opts);
911 if (err < 0)
8b81ef58 912 return err;
a80d923e 913
887b3ece 914 if (valid_ipaddr4(addr) < 0)
8b81ef58 915 return -EINVAL;
887b3ece 916
a80d923e 917 csocket = NULL;
a80d923e
EVH
918
919 sin_server.sin_family = AF_INET;
920 sin_server.sin_addr.s_addr = in_aton(addr);
921 sin_server.sin_port = htons(opts.port);
e75762fd
RL
922 err = __sock_create(read_pnet(&current->nsproxy->net_ns), PF_INET,
923 SOCK_STREAM, IPPROTO_TCP, &csocket, 1);
6b18662e 924 if (err) {
5d385153
JP
925 pr_err("%s (%d): problem creating socket\n",
926 __func__, task_pid_nr(current));
6b18662e 927 return err;
a80d923e
EVH
928 }
929
930 err = csocket->ops->connect(csocket,
931 (struct sockaddr *)&sin_server,
932 sizeof(struct sockaddr_in), 0);
933 if (err < 0) {
5d385153
JP
934 pr_err("%s (%d): problem connecting socket to %s\n",
935 __func__, task_pid_nr(current), addr);
a80d923e 936 sock_release(csocket);
6b18662e
AV
937 return err;
938 }
a80d923e 939
6b18662e 940 return p9_socket_open(client, csocket);
a80d923e
EVH
941}
942
8b81ef58
EVH
943static int
944p9_fd_create_unix(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
945{
946 int err;
947 struct socket *csocket;
948 struct sockaddr_un sun_server;
a80d923e
EVH
949
950 csocket = NULL;
a80d923e 951
cff6b8a9 952 if (strlen(addr) >= UNIX_PATH_MAX) {
5d385153
JP
953 pr_err("%s (%d): address too long: %s\n",
954 __func__, task_pid_nr(current), addr);
6b18662e 955 return -ENAMETOOLONG;
a80d923e
EVH
956 }
957
958 sun_server.sun_family = PF_UNIX;
959 strcpy(sun_server.sun_path, addr);
e75762fd
RL
960 err = __sock_create(read_pnet(&current->nsproxy->net_ns), PF_UNIX,
961 SOCK_STREAM, 0, &csocket, 1);
6b18662e 962 if (err < 0) {
5d385153
JP
963 pr_err("%s (%d): problem creating socket\n",
964 __func__, task_pid_nr(current));
965
6b18662e
AV
966 return err;
967 }
a80d923e
EVH
968 err = csocket->ops->connect(csocket, (struct sockaddr *)&sun_server,
969 sizeof(struct sockaddr_un) - 1, 0);
970 if (err < 0) {
5d385153
JP
971 pr_err("%s (%d): problem connecting socket: %s: %d\n",
972 __func__, task_pid_nr(current), addr, err);
a80d923e 973 sock_release(csocket);
6b18662e
AV
974 return err;
975 }
a80d923e 976
6b18662e 977 return p9_socket_open(client, csocket);
a80d923e
EVH
978}
979
8b81ef58
EVH
980static int
981p9_fd_create(struct p9_client *client, const char *addr, char *args)
a80d923e
EVH
982{
983 int err;
a80d923e 984 struct p9_fd_opts opts;
6b18662e 985 struct p9_trans_fd *p;
a80d923e
EVH
986
987 parse_opts(args, &opts);
988
989 if (opts.rfd == ~0 || opts.wfd == ~0) {
5d385153 990 pr_err("Insufficient options for proto=fd\n");
8b81ef58 991 return -ENOPROTOOPT;
a80d923e
EVH
992 }
993
8b81ef58 994 err = p9_fd_open(client, opts.rfd, opts.wfd);
a80d923e 995 if (err < 0)
6b18662e 996 return err;
a80d923e 997
8b81ef58
EVH
998 p = (struct p9_trans_fd *) client->trans;
999 p->conn = p9_conn_create(client);
8a0dc95f
EVH
1000 if (IS_ERR(p->conn)) {
1001 err = PTR_ERR(p->conn);
1002 p->conn = NULL;
6b18662e
AV
1003 fput(p->rd);
1004 fput(p->wr);
1005 return err;
8a0dc95f
EVH
1006 }
1007
8b81ef58 1008 return 0;
a80d923e
EVH
1009}
1010
1011static struct p9_trans_module p9_tcp_trans = {
1012 .name = "tcp",
1013 .maxsize = MAX_SOCK_BUF,
1014 .def = 1,
8b81ef58
EVH
1015 .create = p9_fd_create_tcp,
1016 .close = p9_fd_close,
91b8534f
EVH
1017 .request = p9_fd_request,
1018 .cancel = p9_fd_cancel,
72029fe8 1019 .owner = THIS_MODULE,
a80d923e
EVH
1020};
1021
1022static struct p9_trans_module p9_unix_trans = {
1023 .name = "unix",
1024 .maxsize = MAX_SOCK_BUF,
1025 .def = 0,
8b81ef58
EVH
1026 .create = p9_fd_create_unix,
1027 .close = p9_fd_close,
91b8534f
EVH
1028 .request = p9_fd_request,
1029 .cancel = p9_fd_cancel,
72029fe8 1030 .owner = THIS_MODULE,
a80d923e
EVH
1031};
1032
1033static struct p9_trans_module p9_fd_trans = {
1034 .name = "fd",
1035 .maxsize = MAX_SOCK_BUF,
1036 .def = 0,
8b81ef58
EVH
1037 .create = p9_fd_create,
1038 .close = p9_fd_close,
91b8534f
EVH
1039 .request = p9_fd_request,
1040 .cancel = p9_fd_cancel,
72029fe8 1041 .owner = THIS_MODULE,
a80d923e
EVH
1042};
1043
5503ac56
EVH
1044/**
1045 * p9_poll_proc - poll worker thread
1046 * @a: thread state and arguments
1047 *
1048 * polls all v9fs transports for new events and queues the appropriate
1049 * work to the work queue
1050 *
1051 */
1052
aa70c585 1053static void p9_poll_workfn(struct work_struct *work)
5503ac56
EVH
1054{
1055 unsigned long flags;
1056
5d385153 1057 p9_debug(P9_DEBUG_TRANS, "start %p\n", current);
aa70c585 1058
5503ac56
EVH
1059 spin_lock_irqsave(&p9_poll_lock, flags);
1060 while (!list_empty(&p9_poll_pending_list)) {
1061 struct p9_conn *conn = list_first_entry(&p9_poll_pending_list,
1062 struct p9_conn,
1063 poll_pending_link);
1064 list_del_init(&conn->poll_pending_link);
1065 spin_unlock_irqrestore(&p9_poll_lock, flags);
1066
1067 p9_poll_mux(conn);
1068
1069 spin_lock_irqsave(&p9_poll_lock, flags);
1070 }
1071 spin_unlock_irqrestore(&p9_poll_lock, flags);
1072
5d385153 1073 p9_debug(P9_DEBUG_TRANS, "finish\n");
5503ac56
EVH
1074}
1075
887b3ece 1076int p9_trans_fd_init(void)
a80d923e
EVH
1077{
1078 v9fs_register_trans(&p9_tcp_trans);
1079 v9fs_register_trans(&p9_unix_trans);
1080 v9fs_register_trans(&p9_fd_trans);
1081
3387b804 1082 return 0;
a80d923e 1083}
72029fe8
TH
1084
1085void p9_trans_fd_exit(void)
1086{
aa70c585 1087 flush_work_sync(&p9_poll_work);
72029fe8
TH
1088 v9fs_unregister_trans(&p9_tcp_trans);
1089 v9fs_unregister_trans(&p9_unix_trans);
1090 v9fs_unregister_trans(&p9_fd_trans);
1091}
This page took 0.461817 seconds and 5 git commands to generate.