SUNRPC: Call the default socket callbacks instead of open coding
[deliverable/linux.git] / net / sunrpc / svcsock.c
CommitLineData
1da177e4
LT
1/*
2 * linux/net/sunrpc/svcsock.c
3 *
4 * These are the RPC server socket internals.
5 *
6 * The server scheduling algorithm does not always distribute the load
7 * evenly when servicing a single client. May need to modify the
f6150c3c 8 * svc_xprt_enqueue procedure...
1da177e4
LT
9 *
10 * TCP support is largely untested and may be a little slow. The problem
11 * is that we currently do two separate recvfrom's, one for the 4-byte
12 * record length, and the second for the actual record. This could possibly
13 * be improved by always reading a minimum size of around 100 bytes and
14 * tucking any superfluous bytes away in a temporary store. Still, that
15 * leaves write requests out in the rain. An alternative may be to peek at
16 * the first skb in the queue, and if it matches the next TCP sequence
17 * number, to extract the record marker. Yuck.
18 *
19 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
20 */
21
172589cc 22#include <linux/kernel.h>
1da177e4 23#include <linux/sched.h>
3a9a231d 24#include <linux/module.h>
1da177e4
LT
25#include <linux/errno.h>
26#include <linux/fcntl.h>
27#include <linux/net.h>
28#include <linux/in.h>
29#include <linux/inet.h>
30#include <linux/udp.h>
91483c4b 31#include <linux/tcp.h>
1da177e4
LT
32#include <linux/unistd.h>
33#include <linux/slab.h>
34#include <linux/netdevice.h>
35#include <linux/skbuff.h>
b41b66d6 36#include <linux/file.h>
7dfb7103 37#include <linux/freezer.h>
1da177e4
LT
38#include <net/sock.h>
39#include <net/checksum.h>
40#include <net/ip.h>
b92503b2 41#include <net/ipv6.h>
b7872fe8 42#include <net/tcp.h>
c752f073 43#include <net/tcp_states.h>
1da177e4
LT
44#include <asm/uaccess.h>
45#include <asm/ioctls.h>
22911fc5 46#include <trace/events/skb.h>
1da177e4
LT
47
48#include <linux/sunrpc/types.h>
ad06e4bd 49#include <linux/sunrpc/clnt.h>
1da177e4 50#include <linux/sunrpc/xdr.h>
c0401ea0 51#include <linux/sunrpc/msg_prot.h>
1da177e4
LT
52#include <linux/sunrpc/svcsock.h>
53#include <linux/sunrpc/stats.h>
4cfc7e60 54#include <linux/sunrpc/xprt.h>
1da177e4 55
177e4f99
HS
56#include "sunrpc.h"
57
360d8738 58#define RPCDBG_FACILITY RPCDBG_SVCXPRT
1da177e4
LT
59
60
/* Forward declarations. */
static struct svc_sock	*svc_setup_socket(struct svc_serv *, struct socket *,
					  int flags);
static int		svc_udp_recvfrom(struct svc_rqst *);
static int		svc_udp_sendto(struct svc_rqst *);
static void		svc_sock_detach(struct svc_xprt *);
static void		svc_tcp_sock_detach(struct svc_xprt *);
static void		svc_sock_free(struct svc_xprt *);

static struct svc_xprt	*svc_create_socket(struct svc_serv *, int,
					   struct net *, struct sockaddr *,
					   int, int);
#if defined(CONFIG_SUNRPC_BACKCHANNEL)
/* Back-channel variants, only built with CONFIG_SUNRPC_BACKCHANNEL. */
static struct svc_xprt	*svc_bc_create_socket(struct svc_serv *, int,
					      struct net *, struct sockaddr *,
					      int, int);
static void		svc_bc_sock_free(struct svc_xprt *xprt);
#endif /* CONFIG_SUNRPC_BACKCHANNEL */
1f11a034 78
ed07536e
PZ
#ifdef CONFIG_DEBUG_LOCK_ALLOC
/* Lock class keys, indexed by address family: [0] AF_INET, [1] AF_INET6. */
static struct lock_class_key svc_key[2];
static struct lock_class_key svc_slock_key[2];

/*
 * Re-initialise the lock classes of the sock behind @sock using
 * NFSD-specific class names. Only AF_INET and AF_INET6 are handled;
 * any other family hits BUG().
 */
static void svc_reclassify_socket(struct socket *sock)
{
	struct sock *sk = sock->sk;

	/* Warn once and leave the socket untouched if this is not allowed. */
	if (WARN_ON_ONCE(!sock_allow_reclassification(sk)))
		return;

	if (sk->sk_family == AF_INET) {
		sock_lock_init_class_and_name(sk, "slock-AF_INET-NFSD",
					      &svc_slock_key[0],
					      "sk_xprt.xpt_lock-AF_INET-NFSD",
					      &svc_key[0]);
	} else if (sk->sk_family == AF_INET6) {
		sock_lock_init_class_and_name(sk, "slock-AF_INET6-NFSD",
					      &svc_slock_key[1],
					      "sk_xprt.xpt_lock-AF_INET6-NFSD",
					      &svc_key[1]);
	} else {
		BUG();
	}
}
#else
/* Nothing to do when CONFIG_DEBUG_LOCK_ALLOC is not set. */
static void svc_reclassify_socket(struct socket *sock)
{
}
#endif
114
1da177e4
LT
115/*
116 * Release an skbuff after use
117 */
5148bf4e 118static void svc_release_skb(struct svc_rqst *rqstp)
1da177e4 119{
5148bf4e 120 struct sk_buff *skb = rqstp->rq_xprt_ctxt;
1da177e4
LT
121
122 if (skb) {
57b1d3ba
TT
123 struct svc_sock *svsk =
124 container_of(rqstp->rq_xprt, struct svc_sock, sk_xprt);
5148bf4e 125 rqstp->rq_xprt_ctxt = NULL;
1da177e4
LT
126
127 dprintk("svc: service %p, releasing skb %p\n", rqstp, skb);
9d410c79 128 skb_free_datagram_locked(svsk->sk_sk, skb);
1da177e4 129 }
1da177e4
LT
130}
131
b92503b2
CL
132union svc_pktinfo_u {
133 struct in_pktinfo pkti;
b92503b2 134 struct in6_pktinfo pkti6;
b92503b2 135};
bc375ea7
DM
136#define SVC_PKTINFO_SPACE \
137 CMSG_SPACE(sizeof(union svc_pktinfo_u))
b92503b2
CL
138
139static void svc_set_cmsg_data(struct svc_rqst *rqstp, struct cmsghdr *cmh)
140{
57b1d3ba
TT
141 struct svc_sock *svsk =
142 container_of(rqstp->rq_xprt, struct svc_sock, sk_xprt);
143 switch (svsk->sk_sk->sk_family) {
b92503b2
CL
144 case AF_INET: {
145 struct in_pktinfo *pki = CMSG_DATA(cmh);
146
147 cmh->cmsg_level = SOL_IP;
148 cmh->cmsg_type = IP_PKTINFO;
149 pki->ipi_ifindex = 0;
849a1cf1
MJ
150 pki->ipi_spec_dst.s_addr =
151 svc_daddr_in(rqstp)->sin_addr.s_addr;
b92503b2
CL
152 cmh->cmsg_len = CMSG_LEN(sizeof(*pki));
153 }
154 break;
5a05ed73 155
b92503b2
CL
156 case AF_INET6: {
157 struct in6_pktinfo *pki = CMSG_DATA(cmh);
849a1cf1 158 struct sockaddr_in6 *daddr = svc_daddr_in6(rqstp);
b92503b2
CL
159
160 cmh->cmsg_level = SOL_IPV6;
161 cmh->cmsg_type = IPV6_PKTINFO;
849a1cf1 162 pki->ipi6_ifindex = daddr->sin6_scope_id;
4e3fd7a0 163 pki->ipi6_addr = daddr->sin6_addr;
b92503b2
CL
164 cmh->cmsg_len = CMSG_LEN(sizeof(*pki));
165 }
166 break;
b92503b2 167 }
b92503b2
CL
168}
169
1da177e4 170/*
4cfc7e60 171 * send routine intended to be shared by the fore- and back-channel
1da177e4 172 */
4cfc7e60
RI
173int svc_send_common(struct socket *sock, struct xdr_buf *xdr,
174 struct page *headpage, unsigned long headoffset,
175 struct page *tailpage, unsigned long tailoffset)
1da177e4 176{
1da177e4
LT
177 int result;
178 int size;
179 struct page **ppage = xdr->pages;
180 size_t base = xdr->page_base;
181 unsigned int pglen = xdr->page_len;
226453d8 182 unsigned int flags = MSG_MORE | MSG_SENDPAGE_NOTLAST;
4cfc7e60
RI
183 int slen;
184 int len = 0;
1da177e4
LT
185
186 slen = xdr->len;
187
1da177e4
LT
188 /* send head */
189 if (slen == xdr->head[0].iov_len)
190 flags = 0;
4cfc7e60 191 len = kernel_sendpage(sock, headpage, headoffset,
44524359 192 xdr->head[0].iov_len, flags);
1da177e4
LT
193 if (len != xdr->head[0].iov_len)
194 goto out;
195 slen -= xdr->head[0].iov_len;
196 if (slen == 0)
197 goto out;
198
199 /* send page data */
200 size = PAGE_SIZE - base < pglen ? PAGE_SIZE - base : pglen;
201 while (pglen > 0) {
202 if (slen == size)
203 flags = 0;
e6242e92 204 result = kernel_sendpage(sock, *ppage, base, size, flags);
1da177e4
LT
205 if (result > 0)
206 len += result;
207 if (result != size)
208 goto out;
209 slen -= size;
210 pglen -= size;
211 size = PAGE_SIZE < pglen ? PAGE_SIZE : pglen;
212 base = 0;
213 ppage++;
214 }
4cfc7e60 215
1da177e4
LT
216 /* send tail */
217 if (xdr->tail[0].iov_len) {
4cfc7e60
RI
218 result = kernel_sendpage(sock, tailpage, tailoffset,
219 xdr->tail[0].iov_len, 0);
1da177e4
LT
220 if (result > 0)
221 len += result;
222 }
4cfc7e60
RI
223
224out:
225 return len;
226}
227
228
229/*
230 * Generic sendto routine
231 */
232static int svc_sendto(struct svc_rqst *rqstp, struct xdr_buf *xdr)
233{
234 struct svc_sock *svsk =
235 container_of(rqstp->rq_xprt, struct svc_sock, sk_xprt);
236 struct socket *sock = svsk->sk_sock;
237 union {
238 struct cmsghdr hdr;
239 long all[SVC_PKTINFO_SPACE / sizeof(long)];
240 } buffer;
241 struct cmsghdr *cmh = &buffer.hdr;
242 int len = 0;
243 unsigned long tailoff;
244 unsigned long headoff;
245 RPC_IFDEBUG(char buf[RPC_MAX_ADDRBUFLEN]);
246
247 if (rqstp->rq_prot == IPPROTO_UDP) {
248 struct msghdr msg = {
249 .msg_name = &rqstp->rq_addr,
250 .msg_namelen = rqstp->rq_addrlen,
251 .msg_control = cmh,
252 .msg_controllen = sizeof(buffer),
253 .msg_flags = MSG_MORE,
254 };
255
256 svc_set_cmsg_data(rqstp, cmh);
257
d8725c86 258 if (sock_sendmsg(sock, &msg) < 0)
4cfc7e60
RI
259 goto out;
260 }
261
262 tailoff = ((unsigned long)xdr->tail[0].iov_base) & (PAGE_SIZE-1);
263 headoff = 0;
264 len = svc_send_common(sock, xdr, rqstp->rq_respages[0], headoff,
265 rqstp->rq_respages[0], tailoff);
266
1da177e4 267out:
ad06e4bd 268 dprintk("svc: socket %p sendto([%p %Zu... ], %d) = %d (addr %s)\n",
57b1d3ba 269 svsk, xdr->head[0].iov_base, xdr->head[0].iov_len,
ad06e4bd 270 xdr->len, len, svc_print_addr(rqstp, buf, sizeof(buf)));
1da177e4
LT
271
272 return len;
273}
274
80212d59
N
275/*
276 * Report socket names for nfsdfs
277 */
e7942b9f 278static int svc_one_sock_name(struct svc_sock *svsk, char *buf, int remaining)
80212d59 279{
017cb47f
CL
280 const struct sock *sk = svsk->sk_sk;
281 const char *proto_name = sk->sk_protocol == IPPROTO_UDP ?
282 "udp" : "tcp";
80212d59
N
283 int len;
284
017cb47f 285 switch (sk->sk_family) {
e7942b9f
CL
286 case PF_INET:
287 len = snprintf(buf, remaining, "ipv4 %s %pI4 %d\n",
017cb47f 288 proto_name,
c720c7e8
ED
289 &inet_sk(sk)->inet_rcv_saddr,
290 inet_sk(sk)->inet_num);
80212d59 291 break;
c2bb06db 292#if IS_ENABLED(CONFIG_IPV6)
58de2f86
CL
293 case PF_INET6:
294 len = snprintf(buf, remaining, "ipv6 %s %pI6 %d\n",
017cb47f 295 proto_name,
efe4208f 296 &sk->sk_v6_rcv_saddr,
c720c7e8 297 inet_sk(sk)->inet_num);
80212d59 298 break;
c2bb06db 299#endif
80212d59 300 default:
e7942b9f 301 len = snprintf(buf, remaining, "*unknown-%d*\n",
017cb47f 302 sk->sk_family);
80212d59 303 }
e7942b9f
CL
304
305 if (len >= remaining) {
306 *buf = '\0';
307 return -ENAMETOOLONG;
80212d59
N
308 }
309 return len;
310}
311
1da177e4
LT
312/*
313 * Generic recvfrom routine.
314 */
0f0257ea
TT
315static int svc_recvfrom(struct svc_rqst *rqstp, struct kvec *iov, int nr,
316 int buflen)
1da177e4 317{
57b1d3ba
TT
318 struct svc_sock *svsk =
319 container_of(rqstp->rq_xprt, struct svc_sock, sk_xprt);
1ba95105
CL
320 struct msghdr msg = {
321 .msg_flags = MSG_DONTWAIT,
322 };
323 int len;
1da177e4 324
260c1d12
TT
325 rqstp->rq_xprt_hlen = 0;
326
f8d1ff47 327 clear_bit(XPT_DATA, &svsk->sk_xprt.xpt_flags);
1ba95105
CL
328 len = kernel_recvmsg(svsk->sk_sock, &msg, iov, nr, buflen,
329 msg.msg_flags);
f8d1ff47
TM
330 /* If we read a full record, then assume there may be more
331 * data to read (stream based sockets only!)
332 */
333 if (len == buflen)
334 set_bit(XPT_DATA, &svsk->sk_xprt.xpt_flags);
1da177e4 335
1da177e4 336 dprintk("svc: socket %p recvfrom(%p, %Zu) = %d\n",
1ba95105 337 svsk, iov[0].iov_base, iov[0].iov_len, len);
1da177e4
LT
338 return len;
339}
340
31d68ef6
BF
341static int svc_partial_recvfrom(struct svc_rqst *rqstp,
342 struct kvec *iov, int nr,
343 int buflen, unsigned int base)
344{
345 size_t save_iovlen;
09acfea5 346 void *save_iovbase;
31d68ef6
BF
347 unsigned int i;
348 int ret;
349
350 if (base == 0)
351 return svc_recvfrom(rqstp, iov, nr, buflen);
352
353 for (i = 0; i < nr; i++) {
354 if (iov[i].iov_len > base)
355 break;
356 base -= iov[i].iov_len;
357 }
358 save_iovlen = iov[i].iov_len;
359 save_iovbase = iov[i].iov_base;
360 iov[i].iov_len -= base;
361 iov[i].iov_base += base;
362 ret = svc_recvfrom(rqstp, &iov[i], nr - i, buflen);
363 iov[i].iov_len = save_iovlen;
364 iov[i].iov_base = save_iovbase;
365 return ret;
366}
367
1da177e4
LT
368/*
369 * Set socket snd and rcv buffer lengths
370 */
0f0257ea
TT
371static void svc_sock_setbufsize(struct socket *sock, unsigned int snd,
372 unsigned int rcv)
1da177e4
LT
373{
374#if 0
375 mm_segment_t oldfs;
376 oldfs = get_fs(); set_fs(KERNEL_DS);
377 sock_setsockopt(sock, SOL_SOCKET, SO_SNDBUF,
378 (char*)&snd, sizeof(snd));
379 sock_setsockopt(sock, SOL_SOCKET, SO_RCVBUF,
380 (char*)&rcv, sizeof(rcv));
381#else
382 /* sock_setsockopt limits use to sysctl_?mem_max,
383 * which isn't acceptable. Until that is made conditional
384 * on not having CAP_SYS_RESOURCE or similar, we go direct...
385 * DaveM said I could!
386 */
387 lock_sock(sock->sk);
388 sock->sk->sk_sndbuf = snd * 2;
389 sock->sk->sk_rcvbuf = rcv * 2;
47fcb03f 390 sock->sk->sk_write_space(sock->sk);
1da177e4
LT
391 release_sock(sock->sk);
392#endif
393}
16e4d93f
CL
394
/* Return whether the request's source address uses a privileged port. */
static int svc_sock_secure_port(struct svc_rqst *rqstp)
{
	struct sockaddr *peer = svc_addr(rqstp);

	return svc_port_is_privileged(peer);
}
399
1da177e4
LT
400/*
401 * INET callback when data has been received on the socket.
402 */
fa9251af 403static void svc_data_ready(struct sock *sk)
1da177e4 404{
939bb7ef 405 struct svc_sock *svsk = (struct svc_sock *)sk->sk_user_data;
1da177e4 406
939bb7ef 407 if (svsk) {
676d2369
DM
408 dprintk("svc: socket %p(inet %p), busy=%d\n",
409 svsk, sk,
02fc6c36 410 test_bit(XPT_BUSY, &svsk->sk_xprt.xpt_flags));
fa9251af 411 svsk->sk_odata(sk);
02fc6c36 412 set_bit(XPT_DATA, &svsk->sk_xprt.xpt_flags);
f6150c3c 413 svc_xprt_enqueue(&svsk->sk_xprt);
939bb7ef 414 }
1da177e4
LT
415}
416
417/*
418 * INET callback when space is newly available on the socket.
419 */
0f0257ea 420static void svc_write_space(struct sock *sk)
1da177e4
LT
421{
422 struct svc_sock *svsk = (struct svc_sock *)(sk->sk_user_data);
423
424 if (svsk) {
425 dprintk("svc: socket %p(inet %p), write_space busy=%d\n",
02fc6c36 426 svsk, sk, test_bit(XPT_BUSY, &svsk->sk_xprt.xpt_flags));
fa9251af 427 svsk->sk_owspace(sk);
f6150c3c 428 svc_xprt_enqueue(&svsk->sk_xprt);
1da177e4 429 }
1da177e4
LT
430}
431
c7fb3f06
TM
432static int svc_tcp_has_wspace(struct svc_xprt *xprt)
433{
434 struct svc_sock *svsk = container_of(xprt, struct svc_sock, sk_xprt);
435 struct svc_serv *serv = svsk->sk_xprt.xpt_server;
436 int required;
437
438 if (test_bit(XPT_LISTENER, &xprt->xpt_flags))
439 return 1;
440 required = atomic_read(&xprt->xpt_reserved) + serv->sv_max_mesg;
441 if (sk_stream_wspace(svsk->sk_sk) >= required ||
442 (sk_stream_min_wspace(svsk->sk_sk) == 0 &&
443 atomic_read(&xprt->xpt_reserved) == 0))
444 return 1;
445 set_bit(SOCK_NOSPACE, &svsk->sk_sock->flags);
446 return 0;
447}
448
47fcb03f
TM
449static void svc_tcp_write_space(struct sock *sk)
450{
c7fb3f06 451 struct svc_sock *svsk = (struct svc_sock *)(sk->sk_user_data);
47fcb03f
TM
452 struct socket *sock = sk->sk_socket;
453
fa9251af
TM
454 if (!svsk)
455 return;
456
c7fb3f06
TM
457 if (!sk_stream_is_writeable(sk) || !sock)
458 return;
fa9251af 459 if (svc_tcp_has_wspace(&svsk->sk_xprt)) {
47fcb03f 460 clear_bit(SOCK_NOSPACE, &sock->flags);
fa9251af
TM
461 svc_write_space(sk);
462 }
47fcb03f
TM
463}
464
51877680
TM
465static void svc_tcp_adjust_wspace(struct svc_xprt *xprt)
466{
467 struct svc_sock *svsk = container_of(xprt, struct svc_sock, sk_xprt);
468
469 if (svc_tcp_has_wspace(xprt))
470 clear_bit(SOCK_NOSPACE, &svsk->sk_sock->flags);
471}
472
7702ce40
CL
473/*
474 * See net/ipv6/ip_sockglue.c : ip_cmsg_recv_pktinfo
475 */
476static int svc_udp_get_dest_address4(struct svc_rqst *rqstp,
477 struct cmsghdr *cmh)
478{
479 struct in_pktinfo *pki = CMSG_DATA(cmh);
849a1cf1
MJ
480 struct sockaddr_in *daddr = svc_daddr_in(rqstp);
481
7702ce40
CL
482 if (cmh->cmsg_type != IP_PKTINFO)
483 return 0;
849a1cf1
MJ
484
485 daddr->sin_family = AF_INET;
486 daddr->sin_addr.s_addr = pki->ipi_spec_dst.s_addr;
7702ce40
CL
487 return 1;
488}
489
490/*
73df66f8 491 * See net/ipv6/datagram.c : ip6_datagram_recv_ctl
7702ce40
CL
492 */
493static int svc_udp_get_dest_address6(struct svc_rqst *rqstp,
494 struct cmsghdr *cmh)
495{
496 struct in6_pktinfo *pki = CMSG_DATA(cmh);
849a1cf1
MJ
497 struct sockaddr_in6 *daddr = svc_daddr_in6(rqstp);
498
7702ce40
CL
499 if (cmh->cmsg_type != IPV6_PKTINFO)
500 return 0;
849a1cf1
MJ
501
502 daddr->sin6_family = AF_INET6;
4e3fd7a0 503 daddr->sin6_addr = pki->ipi6_addr;
849a1cf1 504 daddr->sin6_scope_id = pki->ipi6_ifindex;
7702ce40
CL
505 return 1;
506}
507
9dbc240f
TT
508/*
509 * Copy the UDP datagram's destination address to the rqstp structure.
510 * The 'destination' address in this case is the address to which the
511 * peer sent the datagram, i.e. our local address. For multihomed
512 * hosts, this can change from msg to msg. Note that only the IP
513 * address changes, the port number should remain the same.
514 */
7702ce40
CL
515static int svc_udp_get_dest_address(struct svc_rqst *rqstp,
516 struct cmsghdr *cmh)
95756482 517{
7702ce40
CL
518 switch (cmh->cmsg_level) {
519 case SOL_IP:
520 return svc_udp_get_dest_address4(rqstp, cmh);
521 case SOL_IPV6:
522 return svc_udp_get_dest_address6(rqstp, cmh);
95756482 523 }
7702ce40
CL
524
525 return 0;
95756482
CL
526}
527
1da177e4
LT
528/*
529 * Receive a datagram from a UDP socket.
530 */
0f0257ea 531static int svc_udp_recvfrom(struct svc_rqst *rqstp)
1da177e4 532{
57b1d3ba
TT
533 struct svc_sock *svsk =
534 container_of(rqstp->rq_xprt, struct svc_sock, sk_xprt);
bb5cf160 535 struct svc_serv *serv = svsk->sk_xprt.xpt_server;
1da177e4 536 struct sk_buff *skb;
bc375ea7
DM
537 union {
538 struct cmsghdr hdr;
539 long all[SVC_PKTINFO_SPACE / sizeof(long)];
540 } buffer;
541 struct cmsghdr *cmh = &buffer.hdr;
7a37f578
N
542 struct msghdr msg = {
543 .msg_name = svc_addr(rqstp),
544 .msg_control = cmh,
545 .msg_controllen = sizeof(buffer),
546 .msg_flags = MSG_DONTWAIT,
547 };
abc5c44d
CL
548 size_t len;
549 int err;
1da177e4 550
02fc6c36 551 if (test_and_clear_bit(XPT_CHNGBUF, &svsk->sk_xprt.xpt_flags))
1da177e4
LT
552 /* udp sockets need large rcvbuf as all pending
553 * requests are still in that buffer. sndbuf must
554 * also be large enough that there is enough space
3262c816
GB
555 * for one reply per thread. We count all threads
556 * rather than threads in a particular pool, which
557 * provides an upper bound on the number of threads
558 * which will access the socket.
1da177e4
LT
559 */
560 svc_sock_setbufsize(svsk->sk_sock,
c6b0a9f8
N
561 (serv->sv_nrthreads+3) * serv->sv_max_mesg,
562 (serv->sv_nrthreads+3) * serv->sv_max_mesg);
1da177e4 563
02fc6c36 564 clear_bit(XPT_DATA, &svsk->sk_xprt.xpt_flags);
05ed690e
N
565 skb = NULL;
566 err = kernel_recvmsg(svsk->sk_sock, &msg, NULL,
567 0, 0, MSG_PEEK | MSG_DONTWAIT);
568 if (err >= 0)
569 skb = skb_recv_datagram(svsk->sk_sk, 0, 1, &err);
570
571 if (skb == NULL) {
572 if (err != -EAGAIN) {
573 /* possibly an icmp error */
574 dprintk("svc: recvfrom returned error %d\n", -err);
02fc6c36 575 set_bit(XPT_DATA, &svsk->sk_xprt.xpt_flags);
1da177e4 576 }
9f9d2ebe 577 return 0;
1da177e4 578 }
9dbc240f 579 len = svc_addr_len(svc_addr(rqstp));
9dbc240f 580 rqstp->rq_addrlen = len;
b7aa0bf7
ED
581 if (skb->tstamp.tv64 == 0) {
582 skb->tstamp = ktime_get_real();
cca5172a 583 /* Don't enable netstamp, sunrpc doesn't
1da177e4
LT
584 need that much accuracy */
585 }
b7aa0bf7 586 svsk->sk_sk->sk_stamp = skb->tstamp;
02fc6c36 587 set_bit(XPT_DATA, &svsk->sk_xprt.xpt_flags); /* there may be more data... */
1da177e4 588
1da8c681 589 len = skb->len;
1da177e4
LT
590 rqstp->rq_arg.len = len;
591
95756482 592 rqstp->rq_prot = IPPROTO_UDP;
27459f09 593
7702ce40 594 if (!svc_udp_get_dest_address(rqstp, cmh)) {
e87cc472
JP
595 net_warn_ratelimited("svc: received unknown control message %d/%d; dropping RPC reply datagram\n",
596 cmh->cmsg_level, cmh->cmsg_type);
f23abfdb 597 goto out_free;
7a37f578 598 }
849a1cf1 599 rqstp->rq_daddrlen = svc_addr_len(svc_daddr(rqstp));
1da177e4
LT
600
601 if (skb_is_nonlinear(skb)) {
602 /* we have to copy */
603 local_bh_disable();
604 if (csum_partial_copy_to_xdr(&rqstp->rq_arg, skb)) {
605 local_bh_enable();
606 /* checksum error */
22911fc5 607 goto out_free;
1da177e4
LT
608 }
609 local_bh_enable();
9d410c79 610 skb_free_datagram_locked(svsk->sk_sk, skb);
1da177e4
LT
611 } else {
612 /* we can use it in-place */
1da8c681 613 rqstp->rq_arg.head[0].iov_base = skb->data;
1da177e4 614 rqstp->rq_arg.head[0].iov_len = len;
22911fc5
ED
615 if (skb_checksum_complete(skb))
616 goto out_free;
5148bf4e 617 rqstp->rq_xprt_ctxt = skb;
1da177e4
LT
618 }
619
620 rqstp->rq_arg.page_base = 0;
621 if (len <= rqstp->rq_arg.head[0].iov_len) {
622 rqstp->rq_arg.head[0].iov_len = len;
623 rqstp->rq_arg.page_len = 0;
44524359 624 rqstp->rq_respages = rqstp->rq_pages+1;
1da177e4
LT
625 } else {
626 rqstp->rq_arg.page_len = len - rqstp->rq_arg.head[0].iov_len;
44524359 627 rqstp->rq_respages = rqstp->rq_pages + 1 +
172589cc 628 DIV_ROUND_UP(rqstp->rq_arg.page_len, PAGE_SIZE);
1da177e4 629 }
afc59400 630 rqstp->rq_next_page = rqstp->rq_respages+1;
1da177e4
LT
631
632 if (serv->sv_stats)
633 serv->sv_stats->netudpcnt++;
634
635 return len;
f23abfdb
BF
636out_free:
637 trace_kfree_skb(skb, svc_udp_recvfrom);
638 skb_free_datagram_locked(svsk->sk_sk, skb);
639 return 0;
1da177e4
LT
640}
641
/*
 * Send the reply in rqstp->rq_res, retrying exactly once when the
 * first attempt reports -ECONNREFUSED.
 */
static int
svc_udp_sendto(struct svc_rqst *rqstp)
{
	int ret = svc_sendto(rqstp, &rqstp->rq_res);

	if (ret != -ECONNREFUSED)
		return ret;

	/* ICMP error on earlier request. */
	return svc_sendto(rqstp, &rqstp->rq_res);
}
654
e831fe65
TT
/* UDP reply-header hook: intentionally does nothing. */
static void svc_udp_prep_reply_hdr(struct svc_rqst *rqstp)
{
	return;
}
658
323bee32
TT
659static int svc_udp_has_wspace(struct svc_xprt *xprt)
660{
661 struct svc_sock *svsk = container_of(xprt, struct svc_sock, sk_xprt);
bb5cf160 662 struct svc_serv *serv = xprt->xpt_server;
323bee32
TT
663 unsigned long required;
664
665 /*
666 * Set the SOCK_NOSPACE flag before checking the available
667 * sock space.
668 */
669 set_bit(SOCK_NOSPACE, &svsk->sk_sock->flags);
7a90e8cc 670 required = atomic_read(&svsk->sk_xprt.xpt_reserved) + serv->sv_max_mesg;
323bee32
TT
671 if (required*2 > sock_wspace(svsk->sk_sk))
672 return 0;
673 clear_bit(SOCK_NOSPACE, &svsk->sk_sock->flags);
674 return 1;
675}
676
38a417cc
TT
677static struct svc_xprt *svc_udp_accept(struct svc_xprt *xprt)
678{
679 BUG();
680 return NULL;
681}
682
b700cbb1 683static struct svc_xprt *svc_udp_create(struct svc_serv *serv,
62832c03 684 struct net *net,
b700cbb1
TT
685 struct sockaddr *sa, int salen,
686 int flags)
687{
62832c03 688 return svc_create_socket(serv, IPPROTO_UDP, net, sa, salen, flags);
b700cbb1
TT
689}
690
360d8738 691static struct svc_xprt_ops svc_udp_ops = {
b700cbb1 692 .xpo_create = svc_udp_create,
5d137990
TT
693 .xpo_recvfrom = svc_udp_recvfrom,
694 .xpo_sendto = svc_udp_sendto,
5148bf4e 695 .xpo_release_rqst = svc_release_skb,
755cceab
TT
696 .xpo_detach = svc_sock_detach,
697 .xpo_free = svc_sock_free,
e831fe65 698 .xpo_prep_reply_hdr = svc_udp_prep_reply_hdr,
323bee32 699 .xpo_has_wspace = svc_udp_has_wspace,
38a417cc 700 .xpo_accept = svc_udp_accept,
16e4d93f 701 .xpo_secure_port = svc_sock_secure_port,
360d8738
TT
702};
703
704static struct svc_xprt_class svc_udp_class = {
705 .xcl_name = "udp",
b700cbb1 706 .xcl_owner = THIS_MODULE,
360d8738 707 .xcl_ops = &svc_udp_ops,
49023155 708 .xcl_max_payload = RPCSVC_MAXPAYLOAD_UDP,
3c45ddf8 709 .xcl_ident = XPRT_TRANSPORT_UDP,
360d8738
TT
710};
711
bb5cf160 712static void svc_udp_init(struct svc_sock *svsk, struct svc_serv *serv)
1da177e4 713{
7702ce40 714 int err, level, optname, one = 1;
7a37f578 715
bd4620dd
SK
716 svc_xprt_init(sock_net(svsk->sk_sock->sk), &svc_udp_class,
717 &svsk->sk_xprt, serv);
def13d74 718 clear_bit(XPT_CACHE_AUTH, &svsk->sk_xprt.xpt_flags);
fa9251af 719 svsk->sk_sk->sk_data_ready = svc_data_ready;
1da177e4 720 svsk->sk_sk->sk_write_space = svc_write_space;
1da177e4
LT
721
722 /* initialise setting must have enough space to
cca5172a 723 * receive and respond to one request.
1da177e4
LT
724 * svc_udp_recvfrom will re-adjust if necessary
725 */
726 svc_sock_setbufsize(svsk->sk_sock,
bb5cf160
TT
727 3 * svsk->sk_xprt.xpt_server->sv_max_mesg,
728 3 * svsk->sk_xprt.xpt_server->sv_max_mesg);
1da177e4 729
0f0257ea
TT
730 /* data might have come in before data_ready set up */
731 set_bit(XPT_DATA, &svsk->sk_xprt.xpt_flags);
02fc6c36 732 set_bit(XPT_CHNGBUF, &svsk->sk_xprt.xpt_flags);
7a37f578 733
7a37f578 734 /* make sure we get destination address info */
7702ce40
CL
735 switch (svsk->sk_sk->sk_family) {
736 case AF_INET:
737 level = SOL_IP;
738 optname = IP_PKTINFO;
739 break;
740 case AF_INET6:
741 level = SOL_IPV6;
742 optname = IPV6_RECVPKTINFO;
743 break;
744 default:
745 BUG();
746 }
747 err = kernel_setsockopt(svsk->sk_sock, level, optname,
748 (char *)&one, sizeof(one));
749 dprintk("svc: kernel_setsockopt returned %d\n", err);
1da177e4
LT
750}
751
752/*
753 * A data_ready event on a listening socket means there's a connection
754 * pending. Do not use state_change as a substitute for it.
755 */
676d2369 756static void svc_tcp_listen_data_ready(struct sock *sk)
1da177e4 757{
939bb7ef 758 struct svc_sock *svsk = (struct svc_sock *)sk->sk_user_data;
1da177e4
LT
759
760 dprintk("svc: socket %p TCP (listen) state change %d\n",
939bb7ef 761 sk, sk->sk_state);
1da177e4 762
fa9251af
TM
763 if (svsk)
764 svsk->sk_odata(sk);
939bb7ef
NB
765 /*
766 * This callback may called twice when a new connection
767 * is established as a child socket inherits everything
768 * from a parent LISTEN socket.
769 * 1) data_ready method of the parent socket will be called
770 * when one of child sockets become ESTABLISHED.
771 * 2) data_ready method of the child socket may be called
772 * when it receives data before the socket is accepted.
773 * In case of 2, we should ignore it silently.
774 */
775 if (sk->sk_state == TCP_LISTEN) {
776 if (svsk) {
02fc6c36 777 set_bit(XPT_CONN, &svsk->sk_xprt.xpt_flags);
f6150c3c 778 svc_xprt_enqueue(&svsk->sk_xprt);
939bb7ef
NB
779 } else
780 printk("svc: socket %p: no user data\n", sk);
1da177e4 781 }
1da177e4
LT
782}
783
784/*
785 * A state change on a connected socket means it's dying or dead.
786 */
0f0257ea 787static void svc_tcp_state_change(struct sock *sk)
1da177e4 788{
939bb7ef 789 struct svc_sock *svsk = (struct svc_sock *)sk->sk_user_data;
1da177e4
LT
790
791 dprintk("svc: socket %p TCP (connected) state change %d (svsk %p)\n",
939bb7ef 792 sk, sk->sk_state, sk->sk_user_data);
1da177e4 793
939bb7ef 794 if (!svsk)
1da177e4 795 printk("svc: socket %p: no user data\n", sk);
939bb7ef 796 else {
fa9251af 797 svsk->sk_ostate(sk);
02fc6c36 798 set_bit(XPT_CLOSE, &svsk->sk_xprt.xpt_flags);
f6150c3c 799 svc_xprt_enqueue(&svsk->sk_xprt);
1da177e4 800 }
1da177e4
LT
801}
802
803/*
804 * Accept a TCP connection
805 */
38a417cc 806static struct svc_xprt *svc_tcp_accept(struct svc_xprt *xprt)
1da177e4 807{
38a417cc 808 struct svc_sock *svsk = container_of(xprt, struct svc_sock, sk_xprt);
cdd88b9f 809 struct sockaddr_storage addr;
810 struct sockaddr *sin = (struct sockaddr *) &addr;
bb5cf160 811 struct svc_serv *serv = svsk->sk_xprt.xpt_server;
1da177e4
LT
812 struct socket *sock = svsk->sk_sock;
813 struct socket *newsock;
1da177e4
LT
814 struct svc_sock *newsvsk;
815 int err, slen;
5216a8e7 816 RPC_IFDEBUG(char buf[RPC_MAX_ADDRBUFLEN]);
1da177e4
LT
817
818 dprintk("svc: tcp_accept %p sock %p\n", svsk, sock);
819 if (!sock)
38a417cc 820 return NULL;
1da177e4 821
02fc6c36 822 clear_bit(XPT_CONN, &svsk->sk_xprt.xpt_flags);
e6242e92
SS
823 err = kernel_accept(sock, &newsock, O_NONBLOCK);
824 if (err < 0) {
1da177e4
LT
825 if (err == -ENOMEM)
826 printk(KERN_WARNING "%s: no more sockets!\n",
827 serv->sv_name);
e87cc472
JP
828 else if (err != -EAGAIN)
829 net_warn_ratelimited("%s: accept failed (err %d)!\n",
830 serv->sv_name, -err);
38a417cc 831 return NULL;
1da177e4 832 }
02fc6c36 833 set_bit(XPT_CONN, &svsk->sk_xprt.xpt_flags);
1da177e4 834
cdd88b9f 835 err = kernel_getpeername(newsock, sin, &slen);
1da177e4 836 if (err < 0) {
e87cc472
JP
837 net_warn_ratelimited("%s: peername failed (err %d)!\n",
838 serv->sv_name, -err);
1da177e4
LT
839 goto failed; /* aborted connection or whatever */
840 }
841
842 /* Ideally, we would want to reject connections from unauthorized
ad06e4bd
CL
843 * hosts here, but when we get encryption, the IP of the host won't
844 * tell us anything. For now just warn about unpriv connections.
1da177e4 845 */
cdd88b9f 846 if (!svc_port_is_privileged(sin)) {
a48fd0f9 847 dprintk("%s: connect from unprivileged port: %s\n",
cca5172a 848 serv->sv_name,
cdd88b9f 849 __svc_print_addr(sin, buf, sizeof(buf)));
1da177e4 850 }
ad06e4bd 851 dprintk("%s: connect from %s\n", serv->sv_name,
cdd88b9f 852 __svc_print_addr(sin, buf, sizeof(buf)));
1da177e4 853
fa9251af
TM
854 /* Reset the inherited callbacks before calling svc_setup_socket */
855 newsock->sk->sk_state_change = svsk->sk_ostate;
856 newsock->sk->sk_data_ready = svsk->sk_odata;
857 newsock->sk->sk_write_space = svsk->sk_owspace;
858
1da177e4
LT
859 /* make sure that a write doesn't block forever when
860 * low on memory
861 */
862 newsock->sk->sk_sndtimeo = HZ*30;
863
72c35376
BF
864 newsvsk = svc_setup_socket(serv, newsock,
865 (SVC_SOCK_ANONYMOUS | SVC_SOCK_TEMPORARY));
866 if (IS_ERR(newsvsk))
1da177e4 867 goto failed;
9dbc240f 868 svc_xprt_set_remote(&newsvsk->sk_xprt, sin, slen);
a9747692
FM
869 err = kernel_getsockname(newsock, sin, &slen);
870 if (unlikely(err < 0)) {
871 dprintk("svc_tcp_accept: kernel_getsockname error %d\n", -err);
872 slen = offsetof(struct sockaddr, sa_data);
873 }
9dbc240f 874 svc_xprt_set_local(&newsvsk->sk_xprt, sin, slen);
067d7817 875
ef11ce24
N
876 if (sock_is_loopback(newsock->sk))
877 set_bit(XPT_LOCAL, &newsvsk->sk_xprt.xpt_flags);
878 else
879 clear_bit(XPT_LOCAL, &newsvsk->sk_xprt.xpt_flags);
f9f3cc4f
TT
880 if (serv->sv_stats)
881 serv->sv_stats->nettcpconn++;
882
883 return &newsvsk->sk_xprt;
884
885failed:
886 sock_release(newsock);
887 return NULL;
888}
889
31d68ef6
BF
890static unsigned int svc_tcp_restore_pages(struct svc_sock *svsk, struct svc_rqst *rqstp)
891{
892 unsigned int i, len, npages;
893
8af345f5 894 if (svsk->sk_datalen == 0)
31d68ef6 895 return 0;
8af345f5 896 len = svsk->sk_datalen;
31d68ef6
BF
897 npages = (len + PAGE_SIZE - 1) >> PAGE_SHIFT;
898 for (i = 0; i < npages; i++) {
899 if (rqstp->rq_pages[i] != NULL)
900 put_page(rqstp->rq_pages[i]);
901 BUG_ON(svsk->sk_pages[i] == NULL);
902 rqstp->rq_pages[i] = svsk->sk_pages[i];
903 svsk->sk_pages[i] = NULL;
904 }
905 rqstp->rq_arg.head[0].iov_base = page_address(rqstp->rq_pages[0]);
906 return len;
907}
908
909static void svc_tcp_save_pages(struct svc_sock *svsk, struct svc_rqst *rqstp)
910{
911 unsigned int i, len, npages;
912
8af345f5 913 if (svsk->sk_datalen == 0)
31d68ef6 914 return;
8af345f5 915 len = svsk->sk_datalen;
31d68ef6
BF
916 npages = (len + PAGE_SIZE - 1) >> PAGE_SHIFT;
917 for (i = 0; i < npages; i++) {
918 svsk->sk_pages[i] = rqstp->rq_pages[i];
919 rqstp->rq_pages[i] = NULL;
920 }
921}
922
923static void svc_tcp_clear_pages(struct svc_sock *svsk)
924{
925 unsigned int i, len, npages;
926
8af345f5 927 if (svsk->sk_datalen == 0)
31d68ef6 928 goto out;
8af345f5 929 len = svsk->sk_datalen;
31d68ef6
BF
930 npages = (len + PAGE_SIZE - 1) >> PAGE_SHIFT;
931 for (i = 0; i < npages; i++) {
cf3aa02c
BF
932 if (svsk->sk_pages[i] == NULL) {
933 WARN_ON_ONCE(1);
934 continue;
935 }
31d68ef6
BF
936 put_page(svsk->sk_pages[i]);
937 svsk->sk_pages[i] = NULL;
938 }
939out:
940 svsk->sk_tcplen = 0;
8af345f5 941 svsk->sk_datalen = 0;
31d68ef6
BF
942}
943
1da177e4 944/*
ad46ccf0 945 * Receive fragment record header.
8f55f3c0 946 * If we haven't gotten the record length yet, get the next four bytes.
1da177e4 947 */
8f55f3c0 948static int svc_tcp_recv_record(struct svc_sock *svsk, struct svc_rqst *rqstp)
1da177e4 949{
bb5cf160 950 struct svc_serv *serv = svsk->sk_xprt.xpt_server;
5ee78d48 951 unsigned int want;
8f55f3c0 952 int len;
1da177e4 953
c0401ea0 954 if (svsk->sk_tcplen < sizeof(rpc_fraghdr)) {
1da177e4
LT
955 struct kvec iov;
956
5ee78d48 957 want = sizeof(rpc_fraghdr) - svsk->sk_tcplen;
1da177e4
LT
958 iov.iov_base = ((char *) &svsk->sk_reclen) + svsk->sk_tcplen;
959 iov.iov_len = want;
960 if ((len = svc_recvfrom(rqstp, &iov, 1, want)) < 0)
961 goto error;
962 svsk->sk_tcplen += len;
963
964 if (len < want) {
c0401ea0
CL
965 dprintk("svc: short recvfrom while reading record "
966 "length (%d of %d)\n", len, want);
31d68ef6 967 return -EAGAIN;
1da177e4
LT
968 }
969
cc248d4b 970 dprintk("svc: TCP record, %d bytes\n", svc_sock_reclen(svsk));
836fbadb
BF
971 if (svc_sock_reclen(svsk) + svsk->sk_datalen >
972 serv->sv_max_mesg) {
3a28e331
BF
973 net_notice_ratelimited("RPC: fragment too large: %d\n",
974 svc_sock_reclen(svsk));
1da177e4
LT
975 goto err_delete;
976 }
977 }
978
cc248d4b 979 return svc_sock_reclen(svsk);
31d68ef6
BF
980error:
981 dprintk("RPC: TCP recv_record got %d\n", len);
8f55f3c0 982 return len;
31d68ef6 983err_delete:
8f55f3c0 984 set_bit(XPT_CLOSE, &svsk->sk_xprt.xpt_flags);
8f55f3c0
AB
985 return -EAGAIN;
986}
987
586c52cc 988static int receive_cb_reply(struct svc_sock *svsk, struct svc_rqst *rqstp)
4cfc7e60 989{
586c52cc 990 struct rpc_xprt *bc_xprt = svsk->sk_xprt.xpt_bc_xprt;
4cfc7e60 991 struct rpc_rqst *req = NULL;
586c52cc
TM
992 struct kvec *src, *dst;
993 __be32 *p = (__be32 *)rqstp->rq_arg.head[0].iov_base;
48e6555c
BF
994 __be32 xid;
995 __be32 calldir;
4cfc7e60 996
4cfc7e60
RI
997 xid = *p++;
998 calldir = *p;
999
093a1468 1000 if (!bc_xprt)
586c52cc 1001 return -EAGAIN;
093a1468
TM
1002 spin_lock_bh(&bc_xprt->transport_lock);
1003 req = xprt_lookup_rqst(bc_xprt, xid);
1004 if (!req)
1005 goto unlock_notfound;
586c52cc
TM
1006
1007 memcpy(&req->rq_private_buf, &req->rq_rcv_buf, sizeof(struct xdr_buf));
1008 /*
1009 * XXX!: cheating for now! Only copying HEAD.
1010 * But we know this is good enough for now (in fact, for any
1011 * callback reply in the forseeable future).
1012 */
1013 dst = &req->rq_private_buf.head[0];
1014 src = &rqstp->rq_arg.head[0];
1015 if (dst->iov_len < src->iov_len)
093a1468 1016 goto unlock_eagain; /* whatever; just giving up. */
586c52cc 1017 memcpy(dst->iov_base, src->iov_base, src->iov_len);
cc248d4b 1018 xprt_complete_rqst(req->rq_task, rqstp->rq_arg.len);
586c52cc 1019 rqstp->rq_arg.len = 0;
093a1468 1020 spin_unlock_bh(&bc_xprt->transport_lock);
586c52cc 1021 return 0;
093a1468
TM
1022unlock_notfound:
1023 printk(KERN_NOTICE
1024 "%s: Got unrecognized reply: "
1025 "calldir 0x%x xpt_bc_xprt %p xid %08x\n",
1026 __func__, ntohl(calldir),
1027 bc_xprt, ntohl(xid));
1028unlock_eagain:
1029 spin_unlock_bh(&bc_xprt->transport_lock);
1030 return -EAGAIN;
586c52cc
TM
1031}
1032
1033static int copy_pages_to_kvecs(struct kvec *vec, struct page **pages, int len)
1034{
1035 int i = 0;
1036 int t = 0;
1037
1038 while (t < len) {
1039 vec[i].iov_base = page_address(pages[i]);
1040 vec[i].iov_len = PAGE_SIZE;
1041 i++;
1042 t += PAGE_SIZE;
1043 }
1044 return i;
4cfc7e60
RI
1045}
1046
836fbadb
BF
1047static void svc_tcp_fragment_received(struct svc_sock *svsk)
1048{
1049 /* If we have more data, signal svc_xprt_enqueue() to try again */
836fbadb
BF
1050 dprintk("svc: TCP %s record (%d bytes)\n",
1051 svc_sock_final_rec(svsk) ? "final" : "nonfinal",
1052 svc_sock_reclen(svsk));
1053 svsk->sk_tcplen = 0;
1054 svsk->sk_reclen = 0;
1055}
31d68ef6 1056
8f55f3c0
AB
1057/*
1058 * Receive data from a TCP socket.
1059 */
1060static int svc_tcp_recvfrom(struct svc_rqst *rqstp)
1061{
1062 struct svc_sock *svsk =
1063 container_of(rqstp->rq_xprt, struct svc_sock, sk_xprt);
1064 struct svc_serv *serv = svsk->sk_xprt.xpt_server;
1065 int len;
1066 struct kvec *vec;
31d68ef6 1067 unsigned int want, base;
586c52cc
TM
1068 __be32 *p;
1069 __be32 calldir;
5ee78d48 1070 int pnum;
8f55f3c0
AB
1071
1072 dprintk("svc: tcp_recv %p data %d conn %d close %d\n",
1073 svsk, test_bit(XPT_DATA, &svsk->sk_xprt.xpt_flags),
1074 test_bit(XPT_CONN, &svsk->sk_xprt.xpt_flags),
1075 test_bit(XPT_CLOSE, &svsk->sk_xprt.xpt_flags));
1076
1077 len = svc_tcp_recv_record(svsk, rqstp);
1078 if (len < 0)
1079 goto error;
1080
31d68ef6 1081 base = svc_tcp_restore_pages(svsk, rqstp);
836fbadb 1082 want = svc_sock_reclen(svsk) - (svsk->sk_tcplen - sizeof(rpc_fraghdr));
31d68ef6 1083
3cc03b16 1084 vec = rqstp->rq_vec;
4cfc7e60 1085
586c52cc 1086 pnum = copy_pages_to_kvecs(&vec[0], &rqstp->rq_pages[0],
836fbadb 1087 svsk->sk_datalen + want);
586c52cc 1088
44524359 1089 rqstp->rq_respages = &rqstp->rq_pages[pnum];
afc59400 1090 rqstp->rq_next_page = rqstp->rq_respages + 1;
1da177e4
LT
1091
1092 /* Now receive data */
31d68ef6 1093 len = svc_partial_recvfrom(rqstp, vec, pnum, want, base);
8af345f5 1094 if (len >= 0) {
31d68ef6 1095 svsk->sk_tcplen += len;
8af345f5
BF
1096 svsk->sk_datalen += len;
1097 }
836fbadb 1098 if (len != want || !svc_sock_final_rec(svsk)) {
be1e4444 1099 svc_tcp_save_pages(svsk, rqstp);
31d68ef6 1100 if (len < 0 && len != -EAGAIN)
ad46ccf0 1101 goto err_delete;
836fbadb
BF
1102 if (len == want)
1103 svc_tcp_fragment_received(svsk);
1104 else
3a28e331
BF
1105 dprintk("svc: incomplete TCP record (%d of %d)\n",
1106 (int)(svsk->sk_tcplen - sizeof(rpc_fraghdr)),
836fbadb 1107 svc_sock_reclen(svsk));
31d68ef6
BF
1108 goto err_noclose;
1109 }
1da177e4 1110
1f691b07 1111 if (svsk->sk_datalen < 8) {
cf3aa02c 1112 svsk->sk_datalen = 0;
ad46ccf0 1113 goto err_delete; /* client is nuts. */
cf3aa02c 1114 }
ad46ccf0 1115
836fbadb 1116 rqstp->rq_arg.len = svsk->sk_datalen;
1da177e4 1117 rqstp->rq_arg.page_base = 0;
5ee78d48
TM
1118 if (rqstp->rq_arg.len <= rqstp->rq_arg.head[0].iov_len) {
1119 rqstp->rq_arg.head[0].iov_len = rqstp->rq_arg.len;
1da177e4 1120 rqstp->rq_arg.page_len = 0;
5ee78d48
TM
1121 } else
1122 rqstp->rq_arg.page_len = rqstp->rq_arg.len - rqstp->rq_arg.head[0].iov_len;
1da177e4 1123
5148bf4e 1124 rqstp->rq_xprt_ctxt = NULL;
1da177e4 1125 rqstp->rq_prot = IPPROTO_TCP;
7501cc2b
JL
1126 if (test_bit(XPT_LOCAL, &svsk->sk_xprt.xpt_flags))
1127 set_bit(RQ_LOCAL, &rqstp->rq_flags);
1128 else
1129 clear_bit(RQ_LOCAL, &rqstp->rq_flags);
1da177e4 1130
586c52cc
TM
1131 p = (__be32 *)rqstp->rq_arg.head[0].iov_base;
1132 calldir = p[1];
8985ef0b 1133 if (calldir)
586c52cc 1134 len = receive_cb_reply(svsk, rqstp);
586c52cc 1135
1da177e4 1136 /* Reset TCP read info */
8af345f5 1137 svsk->sk_datalen = 0;
836fbadb 1138 svc_tcp_fragment_received(svsk);
0601f793 1139
8985ef0b
BF
1140 if (len < 0)
1141 goto error;
1da177e4 1142
9dbc240f 1143 svc_xprt_copy_addrs(rqstp, &svsk->sk_xprt);
1da177e4
LT
1144 if (serv->sv_stats)
1145 serv->sv_stats->nettcpcnt++;
1146
5ee78d48 1147 return rqstp->rq_arg.len;
1da177e4 1148
8f55f3c0 1149error:
31d68ef6 1150 if (len != -EAGAIN)
ad46ccf0 1151 goto err_delete;
31d68ef6 1152 dprintk("RPC: TCP recvfrom got EAGAIN\n");
9f9d2ebe 1153 return 0;
ad46ccf0 1154err_delete:
31d68ef6
BF
1155 printk(KERN_NOTICE "%s: recvfrom returned errno %d\n",
1156 svsk->sk_xprt.xpt_server->sv_name, -len);
1157 set_bit(XPT_CLOSE, &svsk->sk_xprt.xpt_flags);
1158err_noclose:
9f9d2ebe 1159 return 0; /* record not complete */
1da177e4
LT
1160}
1161
1162/*
1163 * Send out data on TCP socket.
1164 */
0f0257ea 1165static int svc_tcp_sendto(struct svc_rqst *rqstp)
1da177e4
LT
1166{
1167 struct xdr_buf *xbufp = &rqstp->rq_res;
1168 int sent;
d8ed029d 1169 __be32 reclen;
1da177e4
LT
1170
1171 /* Set up the first element of the reply kvec.
1172 * Any other kvecs that may be in use have been taken
1173 * care of by the server implementation itself.
1174 */
1175 reclen = htonl(0x80000000|((xbufp->len ) - 4));
1176 memcpy(xbufp->head[0].iov_base, &reclen, 4);
1177
1da177e4
LT
1178 sent = svc_sendto(rqstp, &rqstp->rq_res);
1179 if (sent != xbufp->len) {
0f0257ea
TT
1180 printk(KERN_NOTICE
1181 "rpc-srv/tcp: %s: %s %d when sending %d bytes "
1182 "- shutting down socket\n",
57b1d3ba 1183 rqstp->rq_xprt->xpt_server->sv_name,
1da177e4
LT
1184 (sent<0)?"got error":"sent only",
1185 sent, xbufp->len);
57b1d3ba 1186 set_bit(XPT_CLOSE, &rqstp->rq_xprt->xpt_flags);
f6150c3c 1187 svc_xprt_enqueue(rqstp->rq_xprt);
1da177e4
LT
1188 sent = -EAGAIN;
1189 }
1190 return sent;
1191}
1192
e831fe65
TT
1193/*
1194 * Setup response header. TCP has a 4B record length field.
1195 */
1196static void svc_tcp_prep_reply_hdr(struct svc_rqst *rqstp)
1197{
1198 struct kvec *resv = &rqstp->rq_res.head[0];
1199
1200 /* tcp needs a space for the record length... */
1201 svc_putnl(resv, 0);
1202}
1203
b700cbb1 1204static struct svc_xprt *svc_tcp_create(struct svc_serv *serv,
62832c03 1205 struct net *net,
b700cbb1
TT
1206 struct sockaddr *sa, int salen,
1207 int flags)
1208{
62832c03 1209 return svc_create_socket(serv, IPPROTO_TCP, net, sa, salen, flags);
b700cbb1
TT
1210}
1211
#ifdef CONFIG_SUNRPC_BACKCHANNEL
static struct svc_xprt *svc_bc_create_socket(struct svc_serv *, int,
					     struct net *, struct sockaddr *,
					     int, int);
static void svc_bc_sock_free(struct svc_xprt *xprt);

/* Create a backchannel transport; only IPPROTO_TCP is requested. */
static struct svc_xprt *svc_bc_tcp_create(struct svc_serv *serv,
					  struct net *net,
					  struct sockaddr *sa, int salen,
					  int flags)
{
	return svc_bc_create_socket(serv, IPPROTO_TCP, net, sa, salen, flags);
}

/* Intentionally empty: nothing is done on detach for "tcp-bc". */
static void svc_bc_tcp_sock_detach(struct svc_xprt *xprt)
{
}

/* Transport methods for the "tcp-bc" class. */
static struct svc_xprt_ops svc_tcp_bc_ops = {
	.xpo_create		= svc_bc_tcp_create,
	.xpo_detach		= svc_bc_tcp_sock_detach,
	.xpo_free		= svc_bc_sock_free,
	.xpo_prep_reply_hdr	= svc_tcp_prep_reply_hdr,
	.xpo_secure_port	= svc_sock_secure_port,
};

static struct svc_xprt_class svc_tcp_bc_class = {
	.xcl_name		= "tcp-bc",
	.xcl_owner		= THIS_MODULE,
	.xcl_ops		= &svc_tcp_bc_ops,
	.xcl_max_payload	= RPCSVC_MAXPAYLOAD_TCP,
};

/* Register the backchannel transport class. */
static void svc_init_bc_xprt_sock(void)
{
	svc_reg_xprt_class(&svc_tcp_bc_class);
}

/* Unregister the backchannel transport class. */
static void svc_cleanup_bc_xprt_sock(void)
{
	svc_unreg_xprt_class(&svc_tcp_bc_class);
}
#else /* !CONFIG_SUNRPC_BACKCHANNEL */
/* Without backchannel support there is nothing to register. */
static void svc_init_bc_xprt_sock(void)
{
}

static void svc_cleanup_bc_xprt_sock(void)
{
}
#endif /* CONFIG_SUNRPC_BACKCHANNEL */
1f11a034 1263
360d8738 1264static struct svc_xprt_ops svc_tcp_ops = {
b700cbb1 1265 .xpo_create = svc_tcp_create,
5d137990
TT
1266 .xpo_recvfrom = svc_tcp_recvfrom,
1267 .xpo_sendto = svc_tcp_sendto,
5148bf4e 1268 .xpo_release_rqst = svc_release_skb,
69b6ba37 1269 .xpo_detach = svc_tcp_sock_detach,
755cceab 1270 .xpo_free = svc_sock_free,
e831fe65 1271 .xpo_prep_reply_hdr = svc_tcp_prep_reply_hdr,
323bee32 1272 .xpo_has_wspace = svc_tcp_has_wspace,
38a417cc 1273 .xpo_accept = svc_tcp_accept,
16e4d93f 1274 .xpo_secure_port = svc_sock_secure_port,
51877680 1275 .xpo_adjust_wspace = svc_tcp_adjust_wspace,
360d8738
TT
1276};
1277
1278static struct svc_xprt_class svc_tcp_class = {
1279 .xcl_name = "tcp",
b700cbb1 1280 .xcl_owner = THIS_MODULE,
360d8738 1281 .xcl_ops = &svc_tcp_ops,
49023155 1282 .xcl_max_payload = RPCSVC_MAXPAYLOAD_TCP,
3c45ddf8 1283 .xcl_ident = XPRT_TRANSPORT_TCP,
360d8738
TT
1284};
1285
1286void svc_init_xprt_sock(void)
1287{
1288 svc_reg_xprt_class(&svc_tcp_class);
1289 svc_reg_xprt_class(&svc_udp_class);
16b2d1e1 1290 svc_init_bc_xprt_sock();
360d8738
TT
1291}
1292
1293void svc_cleanup_xprt_sock(void)
1294{
1295 svc_unreg_xprt_class(&svc_tcp_class);
1296 svc_unreg_xprt_class(&svc_udp_class);
16b2d1e1 1297 svc_cleanup_bc_xprt_sock();
360d8738
TT
1298}
1299
bb5cf160 1300static void svc_tcp_init(struct svc_sock *svsk, struct svc_serv *serv)
1da177e4
LT
1301{
1302 struct sock *sk = svsk->sk_sk;
1da177e4 1303
bd4620dd
SK
1304 svc_xprt_init(sock_net(svsk->sk_sock->sk), &svc_tcp_class,
1305 &svsk->sk_xprt, serv);
def13d74 1306 set_bit(XPT_CACHE_AUTH, &svsk->sk_xprt.xpt_flags);
1da177e4
LT
1307 if (sk->sk_state == TCP_LISTEN) {
1308 dprintk("setting up TCP socket for listening\n");
02fc6c36 1309 set_bit(XPT_LISTENER, &svsk->sk_xprt.xpt_flags);
1da177e4 1310 sk->sk_data_ready = svc_tcp_listen_data_ready;
02fc6c36 1311 set_bit(XPT_CONN, &svsk->sk_xprt.xpt_flags);
1da177e4
LT
1312 } else {
1313 dprintk("setting up TCP socket for reading\n");
1314 sk->sk_state_change = svc_tcp_state_change;
fa9251af 1315 sk->sk_data_ready = svc_data_ready;
47fcb03f 1316 sk->sk_write_space = svc_tcp_write_space;
1da177e4
LT
1317
1318 svsk->sk_reclen = 0;
1319 svsk->sk_tcplen = 0;
8af345f5 1320 svsk->sk_datalen = 0;
31d68ef6 1321 memset(&svsk->sk_pages[0], 0, sizeof(svsk->sk_pages));
1da177e4 1322
b7872fe8 1323 tcp_sk(sk)->nonagle |= TCP_NAGLE_OFF;
1da177e4 1324
02fc6c36 1325 set_bit(XPT_DATA, &svsk->sk_xprt.xpt_flags);
cca5172a 1326 if (sk->sk_state != TCP_ESTABLISHED)
02fc6c36 1327 set_bit(XPT_CLOSE, &svsk->sk_xprt.xpt_flags);
1da177e4
LT
1328 }
1329}
1330
0f0257ea 1331void svc_sock_update_bufs(struct svc_serv *serv)
1da177e4
LT
1332{
1333 /*
1334 * The number of server threads has changed. Update
1335 * rcvbuf and sndbuf accordingly on all sockets
1336 */
8f3a6de3 1337 struct svc_sock *svsk;
1da177e4
LT
1338
1339 spin_lock_bh(&serv->sv_lock);
8f3a6de3 1340 list_for_each_entry(svsk, &serv->sv_permsocks, sk_xprt.xpt_list)
02fc6c36 1341 set_bit(XPT_CHNGBUF, &svsk->sk_xprt.xpt_flags);
1da177e4
LT
1342 spin_unlock_bh(&serv->sv_lock);
1343}
24c3767e 1344EXPORT_SYMBOL_GPL(svc_sock_update_bufs);
1da177e4 1345
1da177e4
LT
1346/*
1347 * Initialize socket for RPC use and create svc_sock struct
1da177e4 1348 */
6b174337
CL
1349static struct svc_sock *svc_setup_socket(struct svc_serv *serv,
1350 struct socket *sock,
72c35376 1351 int flags)
1da177e4
LT
1352{
1353 struct svc_sock *svsk;
1354 struct sock *inet;
6b174337 1355 int pmap_register = !(flags & SVC_SOCK_ANONYMOUS);
72c35376 1356 int err = 0;
1da177e4
LT
1357
1358 dprintk("svc: svc_setup_socket %p\n", sock);
72c35376
BF
1359 svsk = kzalloc(sizeof(*svsk), GFP_KERNEL);
1360 if (!svsk)
1361 return ERR_PTR(-ENOMEM);
1da177e4
LT
1362
1363 inet = sock->sk;
1364
1365 /* Register socket with portmapper */
72c35376
BF
1366 if (pmap_register)
1367 err = svc_register(serv, sock_net(sock->sk), inet->sk_family,
5247fab5 1368 inet->sk_protocol,
c720c7e8 1369 ntohs(inet_sk(inet)->inet_sport));
1da177e4 1370
72c35376 1371 if (err < 0) {
1da177e4 1372 kfree(svsk);
72c35376 1373 return ERR_PTR(err);
1da177e4
LT
1374 }
1375
1da177e4
LT
1376 inet->sk_user_data = svsk;
1377 svsk->sk_sock = sock;
1378 svsk->sk_sk = inet;
1379 svsk->sk_ostate = inet->sk_state_change;
1380 svsk->sk_odata = inet->sk_data_ready;
1381 svsk->sk_owspace = inet->sk_write_space;
1da177e4
LT
1382
1383 /* Initialize the socket */
1384 if (sock->type == SOCK_DGRAM)
bb5cf160 1385 svc_udp_init(svsk, serv);
96604398
OK
1386 else {
1387 /* initialise setting must have enough space to
1388 * receive and respond to one request.
1389 */
1390 svc_sock_setbufsize(svsk->sk_sock, 4 * serv->sv_max_mesg,
1391 4 * serv->sv_max_mesg);
bb5cf160 1392 svc_tcp_init(svsk, serv);
96604398 1393 }
1da177e4 1394
1da177e4
LT
1395 dprintk("svc: svc_setup_socket created %p (inet %p)\n",
1396 svsk, svsk->sk_sk);
1397
1da177e4
LT
1398 return svsk;
1399}
1400
30646394
SK
1401bool svc_alien_sock(struct net *net, int fd)
1402{
1403 int err;
1404 struct socket *sock = sockfd_lookup(fd, &err);
1405 bool ret = false;
1406
1407 if (!sock)
1408 goto out;
1409 if (sock_net(sock->sk) != net)
1410 ret = true;
1411 sockfd_put(sock);
1412out:
1413 return ret;
1414}
1415EXPORT_SYMBOL_GPL(svc_alien_sock);
1416
bfba9ab4
CL
1417/**
1418 * svc_addsock - add a listener socket to an RPC service
1419 * @serv: pointer to RPC service to which to add a new listener
1420 * @fd: file descriptor of the new listener
1421 * @name_return: pointer to buffer to fill in with name of listener
1422 * @len: size of the buffer
1423 *
1424 * Fills in socket name and returns positive length of name if successful.
1425 * Name is terminated with '\n'. On error, returns a negative errno
1426 * value.
1427 */
1428int svc_addsock(struct svc_serv *serv, const int fd, char *name_return,
1429 const size_t len)
b41b66d6
N
1430{
1431 int err = 0;
1432 struct socket *so = sockfd_lookup(fd, &err);
1433 struct svc_sock *svsk = NULL;
a8e10078
BF
1434 struct sockaddr_storage addr;
1435 struct sockaddr *sin = (struct sockaddr *)&addr;
1436 int salen;
b41b66d6
N
1437
1438 if (!so)
1439 return err;
a8e10078 1440 err = -EAFNOSUPPORT;
205ba423 1441 if ((so->sk->sk_family != PF_INET) && (so->sk->sk_family != PF_INET6))
a8e10078
BF
1442 goto out;
1443 err = -EPROTONOSUPPORT;
1444 if (so->sk->sk_protocol != IPPROTO_TCP &&
b41b66d6 1445 so->sk->sk_protocol != IPPROTO_UDP)
a8e10078
BF
1446 goto out;
1447 err = -EISCONN;
1448 if (so->state > SS_UNCONNECTED)
1449 goto out;
1450 err = -ENOENT;
1451 if (!try_module_get(THIS_MODULE))
1452 goto out;
1453 svsk = svc_setup_socket(serv, so, SVC_SOCK_DEFAULTS);
1454 if (IS_ERR(svsk)) {
1455 module_put(THIS_MODULE);
1456 err = PTR_ERR(svsk);
1457 goto out;
b41b66d6 1458 }
a8e10078
BF
1459 if (kernel_getsockname(svsk->sk_sock, sin, &salen) == 0)
1460 svc_xprt_set_local(&svsk->sk_xprt, sin, salen);
39b55301 1461 svc_add_new_perm_xprt(serv, &svsk->sk_xprt);
e7942b9f 1462 return svc_one_sock_name(svsk, name_return, len);
a8e10078
BF
1463out:
1464 sockfd_put(so);
1465 return err;
b41b66d6
N
1466}
1467EXPORT_SYMBOL_GPL(svc_addsock);
1468
1da177e4
LT
1469/*
1470 * Create socket for RPC service.
1471 */
b700cbb1
TT
1472static struct svc_xprt *svc_create_socket(struct svc_serv *serv,
1473 int protocol,
62832c03 1474 struct net *net,
b700cbb1
TT
1475 struct sockaddr *sin, int len,
1476 int flags)
1da177e4
LT
1477{
1478 struct svc_sock *svsk;
1479 struct socket *sock;
1480 int error;
1481 int type;
9dbc240f
TT
1482 struct sockaddr_storage addr;
1483 struct sockaddr *newsin = (struct sockaddr *)&addr;
1484 int newlen;
c69da774
TM
1485 int family;
1486 int val;
5216a8e7 1487 RPC_IFDEBUG(char buf[RPC_MAX_ADDRBUFLEN]);
1da177e4 1488
ad06e4bd
CL
1489 dprintk("svc: svc_create_socket(%s, %d, %s)\n",
1490 serv->sv_program->pg_name, protocol,
77f1f67a 1491 __svc_print_addr(sin, buf, sizeof(buf)));
1da177e4
LT
1492
1493 if (protocol != IPPROTO_UDP && protocol != IPPROTO_TCP) {
1494 printk(KERN_WARNING "svc: only UDP and TCP "
1495 "sockets supported\n");
b700cbb1 1496 return ERR_PTR(-EINVAL);
1da177e4 1497 }
c69da774 1498
1da177e4 1499 type = (protocol == IPPROTO_UDP)? SOCK_DGRAM : SOCK_STREAM;
c69da774
TM
1500 switch (sin->sa_family) {
1501 case AF_INET6:
1502 family = PF_INET6;
1503 break;
1504 case AF_INET:
1505 family = PF_INET;
1506 break;
1507 default:
1508 return ERR_PTR(-EINVAL);
1509 }
1da177e4 1510
14ec63c3 1511 error = __sock_create(net, family, type, protocol, &sock, 1);
77f1f67a 1512 if (error < 0)
b700cbb1 1513 return ERR_PTR(error);
1da177e4 1514
ed07536e
PZ
1515 svc_reclassify_socket(sock);
1516
c69da774
TM
1517 /*
1518 * If this is an PF_INET6 listener, we want to avoid
1519 * getting requests from IPv4 remotes. Those should
1520 * be shunted to a PF_INET listener via rpcbind.
1521 */
1522 val = 1;
1523 if (family == PF_INET6)
1524 kernel_setsockopt(sock, SOL_IPV6, IPV6_V6ONLY,
1525 (char *)&val, sizeof(val));
1526
18114746 1527 if (type == SOCK_STREAM)
4a17fd52 1528 sock->sk->sk_reuse = SK_CAN_REUSE; /* allow address reuse */
77f1f67a 1529 error = kernel_bind(sock, sin, len);
18114746
ES
1530 if (error < 0)
1531 goto bummer;
1da177e4 1532
9dbc240f
TT
1533 newlen = len;
1534 error = kernel_getsockname(sock, newsin, &newlen);
1535 if (error < 0)
1536 goto bummer;
1537
1da177e4 1538 if (protocol == IPPROTO_TCP) {
e6242e92 1539 if ((error = kernel_listen(sock, 64)) < 0)
1da177e4
LT
1540 goto bummer;
1541 }
1542
72c35376 1543 svsk = svc_setup_socket(serv, sock, flags);
a8e10078
BF
1544 if (IS_ERR(svsk)) {
1545 error = PTR_ERR(svsk);
1546 goto bummer;
e79eff1f 1547 }
a8e10078
BF
1548 svc_xprt_set_local(&svsk->sk_xprt, newsin, newlen);
1549 return (struct svc_xprt *)svsk;
1da177e4
LT
1550bummer:
1551 dprintk("svc: svc_create_socket error = %d\n", -error);
1552 sock_release(sock);
b700cbb1 1553 return ERR_PTR(error);
1da177e4
LT
1554}
1555
755cceab
TT
1556/*
1557 * Detach the svc_sock from the socket so that no
1558 * more callbacks occur.
1559 */
1560static void svc_sock_detach(struct svc_xprt *xprt)
1561{
1562 struct svc_sock *svsk = container_of(xprt, struct svc_sock, sk_xprt);
1563 struct sock *sk = svsk->sk_sk;
1564
1565 dprintk("svc: svc_sock_detach(%p)\n", svsk);
1566
1567 /* put back the old socket callbacks */
069c225b 1568 lock_sock(sk);
755cceab
TT
1569 sk->sk_state_change = svsk->sk_ostate;
1570 sk->sk_data_ready = svsk->sk_odata;
1571 sk->sk_write_space = svsk->sk_owspace;
069c225b
TM
1572 sk->sk_user_data = NULL;
1573 release_sock(sk);
69b6ba37
TM
1574}
1575
1576/*
1577 * Disconnect the socket, and reset the callbacks
1578 */
1579static void svc_tcp_sock_detach(struct svc_xprt *xprt)
1580{
1581 struct svc_sock *svsk = container_of(xprt, struct svc_sock, sk_xprt);
1582
1583 dprintk("svc: svc_tcp_sock_detach(%p)\n", svsk);
1584
1585 svc_sock_detach(xprt);
1586
31d68ef6
BF
1587 if (!test_bit(XPT_LISTENER, &xprt->xpt_flags)) {
1588 svc_tcp_clear_pages(svsk);
69b6ba37 1589 kernel_sock_shutdown(svsk->sk_sock, SHUT_RDWR);
31d68ef6 1590 }
755cceab
TT
1591}
1592
1593/*
1594 * Free the svc_sock's socket resources and the svc_sock itself.
1595 */
1596static void svc_sock_free(struct svc_xprt *xprt)
1597{
1598 struct svc_sock *svsk = container_of(xprt, struct svc_sock, sk_xprt);
1599 dprintk("svc: svc_sock_free(%p)\n", svsk);
1600
755cceab
TT
1601 if (svsk->sk_sock->file)
1602 sockfd_put(svsk->sk_sock);
1603 else
1604 sock_release(svsk->sk_sock);
1605 kfree(svsk);
1606}
7652e5a0 1607
9e00abc3 1608#if defined(CONFIG_SUNRPC_BACKCHANNEL)
7652e5a0 1609/*
1f11a034 1610 * Create a back channel svc_xprt which shares the fore channel socket.
7652e5a0 1611 */
1f11a034
AA
1612static struct svc_xprt *svc_bc_create_socket(struct svc_serv *serv,
1613 int protocol,
1614 struct net *net,
1615 struct sockaddr *sin, int len,
1616 int flags)
7652e5a0
BH
1617{
1618 struct svc_sock *svsk;
1f11a034
AA
1619 struct svc_xprt *xprt;
1620
1621 if (protocol != IPPROTO_TCP) {
1622 printk(KERN_WARNING "svc: only TCP sockets"
1623 " supported on shared back channel\n");
1624 return ERR_PTR(-EINVAL);
1625 }
7652e5a0 1626
7652e5a0
BH
1627 svsk = kzalloc(sizeof(*svsk), GFP_KERNEL);
1628 if (!svsk)
1f11a034 1629 return ERR_PTR(-ENOMEM);
7652e5a0
BH
1630
1631 xprt = &svsk->sk_xprt;
bd4620dd 1632 svc_xprt_init(net, &svc_tcp_bc_class, xprt, serv);
1f11a034 1633
4a19de0f 1634 serv->sv_bc_xprt = xprt;
1f11a034 1635
7652e5a0
BH
1636 return xprt;
1637}
7652e5a0
BH
1638
1639/*
1f11a034 1640 * Free a back channel svc_sock.
7652e5a0 1641 */
1f11a034 1642static void svc_bc_sock_free(struct svc_xprt *xprt)
7652e5a0 1643{
778be232 1644 if (xprt)
7652e5a0
BH
1645 kfree(container_of(xprt, struct svc_sock, sk_xprt));
1646}
9e00abc3 1647#endif /* CONFIG_SUNRPC_BACKCHANNEL */
This page took 0.820865 seconds and 5 git commands to generate.