defxx: Fix issues with debug printk calls
[deliverable/linux.git] / net / tipc / socket.c
CommitLineData
b97bf3fd 1/*
02c00c2a 2 * net/tipc/socket.c: TIPC socket API
c4307285 3 *
8826cde6 4 * Copyright (c) 2001-2007, 2012-2014, Ericsson AB
c5fa7b3c 5 * Copyright (c) 2004-2008, 2010-2013, Wind River Systems
b97bf3fd
PL
6 * All rights reserved.
7 *
9ea1fd3c 8 * Redistribution and use in source and binary forms, with or without
b97bf3fd
PL
9 * modification, are permitted provided that the following conditions are met:
10 *
9ea1fd3c
PL
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 3. Neither the names of the copyright holders nor the names of its
17 * contributors may be used to endorse or promote products derived from
18 * this software without specific prior written permission.
b97bf3fd 19 *
9ea1fd3c
PL
20 * Alternatively, this software may be distributed under the terms of the
21 * GNU General Public License ("GPL") version 2 as published by the Free
22 * Software Foundation.
23 *
24 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
25 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
26 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
27 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
28 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
29 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
30 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
31 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
32 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
33 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
b97bf3fd
PL
34 * POSSIBILITY OF SUCH DAMAGE.
35 */
36
b97bf3fd 37#include "core.h"
d265fef6 38#include "port.h"
e2dafe87 39#include "name_table.h"
78acb1f9 40#include "node.h"
e2dafe87 41#include "link.h"
2cf8aa19 42#include <linux/export.h>
8db1bae3 43#include "link.h"
2cf8aa19 44
b97bf3fd
PL
45#define SS_LISTENING -1 /* socket is listening */
46#define SS_READY -2 /* socket is connectionless */
47
3654ea02 48#define CONN_TIMEOUT_DEFAULT 8000 /* default connect timeout = 8s */
ac0074ee 49#define TIPC_FWD_MSG 1
b97bf3fd 50
4f4482dc 51static int tipc_backlog_rcv(struct sock *sk, struct sk_buff *skb);
676d2369 52static void tipc_data_ready(struct sock *sk);
f288bef4 53static void tipc_write_space(struct sock *sk);
247f0f3c
YX
54static int tipc_release(struct socket *sock);
55static int tipc_accept(struct socket *sock, struct socket *new_sock, int flags);
b97bf3fd 56
bca65eae
FW
57static const struct proto_ops packet_ops;
58static const struct proto_ops stream_ops;
59static const struct proto_ops msg_ops;
b97bf3fd
PL
60
61static struct proto tipc_proto;
c5fa7b3c 62static struct proto tipc_proto_kern;
b97bf3fd 63
c4307285 64/*
0c3141e9
AS
65 * Revised TIPC socket locking policy:
66 *
67 * Most socket operations take the standard socket lock when they start
68 * and hold it until they finish (or until they need to sleep). Acquiring
69 * this lock grants the owner exclusive access to the fields of the socket
70 * data structures, with the exception of the backlog queue. A few socket
71 * operations can be done without taking the socket lock because they only
72 * read socket information that never changes during the life of the socket.
73 *
74 * Socket operations may acquire the lock for the associated TIPC port if they
75 * need to perform an operation on the port. If any routine needs to acquire
76 * both the socket lock and the port lock it must take the socket lock first
77 * to avoid the risk of deadlock.
78 *
79 * The dispatcher handling incoming messages cannot grab the socket lock in
80 * the standard fashion, since when invoked it runs at the BH level and cannot block.
81 * Instead, it checks to see if the socket lock is currently owned by someone,
82 * and either handles the message itself or adds it to the socket's backlog
83 * queue; in the latter case the queued message is processed once the process
84 * owning the socket lock releases it.
85 *
86 * NOTE: Releasing the socket lock while an operation is sleeping overcomes
87 * the problem of a blocked socket operation preventing any other operations
88 * from occurring. However, applications must be careful if they have
89 * multiple threads trying to send (or receive) on the same socket, as these
90 * operations might interfere with each other. For example, doing a connect
91 * and a receive at the same time might allow the receive to consume the
92 * ACK message meant for the connect. While additional work could be done
93 * to try and overcome this, it doesn't seem to be worthwhile at the present.
94 *
95 * NOTE: Releasing the socket lock while an operation is sleeping also ensures
96 * that another operation that must be performed in a non-blocking manner is
97 * not delayed for very long because the lock has already been taken.
98 *
99 * NOTE: This code assumes that certain fields of a port/socket pair are
100 * constant over its lifetime; such fields can be examined without taking
101 * the socket lock and/or port lock, and do not need to be re-read even
102 * after resuming processing after waiting. These fields include:
103 * - socket type
104 * - pointer to socket sk structure (aka tipc_sock structure)
105 * - pointer to port structure
106 * - port reference
107 */
108
8826cde6
JPM
109#include "socket.h"
110
0c3141e9
AS
111/**
112 * advance_rx_queue - discard first buffer in socket receive queue
113 *
114 * Caller must hold socket lock
b97bf3fd 115 */
0c3141e9 116static void advance_rx_queue(struct sock *sk)
b97bf3fd 117{
5f6d9123 118 kfree_skb(__skb_dequeue(&sk->sk_receive_queue));
b97bf3fd
PL
119}
120
b97bf3fd 121/**
0c3141e9
AS
122 * reject_rx_queue - reject all buffers in socket receive queue
123 *
124 * Caller must hold socket lock
b97bf3fd 125 */
0c3141e9 126static void reject_rx_queue(struct sock *sk)
b97bf3fd 127{
0c3141e9 128 struct sk_buff *buf;
8db1bae3 129 u32 dnode;
0c3141e9 130
8db1bae3
JPM
131 while ((buf = __skb_dequeue(&sk->sk_receive_queue))) {
132 if (tipc_msg_reverse(buf, &dnode, TIPC_ERR_NO_PORT))
133 tipc_link_xmit2(buf, dnode, 0);
134 }
b97bf3fd
PL
135}
136
137/**
c5fa7b3c 138 * tipc_sk_create - create a TIPC socket
0c3141e9 139 * @net: network namespace (must be default network)
b97bf3fd
PL
140 * @sock: pre-allocated socket structure
141 * @protocol: protocol indicator (must be 0)
3f378b68 142 * @kern: caused by kernel or by userspace?
c4307285 143 *
0c3141e9
AS
144 * This routine creates additional data structures used by the TIPC socket,
145 * initializes them, and links them together.
b97bf3fd
PL
146 *
147 * Returns 0 on success, errno otherwise
148 */
58ed9442
JPM
149static int tipc_sk_create(struct net *net, struct socket *sock,
150 int protocol, int kern)
b97bf3fd 151{
0c3141e9
AS
152 const struct proto_ops *ops;
153 socket_state state;
b97bf3fd 154 struct sock *sk;
58ed9442
JPM
155 struct tipc_sock *tsk;
156 struct tipc_port *port;
157 u32 ref;
0c3141e9
AS
158
159 /* Validate arguments */
b97bf3fd
PL
160 if (unlikely(protocol != 0))
161 return -EPROTONOSUPPORT;
162
b97bf3fd
PL
163 switch (sock->type) {
164 case SOCK_STREAM:
0c3141e9
AS
165 ops = &stream_ops;
166 state = SS_UNCONNECTED;
b97bf3fd
PL
167 break;
168 case SOCK_SEQPACKET:
0c3141e9
AS
169 ops = &packet_ops;
170 state = SS_UNCONNECTED;
b97bf3fd
PL
171 break;
172 case SOCK_DGRAM:
b97bf3fd 173 case SOCK_RDM:
0c3141e9
AS
174 ops = &msg_ops;
175 state = SS_READY;
b97bf3fd 176 break;
49978651 177 default:
49978651 178 return -EPROTOTYPE;
b97bf3fd
PL
179 }
180
0c3141e9 181 /* Allocate socket's protocol area */
c5fa7b3c
YX
182 if (!kern)
183 sk = sk_alloc(net, AF_TIPC, GFP_KERNEL, &tipc_proto);
184 else
185 sk = sk_alloc(net, AF_TIPC, GFP_KERNEL, &tipc_proto_kern);
186
0c3141e9 187 if (sk == NULL)
b97bf3fd 188 return -ENOMEM;
b97bf3fd 189
58ed9442
JPM
190 tsk = tipc_sk(sk);
191 port = &tsk->port;
192
193 ref = tipc_port_init(port, TIPC_LOW_IMPORTANCE);
194 if (!ref) {
195 pr_warn("Socket registration failed, ref. table exhausted\n");
0c3141e9
AS
196 sk_free(sk);
197 return -ENOMEM;
198 }
b97bf3fd 199
0c3141e9 200 /* Finish initializing socket data structures */
0c3141e9
AS
201 sock->ops = ops;
202 sock->state = state;
b97bf3fd 203
0c3141e9 204 sock_init_data(sock, sk);
4f4482dc 205 sk->sk_backlog_rcv = tipc_backlog_rcv;
cc79dd1b 206 sk->sk_rcvbuf = sysctl_tipc_rmem[1];
f288bef4
YX
207 sk->sk_data_ready = tipc_data_ready;
208 sk->sk_write_space = tipc_write_space;
4f4482dc 209 tsk->conn_timeout = CONN_TIMEOUT_DEFAULT;
60120526 210 tsk->sent_unacked = 0;
4f4482dc 211 atomic_set(&tsk->dupl_rcvcnt, 0);
58ed9442 212 tipc_port_unlock(port);
7ef43eba 213
0c3141e9 214 if (sock->state == SS_READY) {
58ed9442 215 tipc_port_set_unreturnable(port, true);
0c3141e9 216 if (sock->type == SOCK_DGRAM)
58ed9442 217 tipc_port_set_unreliable(port, true);
0c3141e9 218 }
b97bf3fd
PL
219 return 0;
220}
221
c5fa7b3c
YX
222/**
223 * tipc_sock_create_local - create TIPC socket from inside TIPC module
224 * @type: socket type - SOCK_RDM or SOCK_SEQPACKET
225 *
226 * We cannot use sock_creat_kern here because it bumps module user count.
227 * Since socket owner and creator is the same module we must make sure
228 * that module count remains zero for module local sockets, otherwise
229 * we cannot do rmmod.
230 *
231 * Returns 0 on success, errno otherwise
232 */
233int tipc_sock_create_local(int type, struct socket **res)
234{
235 int rc;
c5fa7b3c
YX
236
237 rc = sock_create_lite(AF_TIPC, type, 0, res);
238 if (rc < 0) {
239 pr_err("Failed to create kernel socket\n");
240 return rc;
241 }
242 tipc_sk_create(&init_net, *res, 0, 1);
243
c5fa7b3c
YX
244 return 0;
245}
246
247/**
248 * tipc_sock_release_local - release socket created by tipc_sock_create_local
249 * @sock: the socket to be released.
250 *
251 * Module reference count is not incremented when such sockets are created,
252 * so we must keep it from being decremented when they are released.
253 */
254void tipc_sock_release_local(struct socket *sock)
255{
247f0f3c 256 tipc_release(sock);
c5fa7b3c
YX
257 sock->ops = NULL;
258 sock_release(sock);
259}
260
261/**
262 * tipc_sock_accept_local - accept a connection on a socket created
263 * with tipc_sock_create_local. Use this function to avoid that
264 * module reference count is inadvertently incremented.
265 *
266 * @sock: the accepting socket
267 * @newsock: reference to the new socket to be created
268 * @flags: socket flags
269 */
270
271int tipc_sock_accept_local(struct socket *sock, struct socket **newsock,
ae8509c4 272 int flags)
c5fa7b3c
YX
273{
274 struct sock *sk = sock->sk;
275 int ret;
276
277 ret = sock_create_lite(sk->sk_family, sk->sk_type,
278 sk->sk_protocol, newsock);
279 if (ret < 0)
280 return ret;
281
247f0f3c 282 ret = tipc_accept(sock, *newsock, flags);
c5fa7b3c
YX
283 if (ret < 0) {
284 sock_release(*newsock);
285 return ret;
286 }
287 (*newsock)->ops = sock->ops;
288 return ret;
289}
290
b97bf3fd 291/**
247f0f3c 292 * tipc_release - destroy a TIPC socket
b97bf3fd
PL
293 * @sock: socket to destroy
294 *
295 * This routine cleans up any messages that are still queued on the socket.
296 * For DGRAM and RDM socket types, all queued messages are rejected.
297 * For SEQPACKET and STREAM socket types, the first message is rejected
298 * and any others are discarded. (If the first message on a STREAM socket
299 * is partially-read, it is discarded and the next one is rejected instead.)
c4307285 300 *
b97bf3fd
PL
301 * NOTE: Rejected messages are not necessarily returned to the sender! They
302 * are returned or discarded according to the "destination droppable" setting
303 * specified for the message by the sender.
304 *
305 * Returns 0 on success, errno otherwise
306 */
247f0f3c 307static int tipc_release(struct socket *sock)
b97bf3fd 308{
b97bf3fd 309 struct sock *sk = sock->sk;
58ed9442
JPM
310 struct tipc_sock *tsk;
311 struct tipc_port *port;
b97bf3fd 312 struct sk_buff *buf;
8db1bae3 313 u32 dnode;
b97bf3fd 314
0c3141e9
AS
315 /*
316 * Exit if socket isn't fully initialized (occurs when a failed accept()
317 * releases a pre-allocated child socket that was never used)
318 */
0c3141e9 319 if (sk == NULL)
b97bf3fd 320 return 0;
c4307285 321
58ed9442
JPM
322 tsk = tipc_sk(sk);
323 port = &tsk->port;
0c3141e9
AS
324 lock_sock(sk);
325
326 /*
327 * Reject all unreceived messages, except on an active connection
328 * (which disconnects locally & sends a 'FIN+' to peer)
329 */
b97bf3fd 330 while (sock->state != SS_DISCONNECTING) {
0c3141e9
AS
331 buf = __skb_dequeue(&sk->sk_receive_queue);
332 if (buf == NULL)
b97bf3fd 333 break;
40682432 334 if (TIPC_SKB_CB(buf)->handle != NULL)
5f6d9123 335 kfree_skb(buf);
0c3141e9
AS
336 else {
337 if ((sock->state == SS_CONNECTING) ||
338 (sock->state == SS_CONNECTED)) {
339 sock->state = SS_DISCONNECTING;
58ed9442 340 tipc_port_disconnect(port->ref);
0c3141e9 341 }
8db1bae3
JPM
342 if (tipc_msg_reverse(buf, &dnode, TIPC_ERR_NO_PORT))
343 tipc_link_xmit2(buf, dnode, 0);
0c3141e9 344 }
b97bf3fd
PL
345 }
346
58ed9442
JPM
347 /* Destroy TIPC port; also disconnects an active connection and
348 * sends a 'FIN-' to peer.
0c3141e9 349 */
58ed9442 350 tipc_port_destroy(port);
b97bf3fd 351
0c3141e9 352 /* Discard any remaining (connection-based) messages in receive queue */
57467e56 353 __skb_queue_purge(&sk->sk_receive_queue);
b97bf3fd 354
0c3141e9 355 /* Reject any messages that accumulated in backlog queue */
0c3141e9
AS
356 sock->state = SS_DISCONNECTING;
357 release_sock(sk);
b97bf3fd
PL
358
359 sock_put(sk);
0c3141e9 360 sock->sk = NULL;
b97bf3fd 361
065d7e39 362 return 0;
b97bf3fd
PL
363}
364
365/**
247f0f3c 366 * tipc_bind - associate or disassocate TIPC name(s) with a socket
b97bf3fd
PL
367 * @sock: socket structure
368 * @uaddr: socket address describing name(s) and desired operation
369 * @uaddr_len: size of socket address data structure
c4307285 370 *
b97bf3fd
PL
371 * Name and name sequence binding is indicated using a positive scope value;
372 * a negative scope value unbinds the specified name. Specifying no name
373 * (i.e. a socket address length of 0) unbinds all names from the socket.
c4307285 374 *
b97bf3fd 375 * Returns 0 on success, errno otherwise
0c3141e9
AS
376 *
377 * NOTE: This routine doesn't need to take the socket lock since it doesn't
378 * access any non-constant socket information.
b97bf3fd 379 */
247f0f3c
YX
380static int tipc_bind(struct socket *sock, struct sockaddr *uaddr,
381 int uaddr_len)
b97bf3fd 382{
84602761 383 struct sock *sk = sock->sk;
b97bf3fd 384 struct sockaddr_tipc *addr = (struct sockaddr_tipc *)uaddr;
58ed9442 385 struct tipc_sock *tsk = tipc_sk(sk);
84602761 386 int res = -EINVAL;
b97bf3fd 387
84602761
YX
388 lock_sock(sk);
389 if (unlikely(!uaddr_len)) {
58ed9442 390 res = tipc_withdraw(&tsk->port, 0, NULL);
84602761
YX
391 goto exit;
392 }
c4307285 393
84602761
YX
394 if (uaddr_len < sizeof(struct sockaddr_tipc)) {
395 res = -EINVAL;
396 goto exit;
397 }
398 if (addr->family != AF_TIPC) {
399 res = -EAFNOSUPPORT;
400 goto exit;
401 }
b97bf3fd 402
b97bf3fd
PL
403 if (addr->addrtype == TIPC_ADDR_NAME)
404 addr->addr.nameseq.upper = addr->addr.nameseq.lower;
84602761
YX
405 else if (addr->addrtype != TIPC_ADDR_NAMESEQ) {
406 res = -EAFNOSUPPORT;
407 goto exit;
408 }
c4307285 409
13a2e898 410 if ((addr->addr.nameseq.type < TIPC_RESERVED_TYPES) &&
7d0ab17b 411 (addr->addr.nameseq.type != TIPC_TOP_SRV) &&
84602761
YX
412 (addr->addr.nameseq.type != TIPC_CFG_SRV)) {
413 res = -EACCES;
414 goto exit;
415 }
c422f1bd 416
84602761 417 res = (addr->scope > 0) ?
58ed9442
JPM
418 tipc_publish(&tsk->port, addr->scope, &addr->addr.nameseq) :
419 tipc_withdraw(&tsk->port, -addr->scope, &addr->addr.nameseq);
84602761
YX
420exit:
421 release_sock(sk);
422 return res;
b97bf3fd
PL
423}
424
c4307285 425/**
247f0f3c 426 * tipc_getname - get port ID of socket or peer socket
b97bf3fd
PL
427 * @sock: socket structure
428 * @uaddr: area for returned socket address
429 * @uaddr_len: area for returned length of socket address
2da59918 430 * @peer: 0 = own ID, 1 = current peer ID, 2 = current/former peer ID
c4307285 431 *
b97bf3fd 432 * Returns 0 on success, errno otherwise
0c3141e9 433 *
2da59918
AS
434 * NOTE: This routine doesn't need to take the socket lock since it only
435 * accesses socket information that is unchanging (or which changes in
0e65967e 436 * a completely predictable manner).
b97bf3fd 437 */
247f0f3c
YX
438static int tipc_getname(struct socket *sock, struct sockaddr *uaddr,
439 int *uaddr_len, int peer)
b97bf3fd 440{
b97bf3fd 441 struct sockaddr_tipc *addr = (struct sockaddr_tipc *)uaddr;
58ed9442 442 struct tipc_sock *tsk = tipc_sk(sock->sk);
b97bf3fd 443
88f8a5e3 444 memset(addr, 0, sizeof(*addr));
0c3141e9 445 if (peer) {
2da59918
AS
446 if ((sock->state != SS_CONNECTED) &&
447 ((peer != 2) || (sock->state != SS_DISCONNECTING)))
448 return -ENOTCONN;
58ed9442
JPM
449 addr->addr.id.ref = tipc_port_peerport(&tsk->port);
450 addr->addr.id.node = tipc_port_peernode(&tsk->port);
0c3141e9 451 } else {
58ed9442 452 addr->addr.id.ref = tsk->port.ref;
b924dcf0 453 addr->addr.id.node = tipc_own_addr;
0c3141e9 454 }
b97bf3fd
PL
455
456 *uaddr_len = sizeof(*addr);
457 addr->addrtype = TIPC_ADDR_ID;
458 addr->family = AF_TIPC;
459 addr->scope = 0;
b97bf3fd
PL
460 addr->addr.name.domain = 0;
461
0c3141e9 462 return 0;
b97bf3fd
PL
463}
464
465/**
247f0f3c 466 * tipc_poll - read and possibly block on pollmask
b97bf3fd
PL
467 * @file: file structure associated with the socket
468 * @sock: socket for which to calculate the poll bits
469 * @wait: ???
470 *
9b674e82
AS
471 * Returns pollmask value
472 *
473 * COMMENTARY:
474 * It appears that the usual socket locking mechanisms are not useful here
475 * since the pollmask info is potentially out-of-date the moment this routine
476 * exits. TCP and other protocols seem to rely on higher level poll routines
477 * to handle any preventable race conditions, so TIPC will do the same ...
478 *
479 * TIPC sets the returned events as follows:
f662c070
AS
480 *
481 * socket state flags set
482 * ------------ ---------
483 * unconnected no read flags
c4fc298a 484 * POLLOUT if port is not congested
f662c070
AS
485 *
486 * connecting POLLIN/POLLRDNORM if ACK/NACK in rx queue
487 * no write flags
488 *
489 * connected POLLIN/POLLRDNORM if data in rx queue
490 * POLLOUT if port is not congested
491 *
492 * disconnecting POLLIN/POLLRDNORM/POLLHUP
493 * no write flags
494 *
495 * listening POLLIN if SYN in rx queue
496 * no write flags
497 *
498 * ready POLLIN/POLLRDNORM if data in rx queue
499 * [connectionless] POLLOUT (since port cannot be congested)
500 *
501 * IMPORTANT: The fact that a read or write operation is indicated does NOT
502 * imply that the operation will succeed, merely that it should be performed
503 * and will not block.
b97bf3fd 504 */
247f0f3c
YX
505static unsigned int tipc_poll(struct file *file, struct socket *sock,
506 poll_table *wait)
b97bf3fd 507{
9b674e82 508 struct sock *sk = sock->sk;
58ed9442 509 struct tipc_sock *tsk = tipc_sk(sk);
f662c070 510 u32 mask = 0;
9b674e82 511
f288bef4 512 sock_poll_wait(file, sk_sleep(sk), wait);
9b674e82 513
f662c070 514 switch ((int)sock->state) {
c4fc298a 515 case SS_UNCONNECTED:
60120526 516 if (!tsk->link_cong)
c4fc298a
EH
517 mask |= POLLOUT;
518 break;
f662c070
AS
519 case SS_READY:
520 case SS_CONNECTED:
60120526 521 if (!tsk->link_cong && !tipc_sk_conn_cong(tsk))
f662c070
AS
522 mask |= POLLOUT;
523 /* fall thru' */
524 case SS_CONNECTING:
525 case SS_LISTENING:
526 if (!skb_queue_empty(&sk->sk_receive_queue))
527 mask |= (POLLIN | POLLRDNORM);
528 break;
529 case SS_DISCONNECTING:
530 mask = (POLLIN | POLLRDNORM | POLLHUP);
531 break;
532 }
9b674e82
AS
533
534 return mask;
b97bf3fd
PL
535}
536
ac0074ee
JPM
537/**
538 * tipc_sk_proto_rcv - receive a connection mng protocol message
539 * @tsk: receiving socket
540 * @dnode: node to send response message to, if any
541 * @buf: buffer containing protocol message
542 * Returns 0 (TIPC_OK) if message was consumed, 1 (TIPC_FWD_MSG) if
543 * (CONN_PROBE_REPLY) message should be forwarded.
544 */
545int tipc_sk_proto_rcv(struct tipc_sock *tsk, u32 *dnode, struct sk_buff *buf)
546{
547 struct tipc_msg *msg = buf_msg(buf);
548 struct tipc_port *port = &tsk->port;
60120526 549 int conn_cong;
ac0074ee
JPM
550
551 /* Ignore if connection cannot be validated: */
552 if (!port->connected || !tipc_port_peer_msg(port, msg))
553 goto exit;
554
555 port->probing_state = TIPC_CONN_OK;
556
557 if (msg_type(msg) == CONN_ACK) {
60120526
JPM
558 conn_cong = tipc_sk_conn_cong(tsk);
559 tsk->sent_unacked -= msg_msgcnt(msg);
560 if (conn_cong)
561 tipc_sock_wakeup(tsk);
ac0074ee
JPM
562 } else if (msg_type(msg) == CONN_PROBE) {
563 if (!tipc_msg_reverse(buf, dnode, TIPC_OK))
564 return TIPC_OK;
565 msg_set_type(msg, CONN_PROBE_REPLY);
566 return TIPC_FWD_MSG;
567 }
568 /* Do nothing if msg_type() == CONN_PROBE_REPLY */
569exit:
570 kfree_skb(buf);
571 return TIPC_OK;
572}
573
c4307285 574/**
b97bf3fd
PL
575 * dest_name_check - verify user is permitted to send to specified port name
576 * @dest: destination address
577 * @m: descriptor for message to be sent
c4307285 578 *
b97bf3fd
PL
579 * Prevents restricted configuration commands from being issued by
580 * unauthorized users.
c4307285 581 *
b97bf3fd
PL
582 * Returns 0 if permission is granted, otherwise errno
583 */
05790c64 584static int dest_name_check(struct sockaddr_tipc *dest, struct msghdr *m)
b97bf3fd
PL
585{
586 struct tipc_cfg_msg_hdr hdr;
587
e2dafe87
JPM
588 if (unlikely(dest->addrtype == TIPC_ADDR_ID))
589 return 0;
c4307285
YH
590 if (likely(dest->addr.name.name.type >= TIPC_RESERVED_TYPES))
591 return 0;
592 if (likely(dest->addr.name.name.type == TIPC_TOP_SRV))
593 return 0;
c4307285
YH
594 if (likely(dest->addr.name.name.type != TIPC_CFG_SRV))
595 return -EACCES;
b97bf3fd 596
3f8dd944
AS
597 if (!m->msg_iovlen || (m->msg_iov[0].iov_len < sizeof(hdr)))
598 return -EMSGSIZE;
c4307285 599 if (copy_from_user(&hdr, m->msg_iov[0].iov_base, sizeof(hdr)))
b97bf3fd 600 return -EFAULT;
70cb2347 601 if ((ntohs(hdr.tcm_type) & 0xC000) && (!capable(CAP_NET_ADMIN)))
b97bf3fd 602 return -EACCES;
c4307285 603
b97bf3fd
PL
604 return 0;
605}
606
3f40504f
YX
607static int tipc_wait_for_sndmsg(struct socket *sock, long *timeo_p)
608{
609 struct sock *sk = sock->sk;
58ed9442 610 struct tipc_sock *tsk = tipc_sk(sk);
3f40504f
YX
611 DEFINE_WAIT(wait);
612 int done;
613
614 do {
615 int err = sock_error(sk);
616 if (err)
617 return err;
618 if (sock->state == SS_DISCONNECTING)
619 return -EPIPE;
620 if (!*timeo_p)
621 return -EAGAIN;
622 if (signal_pending(current))
623 return sock_intr_errno(*timeo_p);
624
625 prepare_to_wait(sk_sleep(sk), &wait, TASK_INTERRUPTIBLE);
60120526 626 done = sk_wait_event(sk, timeo_p, !tsk->link_cong);
3f40504f
YX
627 finish_wait(sk_sleep(sk), &wait);
628 } while (!done);
629 return 0;
630}
631
e2dafe87
JPM
632/**
633 * tipc_sendmcast - send multicast message
634 * @sock: socket structure
635 * @seq: destination address
636 * @iov: message data to send
637 * @dsz: total length of message data
638 * @timeo: timeout to wait for wakeup
639 *
640 * Called from function tipc_sendmsg(), which has done all sanity checks
641 * Returns the number of bytes sent on success, or errno
642 */
643static int tipc_sendmcast(struct socket *sock, struct tipc_name_seq *seq,
644 struct iovec *iov, size_t dsz, long timeo)
645{
646 struct sock *sk = sock->sk;
647 struct tipc_sock *tsk = tipc_sk(sk);
648 int rc;
649
650 do {
651 if (sock->state != SS_READY) {
652 rc = -EOPNOTSUPP;
653 break;
654 }
655 rc = tipc_port_mcast_xmit(&tsk->port, seq, iov, dsz);
656 if (likely(rc >= 0)) {
657 if (sock->state != SS_READY)
658 sock->state = SS_CONNECTING;
659 break;
660 }
661 if (rc != -ELINKCONG)
662 break;
663 rc = tipc_wait_for_sndmsg(sock, &timeo);
664 } while (!rc);
665
666 return rc;
667}
58ed9442 668
b97bf3fd 669/**
247f0f3c 670 * tipc_sendmsg - send message in connectionless manner
0c3141e9 671 * @iocb: if NULL, indicates that socket lock is already held
b97bf3fd
PL
672 * @sock: socket structure
673 * @m: message to send
e2dafe87 674 * @dsz: amount of user data to be sent
c4307285 675 *
b97bf3fd 676 * Message must have an destination specified explicitly.
c4307285 677 * Used for SOCK_RDM and SOCK_DGRAM messages,
b97bf3fd
PL
678 * and for 'SYN' messages on SOCK_SEQPACKET and SOCK_STREAM connections.
679 * (Note: 'SYN+' is prohibited on SOCK_STREAM.)
c4307285 680 *
b97bf3fd
PL
681 * Returns the number of bytes sent on success, or errno otherwise
682 */
247f0f3c 683static int tipc_sendmsg(struct kiocb *iocb, struct socket *sock,
e2dafe87 684 struct msghdr *m, size_t dsz)
b97bf3fd 685{
e2dafe87 686 DECLARE_SOCKADDR(struct sockaddr_tipc *, dest, m->msg_name);
0c3141e9 687 struct sock *sk = sock->sk;
58ed9442 688 struct tipc_sock *tsk = tipc_sk(sk);
5c311421 689 struct tipc_port *port = &tsk->port;
e2dafe87
JPM
690 struct tipc_msg *mhdr = &port->phdr;
691 struct iovec *iov = m->msg_iov;
692 u32 dnode, dport;
693 struct sk_buff *buf;
694 struct tipc_name_seq *seq = &dest->addr.nameseq;
695 u32 mtu;
3f40504f 696 long timeo;
e2dafe87 697 int rc = -EINVAL;
b97bf3fd
PL
698
699 if (unlikely(!dest))
700 return -EDESTADDRREQ;
e2dafe87 701
51f9cc1f
AS
702 if (unlikely((m->msg_namelen < sizeof(*dest)) ||
703 (dest->family != AF_TIPC)))
b97bf3fd 704 return -EINVAL;
e2dafe87
JPM
705
706 if (dsz > TIPC_MAX_USER_MSG_SIZE)
c29c3f70 707 return -EMSGSIZE;
b97bf3fd 708
0c3141e9
AS
709 if (iocb)
710 lock_sock(sk);
711
e2dafe87 712 if (unlikely(sock->state != SS_READY)) {
0c3141e9 713 if (sock->state == SS_LISTENING) {
e2dafe87 714 rc = -EPIPE;
0c3141e9
AS
715 goto exit;
716 }
717 if (sock->state != SS_UNCONNECTED) {
e2dafe87 718 rc = -EISCONN;
0c3141e9
AS
719 goto exit;
720 }
58ed9442 721 if (tsk->port.published) {
e2dafe87 722 rc = -EOPNOTSUPP;
0c3141e9
AS
723 goto exit;
724 }
3388007b 725 if (dest->addrtype == TIPC_ADDR_NAME) {
58ed9442
JPM
726 tsk->port.conn_type = dest->addr.name.name.type;
727 tsk->port.conn_instance = dest->addr.name.name.instance;
3388007b 728 }
b97bf3fd 729 }
e2dafe87
JPM
730 rc = dest_name_check(dest, m);
731 if (rc)
732 goto exit;
b97bf3fd 733
3f40504f 734 timeo = sock_sndtimeo(sk, m->msg_flags & MSG_DONTWAIT);
e2dafe87
JPM
735
736 if (dest->addrtype == TIPC_ADDR_MCAST) {
737 rc = tipc_sendmcast(sock, seq, iov, dsz, timeo);
738 goto exit;
739 } else if (dest->addrtype == TIPC_ADDR_NAME) {
740 u32 type = dest->addr.name.name.type;
741 u32 inst = dest->addr.name.name.instance;
742 u32 domain = dest->addr.name.domain;
743
744 dnode = domain;
745 msg_set_type(mhdr, TIPC_NAMED_MSG);
746 msg_set_hdr_sz(mhdr, NAMED_H_SIZE);
747 msg_set_nametype(mhdr, type);
748 msg_set_nameinst(mhdr, inst);
749 msg_set_lookup_scope(mhdr, tipc_addr_scope(domain));
750 dport = tipc_nametbl_translate(type, inst, &dnode);
751 msg_set_destnode(mhdr, dnode);
752 msg_set_destport(mhdr, dport);
753 if (unlikely(!dport && !dnode)) {
754 rc = -EHOSTUNREACH;
755 goto exit;
c4307285 756 }
e2dafe87
JPM
757 } else if (dest->addrtype == TIPC_ADDR_ID) {
758 dnode = dest->addr.id.node;
759 msg_set_type(mhdr, TIPC_DIRECT_MSG);
760 msg_set_lookup_scope(mhdr, 0);
761 msg_set_destnode(mhdr, dnode);
762 msg_set_destport(mhdr, dest->addr.id.ref);
763 msg_set_hdr_sz(mhdr, BASIC_H_SIZE);
764 }
765
766new_mtu:
767 mtu = tipc_node_get_mtu(dnode, tsk->port.ref);
768 rc = tipc_msg_build2(mhdr, iov, 0, dsz, mtu, &buf);
769 if (rc < 0)
770 goto exit;
771
772 do {
773 rc = tipc_link_xmit2(buf, dnode, tsk->port.ref);
774 if (likely(rc >= 0)) {
775 if (sock->state != SS_READY)
0c3141e9 776 sock->state = SS_CONNECTING;
e2dafe87 777 rc = dsz;
0c3141e9 778 break;
c4307285 779 }
e2dafe87
JPM
780 if (rc == -EMSGSIZE)
781 goto new_mtu;
782
783 if (rc != -ELINKCONG)
0c3141e9 784 break;
e2dafe87
JPM
785
786 rc = tipc_wait_for_sndmsg(sock, &timeo);
787 } while (!rc);
0c3141e9
AS
788
789exit:
790 if (iocb)
791 release_sock(sk);
e2dafe87
JPM
792
793 return rc;
b97bf3fd
PL
794}
795
391a6dd1
YX
796static int tipc_wait_for_sndpkt(struct socket *sock, long *timeo_p)
797{
798 struct sock *sk = sock->sk;
58ed9442 799 struct tipc_sock *tsk = tipc_sk(sk);
391a6dd1
YX
800 DEFINE_WAIT(wait);
801 int done;
802
803 do {
804 int err = sock_error(sk);
805 if (err)
806 return err;
807 if (sock->state == SS_DISCONNECTING)
808 return -EPIPE;
809 else if (sock->state != SS_CONNECTED)
810 return -ENOTCONN;
811 if (!*timeo_p)
812 return -EAGAIN;
813 if (signal_pending(current))
814 return sock_intr_errno(*timeo_p);
815
816 prepare_to_wait(sk_sleep(sk), &wait, TASK_INTERRUPTIBLE);
817 done = sk_wait_event(sk, timeo_p,
60120526
JPM
818 (!tsk->link_cong &&
819 !tipc_sk_conn_cong(tsk)) ||
820 !tsk->port.connected);
391a6dd1
YX
821 finish_wait(sk_sleep(sk), &wait);
822 } while (!done);
823 return 0;
824}
825
c4307285 826/**
4ccfe5e0
JPM
827 * tipc_send_stream - send stream-oriented data
828 * @iocb: (unused)
b97bf3fd 829 * @sock: socket structure
4ccfe5e0
JPM
830 * @m: data to send
831 * @dsz: total length of data to be transmitted
c4307285 832 *
4ccfe5e0 833 * Used for SOCK_STREAM data.
c4307285 834 *
4ccfe5e0
JPM
835 * Returns the number of bytes sent on success (or partial success),
836 * or errno if no data sent
b97bf3fd 837 */
4ccfe5e0
JPM
838static int tipc_send_stream(struct kiocb *iocb, struct socket *sock,
839 struct msghdr *m, size_t dsz)
b97bf3fd 840{
0c3141e9 841 struct sock *sk = sock->sk;
58ed9442 842 struct tipc_sock *tsk = tipc_sk(sk);
4ccfe5e0
JPM
843 struct tipc_port *port = &tsk->port;
844 struct tipc_msg *mhdr = &port->phdr;
845 struct sk_buff *buf;
342dfc30 846 DECLARE_SOCKADDR(struct sockaddr_tipc *, dest, m->msg_name);
4ccfe5e0
JPM
847 u32 ref = port->ref;
848 int rc = -EINVAL;
391a6dd1 849 long timeo;
4ccfe5e0
JPM
850 u32 dnode;
851 uint mtu, send, sent = 0;
b97bf3fd
PL
852
853 /* Handle implied connection establishment */
4ccfe5e0
JPM
854 if (unlikely(dest)) {
855 rc = tipc_sendmsg(iocb, sock, m, dsz);
856 if (dsz && (dsz == rc))
60120526 857 tsk->sent_unacked = 1;
4ccfe5e0
JPM
858 return rc;
859 }
860 if (dsz > (uint)INT_MAX)
c29c3f70
AS
861 return -EMSGSIZE;
862
0c3141e9
AS
863 if (iocb)
864 lock_sock(sk);
b97bf3fd 865
391a6dd1
YX
866 if (unlikely(sock->state != SS_CONNECTED)) {
867 if (sock->state == SS_DISCONNECTING)
4ccfe5e0 868 rc = -EPIPE;
391a6dd1 869 else
4ccfe5e0 870 rc = -ENOTCONN;
391a6dd1
YX
871 goto exit;
872 }
1d835874 873
391a6dd1 874 timeo = sock_sndtimeo(sk, m->msg_flags & MSG_DONTWAIT);
4ccfe5e0 875 dnode = tipc_port_peernode(port);
4ccfe5e0
JPM
876
877next:
878 mtu = port->max_pkt;
879 send = min_t(uint, dsz - sent, TIPC_MAX_USER_MSG_SIZE);
880 rc = tipc_msg_build2(mhdr, m->msg_iov, sent, send, mtu, &buf);
881 if (unlikely(rc < 0))
882 goto exit;
c4307285 883 do {
60120526 884 if (likely(!tipc_sk_conn_cong(tsk))) {
4ccfe5e0
JPM
885 rc = tipc_link_xmit2(buf, dnode, ref);
886 if (likely(!rc)) {
60120526 887 tsk->sent_unacked++;
4ccfe5e0
JPM
888 sent += send;
889 if (sent == dsz)
890 break;
891 goto next;
892 }
893 if (rc == -EMSGSIZE) {
894 port->max_pkt = tipc_node_get_mtu(dnode, ref);
895 goto next;
896 }
897 if (rc != -ELINKCONG)
898 break;
899 }
900 rc = tipc_wait_for_sndpkt(sock, &timeo);
901 } while (!rc);
391a6dd1 902exit:
0c3141e9
AS
903 if (iocb)
904 release_sock(sk);
4ccfe5e0 905 return sent ? sent : rc;
b97bf3fd
PL
906}
907
c4307285 908/**
4ccfe5e0
JPM
909 * tipc_send_packet - send a connection-oriented message
910 * @iocb: if NULL, indicates that socket lock is already held
b97bf3fd 911 * @sock: socket structure
4ccfe5e0
JPM
912 * @m: message to send
913 * @dsz: length of data to be transmitted
c4307285 914 *
4ccfe5e0 915 * Used for SOCK_SEQPACKET messages.
c4307285 916 *
4ccfe5e0 917 * Returns the number of bytes sent on success, or errno otherwise
b97bf3fd 918 */
4ccfe5e0
JPM
919static int tipc_send_packet(struct kiocb *iocb, struct socket *sock,
920 struct msghdr *m, size_t dsz)
b97bf3fd 921{
4ccfe5e0
JPM
922 if (dsz > TIPC_MAX_USER_MSG_SIZE)
923 return -EMSGSIZE;
b97bf3fd 924
4ccfe5e0 925 return tipc_send_stream(iocb, sock, m, dsz);
b97bf3fd
PL
926}
927
928/**
929 * auto_connect - complete connection setup to a remote port
58ed9442 930 * @tsk: tipc socket structure
b97bf3fd 931 * @msg: peer's response message
c4307285 932 *
b97bf3fd
PL
933 * Returns 0 on success, errno otherwise
934 */
58ed9442 935static int auto_connect(struct tipc_sock *tsk, struct tipc_msg *msg)
b97bf3fd 936{
58ed9442
JPM
937 struct tipc_port *port = &tsk->port;
938 struct socket *sock = tsk->sk.sk_socket;
f9fef18c
JPM
939 struct tipc_portid peer;
940
941 peer.ref = msg_origport(msg);
942 peer.node = msg_orignode(msg);
b97bf3fd 943
58ed9442 944 __tipc_port_connect(port->ref, port, &peer);
584d24b3
YX
945
946 if (msg_importance(msg) > TIPC_CRITICAL_IMPORTANCE)
947 return -EINVAL;
58ed9442 948 msg_set_importance(&port->phdr, (u32)msg_importance(msg));
b97bf3fd
PL
949 sock->state = SS_CONNECTED;
950 return 0;
951}
952
953/**
954 * set_orig_addr - capture sender's address for received message
955 * @m: descriptor for message info
956 * @msg: received message header
c4307285 957 *
b97bf3fd
PL
958 * Note: Address is not captured if not requested by receiver.
959 */
05790c64 960static void set_orig_addr(struct msghdr *m, struct tipc_msg *msg)
b97bf3fd 961{
342dfc30 962 DECLARE_SOCKADDR(struct sockaddr_tipc *, addr, m->msg_name);
b97bf3fd 963
c4307285 964 if (addr) {
b97bf3fd
PL
965 addr->family = AF_TIPC;
966 addr->addrtype = TIPC_ADDR_ID;
60085c3d 967 memset(&addr->addr, 0, sizeof(addr->addr));
b97bf3fd
PL
968 addr->addr.id.ref = msg_origport(msg);
969 addr->addr.id.node = msg_orignode(msg);
0e65967e
AS
970 addr->addr.name.domain = 0; /* could leave uninitialized */
971 addr->scope = 0; /* could leave uninitialized */
b97bf3fd
PL
972 m->msg_namelen = sizeof(struct sockaddr_tipc);
973 }
974}
975
976/**
c4307285 977 * anc_data_recv - optionally capture ancillary data for received message
b97bf3fd
PL
978 * @m: descriptor for message info
979 * @msg: received message header
980 * @tport: TIPC port associated with message
c4307285 981 *
b97bf3fd 982 * Note: Ancillary data is not captured if not requested by receiver.
c4307285 983 *
b97bf3fd
PL
984 * Returns 0 if successful, otherwise errno
985 */
05790c64 986static int anc_data_recv(struct msghdr *m, struct tipc_msg *msg,
ae8509c4 987 struct tipc_port *tport)
b97bf3fd
PL
988{
989 u32 anc_data[3];
990 u32 err;
991 u32 dest_type;
3546c750 992 int has_name;
b97bf3fd
PL
993 int res;
994
995 if (likely(m->msg_controllen == 0))
996 return 0;
997
998 /* Optionally capture errored message object(s) */
b97bf3fd
PL
999 err = msg ? msg_errcode(msg) : 0;
1000 if (unlikely(err)) {
1001 anc_data[0] = err;
1002 anc_data[1] = msg_data_sz(msg);
2db9983a
AS
1003 res = put_cmsg(m, SOL_TIPC, TIPC_ERRINFO, 8, anc_data);
1004 if (res)
b97bf3fd 1005 return res;
2db9983a
AS
1006 if (anc_data[1]) {
1007 res = put_cmsg(m, SOL_TIPC, TIPC_RETDATA, anc_data[1],
1008 msg_data(msg));
1009 if (res)
1010 return res;
1011 }
b97bf3fd
PL
1012 }
1013
1014 /* Optionally capture message destination object */
b97bf3fd
PL
1015 dest_type = msg ? msg_type(msg) : TIPC_DIRECT_MSG;
1016 switch (dest_type) {
1017 case TIPC_NAMED_MSG:
3546c750 1018 has_name = 1;
b97bf3fd
PL
1019 anc_data[0] = msg_nametype(msg);
1020 anc_data[1] = msg_namelower(msg);
1021 anc_data[2] = msg_namelower(msg);
1022 break;
1023 case TIPC_MCAST_MSG:
3546c750 1024 has_name = 1;
b97bf3fd
PL
1025 anc_data[0] = msg_nametype(msg);
1026 anc_data[1] = msg_namelower(msg);
1027 anc_data[2] = msg_nameupper(msg);
1028 break;
1029 case TIPC_CONN_MSG:
3546c750 1030 has_name = (tport->conn_type != 0);
b97bf3fd
PL
1031 anc_data[0] = tport->conn_type;
1032 anc_data[1] = tport->conn_instance;
1033 anc_data[2] = tport->conn_instance;
1034 break;
1035 default:
3546c750 1036 has_name = 0;
b97bf3fd 1037 }
2db9983a
AS
1038 if (has_name) {
1039 res = put_cmsg(m, SOL_TIPC, TIPC_DESTNAME, 12, anc_data);
1040 if (res)
1041 return res;
1042 }
b97bf3fd
PL
1043
1044 return 0;
1045}
1046
85d3fc94 1047static int tipc_wait_for_rcvmsg(struct socket *sock, long *timeop)
9bbb4ecc
YX
1048{
1049 struct sock *sk = sock->sk;
1050 DEFINE_WAIT(wait);
85d3fc94 1051 long timeo = *timeop;
9bbb4ecc
YX
1052 int err;
1053
1054 for (;;) {
1055 prepare_to_wait(sk_sleep(sk), &wait, TASK_INTERRUPTIBLE);
fe8e4649 1056 if (timeo && skb_queue_empty(&sk->sk_receive_queue)) {
9bbb4ecc
YX
1057 if (sock->state == SS_DISCONNECTING) {
1058 err = -ENOTCONN;
1059 break;
1060 }
1061 release_sock(sk);
1062 timeo = schedule_timeout(timeo);
1063 lock_sock(sk);
1064 }
1065 err = 0;
1066 if (!skb_queue_empty(&sk->sk_receive_queue))
1067 break;
1068 err = sock_intr_errno(timeo);
1069 if (signal_pending(current))
1070 break;
1071 err = -EAGAIN;
1072 if (!timeo)
1073 break;
1074 }
1075 finish_wait(sk_sleep(sk), &wait);
85d3fc94 1076 *timeop = timeo;
9bbb4ecc
YX
1077 return err;
1078}
1079
c4307285 1080/**
247f0f3c 1081 * tipc_recvmsg - receive packet-oriented message
b97bf3fd
PL
1082 * @iocb: (unused)
1083 * @m: descriptor for message info
1084 * @buf_len: total size of user buffer area
1085 * @flags: receive flags
c4307285 1086 *
b97bf3fd
PL
1087 * Used for SOCK_DGRAM, SOCK_RDM, and SOCK_SEQPACKET messages.
1088 * If the complete message doesn't fit in user area, truncate it.
1089 *
1090 * Returns size of returned message data, errno otherwise
1091 */
247f0f3c
YX
1092static int tipc_recvmsg(struct kiocb *iocb, struct socket *sock,
1093 struct msghdr *m, size_t buf_len, int flags)
b97bf3fd 1094{
0c3141e9 1095 struct sock *sk = sock->sk;
58ed9442
JPM
1096 struct tipc_sock *tsk = tipc_sk(sk);
1097 struct tipc_port *port = &tsk->port;
b97bf3fd
PL
1098 struct sk_buff *buf;
1099 struct tipc_msg *msg;
9bbb4ecc 1100 long timeo;
b97bf3fd
PL
1101 unsigned int sz;
1102 u32 err;
1103 int res;
1104
0c3141e9 1105 /* Catch invalid receive requests */
b97bf3fd
PL
1106 if (unlikely(!buf_len))
1107 return -EINVAL;
1108
0c3141e9 1109 lock_sock(sk);
b97bf3fd 1110
0c3141e9
AS
1111 if (unlikely(sock->state == SS_UNCONNECTED)) {
1112 res = -ENOTCONN;
b97bf3fd
PL
1113 goto exit;
1114 }
1115
9bbb4ecc 1116 timeo = sock_rcvtimeo(sk, flags & MSG_DONTWAIT);
0c3141e9 1117restart:
b97bf3fd 1118
0c3141e9 1119 /* Look for a message in receive queue; wait if necessary */
85d3fc94 1120 res = tipc_wait_for_rcvmsg(sock, &timeo);
9bbb4ecc
YX
1121 if (res)
1122 goto exit;
b97bf3fd 1123
0c3141e9 1124 /* Look at first message in receive queue */
0c3141e9 1125 buf = skb_peek(&sk->sk_receive_queue);
b97bf3fd
PL
1126 msg = buf_msg(buf);
1127 sz = msg_data_sz(msg);
1128 err = msg_errcode(msg);
1129
b97bf3fd 1130 /* Discard an empty non-errored message & try again */
b97bf3fd 1131 if ((!sz) && (!err)) {
0c3141e9 1132 advance_rx_queue(sk);
b97bf3fd
PL
1133 goto restart;
1134 }
1135
1136 /* Capture sender's address (optional) */
b97bf3fd
PL
1137 set_orig_addr(m, msg);
1138
1139 /* Capture ancillary data (optional) */
58ed9442 1140 res = anc_data_recv(m, msg, port);
0c3141e9 1141 if (res)
b97bf3fd
PL
1142 goto exit;
1143
1144 /* Capture message data (if valid) & compute return value (always) */
b97bf3fd
PL
1145 if (!err) {
1146 if (unlikely(buf_len < sz)) {
1147 sz = buf_len;
1148 m->msg_flags |= MSG_TRUNC;
1149 }
0232fd0a
AS
1150 res = skb_copy_datagram_iovec(buf, msg_hdr_sz(msg),
1151 m->msg_iov, sz);
1152 if (res)
b97bf3fd 1153 goto exit;
b97bf3fd
PL
1154 res = sz;
1155 } else {
1156 if ((sock->state == SS_READY) ||
1157 ((err == TIPC_CONN_SHUTDOWN) || m->msg_control))
1158 res = 0;
1159 else
1160 res = -ECONNRESET;
1161 }
1162
1163 /* Consume received message (optional) */
b97bf3fd 1164 if (likely(!(flags & MSG_PEEK))) {
99009806 1165 if ((sock->state != SS_READY) &&
60120526
JPM
1166 (++tsk->rcv_unacked >= TIPC_CONNACK_INTV)) {
1167 tipc_acknowledge(port->ref, tsk->rcv_unacked);
1168 tsk->rcv_unacked = 0;
1169 }
0c3141e9 1170 advance_rx_queue(sk);
c4307285 1171 }
b97bf3fd 1172exit:
0c3141e9 1173 release_sock(sk);
b97bf3fd
PL
1174 return res;
1175}
1176
c4307285 1177/**
247f0f3c 1178 * tipc_recv_stream - receive stream-oriented data
b97bf3fd
PL
1179 * @iocb: (unused)
1180 * @m: descriptor for message info
1181 * @buf_len: total size of user buffer area
1182 * @flags: receive flags
c4307285
YH
1183 *
1184 * Used for SOCK_STREAM messages only. If not enough data is available
b97bf3fd
PL
1185 * will optionally wait for more; never truncates data.
1186 *
1187 * Returns size of returned message data, errno otherwise
1188 */
247f0f3c
YX
1189static int tipc_recv_stream(struct kiocb *iocb, struct socket *sock,
1190 struct msghdr *m, size_t buf_len, int flags)
b97bf3fd 1191{
0c3141e9 1192 struct sock *sk = sock->sk;
58ed9442
JPM
1193 struct tipc_sock *tsk = tipc_sk(sk);
1194 struct tipc_port *port = &tsk->port;
b97bf3fd
PL
1195 struct sk_buff *buf;
1196 struct tipc_msg *msg;
9bbb4ecc 1197 long timeo;
b97bf3fd 1198 unsigned int sz;
3720d40b 1199 int sz_to_copy, target, needed;
b97bf3fd 1200 int sz_copied = 0;
b97bf3fd 1201 u32 err;
0c3141e9 1202 int res = 0;
b97bf3fd 1203
0c3141e9 1204 /* Catch invalid receive attempts */
b97bf3fd
PL
1205 if (unlikely(!buf_len))
1206 return -EINVAL;
1207
0c3141e9 1208 lock_sock(sk);
b97bf3fd 1209
9bbb4ecc 1210 if (unlikely(sock->state == SS_UNCONNECTED)) {
0c3141e9 1211 res = -ENOTCONN;
b97bf3fd
PL
1212 goto exit;
1213 }
1214
3720d40b 1215 target = sock_rcvlowat(sk, flags & MSG_WAITALL, buf_len);
9bbb4ecc 1216 timeo = sock_rcvtimeo(sk, flags & MSG_DONTWAIT);
b97bf3fd 1217
617d3c7a 1218restart:
0c3141e9 1219 /* Look for a message in receive queue; wait if necessary */
85d3fc94 1220 res = tipc_wait_for_rcvmsg(sock, &timeo);
9bbb4ecc
YX
1221 if (res)
1222 goto exit;
b97bf3fd 1223
0c3141e9 1224 /* Look at first message in receive queue */
0c3141e9 1225 buf = skb_peek(&sk->sk_receive_queue);
b97bf3fd
PL
1226 msg = buf_msg(buf);
1227 sz = msg_data_sz(msg);
1228 err = msg_errcode(msg);
1229
1230 /* Discard an empty non-errored message & try again */
b97bf3fd 1231 if ((!sz) && (!err)) {
0c3141e9 1232 advance_rx_queue(sk);
b97bf3fd
PL
1233 goto restart;
1234 }
1235
1236 /* Optionally capture sender's address & ancillary data of first msg */
b97bf3fd
PL
1237 if (sz_copied == 0) {
1238 set_orig_addr(m, msg);
58ed9442 1239 res = anc_data_recv(m, msg, port);
0c3141e9 1240 if (res)
b97bf3fd
PL
1241 goto exit;
1242 }
1243
1244 /* Capture message data (if valid) & compute return value (always) */
b97bf3fd 1245 if (!err) {
0232fd0a 1246 u32 offset = (u32)(unsigned long)(TIPC_SKB_CB(buf)->handle);
b97bf3fd 1247
0232fd0a 1248 sz -= offset;
b97bf3fd
PL
1249 needed = (buf_len - sz_copied);
1250 sz_to_copy = (sz <= needed) ? sz : needed;
0232fd0a
AS
1251
1252 res = skb_copy_datagram_iovec(buf, msg_hdr_sz(msg) + offset,
1253 m->msg_iov, sz_to_copy);
1254 if (res)
b97bf3fd 1255 goto exit;
0232fd0a 1256
b97bf3fd
PL
1257 sz_copied += sz_to_copy;
1258
1259 if (sz_to_copy < sz) {
1260 if (!(flags & MSG_PEEK))
0232fd0a
AS
1261 TIPC_SKB_CB(buf)->handle =
1262 (void *)(unsigned long)(offset + sz_to_copy);
b97bf3fd
PL
1263 goto exit;
1264 }
b97bf3fd
PL
1265 } else {
1266 if (sz_copied != 0)
1267 goto exit; /* can't add error msg to valid data */
1268
1269 if ((err == TIPC_CONN_SHUTDOWN) || m->msg_control)
1270 res = 0;
1271 else
1272 res = -ECONNRESET;
1273 }
1274
1275 /* Consume received message (optional) */
b97bf3fd 1276 if (likely(!(flags & MSG_PEEK))) {
60120526
JPM
1277 if (unlikely(++tsk->rcv_unacked >= TIPC_CONNACK_INTV)) {
1278 tipc_acknowledge(port->ref, tsk->rcv_unacked);
1279 tsk->rcv_unacked = 0;
1280 }
0c3141e9 1281 advance_rx_queue(sk);
c4307285 1282 }
b97bf3fd
PL
1283
1284 /* Loop around if more data is required */
f64f9e71
JP
1285 if ((sz_copied < buf_len) && /* didn't get all requested data */
1286 (!skb_queue_empty(&sk->sk_receive_queue) ||
3720d40b 1287 (sz_copied < target)) && /* and more is ready or required */
f64f9e71
JP
1288 (!(flags & MSG_PEEK)) && /* and aren't just peeking at data */
1289 (!err)) /* and haven't reached a FIN */
b97bf3fd
PL
1290 goto restart;
1291
1292exit:
0c3141e9 1293 release_sock(sk);
a3b0a5a9 1294 return sz_copied ? sz_copied : res;
b97bf3fd
PL
1295}
1296
f288bef4
YX
1297/**
1298 * tipc_write_space - wake up thread if port congestion is released
1299 * @sk: socket
1300 */
1301static void tipc_write_space(struct sock *sk)
1302{
1303 struct socket_wq *wq;
1304
1305 rcu_read_lock();
1306 wq = rcu_dereference(sk->sk_wq);
1307 if (wq_has_sleeper(wq))
1308 wake_up_interruptible_sync_poll(&wq->wait, POLLOUT |
1309 POLLWRNORM | POLLWRBAND);
1310 rcu_read_unlock();
1311}
1312
1313/**
1314 * tipc_data_ready - wake up threads to indicate messages have been received
1315 * @sk: socket
1316 * @len: the length of messages
1317 */
676d2369 1318static void tipc_data_ready(struct sock *sk)
f288bef4
YX
1319{
1320 struct socket_wq *wq;
1321
1322 rcu_read_lock();
1323 wq = rcu_dereference(sk->sk_wq);
1324 if (wq_has_sleeper(wq))
1325 wake_up_interruptible_sync_poll(&wq->wait, POLLIN |
1326 POLLRDNORM | POLLRDBAND);
1327 rcu_read_unlock();
1328}
1329
7e6c131e
YX
/**
 * filter_connect - Handle all incoming messages for a connection-based socket
 * @tsk: TIPC socket
 * @buf: pointer to the message buffer; set to NULL if the buffer is
 *       released here (empty 'ACK' received while connecting)
 *
 * Returns 0 (TIPC_OK) if everything ok, -TIPC_ERR_NO_PORT otherwise
 */
static int filter_connect(struct tipc_sock *tsk, struct sk_buff **buf)
{
	struct sock *sk = &tsk->sk;
	struct tipc_port *port = &tsk->port;
	struct socket *sock = sk->sk_socket;
	struct tipc_msg *msg = buf_msg(*buf);
	int rc = -TIPC_ERR_NO_PORT;
	int err;

	/* Multicast messages are never accepted here */
	if (msg_mcast(msg))
		return rc;

	switch ((int)sock->state) {
	case SS_CONNECTED:
		/* Accept only connection-based messages sent by peer */
		if (!msg_connected(msg) || !tipc_port_peer_msg(port, msg))
			break;

		/* An errored message from the peer ends the connection */
		if (unlikely(msg_errcode(msg))) {
			sock->state = SS_DISCONNECTING;
			__tipc_port_disconnect(port);
		}
		rc = TIPC_OK;
		break;

	case SS_CONNECTING:
		/* Accept only ACK or NACK message */
		if (unlikely(msg_errcode(msg))) {
			sock->state = SS_DISCONNECTING;
			sk->sk_err = ECONNREFUSED;
			rc = TIPC_OK;
			break;
		}

		if (unlikely(!msg_connected(msg)))
			break;

		err = auto_connect(tsk, msg);
		if (err) {
			sock->state = SS_DISCONNECTING;
			sk->sk_err = -err;
			rc = TIPC_OK;
			break;
		}

		/* If an incoming message is an 'ACK-', it should be
		 * discarded here because it doesn't contain useful
		 * data. In addition, we should try to wake up
		 * connect() routine if sleeping.
		 */
		if (msg_data_sz(msg) == 0) {
			kfree_skb(*buf);
			*buf = NULL;
			if (waitqueue_active(sk_sleep(sk)))
				wake_up_interruptible(sk_sleep(sk));
		}
		rc = TIPC_OK;
		break;

	case SS_LISTENING:
	case SS_UNCONNECTED:
		/* Accept only SYN message */
		if (!msg_connected(msg) && !(msg_errcode(msg)))
			rc = TIPC_OK;
		break;

	case SS_DISCONNECTING:
		break;

	default:
		pr_err("Unknown socket state %u\n", sock->state);
	}

	return rc;
}
1407
aba79f33
YX
1408/**
1409 * rcvbuf_limit - get proper overload limit of socket receive queue
1410 * @sk: socket
1411 * @buf: message
1412 *
1413 * For all connection oriented messages, irrespective of importance,
1414 * the default overload value (i.e. 67MB) is set as limit.
1415 *
1416 * For all connectionless messages, by default new queue limits are
1417 * as belows:
1418 *
cc79dd1b
YX
1419 * TIPC_LOW_IMPORTANCE (4 MB)
1420 * TIPC_MEDIUM_IMPORTANCE (8 MB)
1421 * TIPC_HIGH_IMPORTANCE (16 MB)
1422 * TIPC_CRITICAL_IMPORTANCE (32 MB)
aba79f33
YX
1423 *
1424 * Returns overload limit according to corresponding message importance
1425 */
1426static unsigned int rcvbuf_limit(struct sock *sk, struct sk_buff *buf)
1427{
1428 struct tipc_msg *msg = buf_msg(buf);
aba79f33
YX
1429
1430 if (msg_connected(msg))
0cee6bbe 1431 return sysctl_tipc_rmem[2];
1432
1433 return sk->sk_rcvbuf >> TIPC_CRITICAL_IMPORTANCE <<
1434 msg_importance(msg);
aba79f33
YX
1435}
1436
c4307285 1437/**
0c3141e9
AS
1438 * filter_rcv - validate incoming message
1439 * @sk: socket
b97bf3fd 1440 * @buf: message
c4307285 1441 *
0c3141e9
AS
1442 * Enqueues message on receive queue if acceptable; optionally handles
1443 * disconnect indication for a connected socket.
1444 *
1445 * Called with socket lock already taken; port lock may also be taken.
c4307285 1446 *
e4de5fab 1447 * Returns 0 (TIPC_OK) if message was consumed, -TIPC error code if message
ac0074ee 1448 * to be rejected, 1 (TIPC_FWD_MSG) if (CONN_MANAGER) message to be forwarded
b97bf3fd 1449 */
e4de5fab 1450static int filter_rcv(struct sock *sk, struct sk_buff *buf)
b97bf3fd 1451{
0c3141e9 1452 struct socket *sock = sk->sk_socket;
58ed9442 1453 struct tipc_sock *tsk = tipc_sk(sk);
b97bf3fd 1454 struct tipc_msg *msg = buf_msg(buf);
aba79f33 1455 unsigned int limit = rcvbuf_limit(sk, buf);
ac0074ee 1456 u32 onode;
e4de5fab 1457 int rc = TIPC_OK;
b97bf3fd 1458
ac0074ee
JPM
1459 if (unlikely(msg_user(msg) == CONN_MANAGER))
1460 return tipc_sk_proto_rcv(tsk, &onode, buf);
ec8a2e56 1461
b97bf3fd 1462 /* Reject message if it is wrong sort of message for socket */
aad58547 1463 if (msg_type(msg) > TIPC_DIRECT_MSG)
e4de5fab 1464 return -TIPC_ERR_NO_PORT;
0c3141e9 1465
b97bf3fd 1466 if (sock->state == SS_READY) {
b29f1428 1467 if (msg_connected(msg))
e4de5fab 1468 return -TIPC_ERR_NO_PORT;
b97bf3fd 1469 } else {
e4de5fab
JPM
1470 rc = filter_connect(tsk, &buf);
1471 if (rc != TIPC_OK || buf == NULL)
1472 return rc;
b97bf3fd
PL
1473 }
1474
1475 /* Reject message if there isn't room to queue it */
aba79f33 1476 if (sk_rmem_alloc_get(sk) + buf->truesize >= limit)
e4de5fab 1477 return -TIPC_ERR_OVERLOAD;
b97bf3fd 1478
aba79f33 1479 /* Enqueue message */
40682432 1480 TIPC_SKB_CB(buf)->handle = NULL;
0c3141e9 1481 __skb_queue_tail(&sk->sk_receive_queue, buf);
aba79f33 1482 skb_set_owner_r(buf, sk);
0c3141e9 1483
676d2369 1484 sk->sk_data_ready(sk);
0c3141e9
AS
1485 return TIPC_OK;
1486}
b97bf3fd 1487
0c3141e9 1488/**
4f4482dc 1489 * tipc_backlog_rcv - handle incoming message from backlog queue
0c3141e9
AS
1490 * @sk: socket
1491 * @buf: message
1492 *
1493 * Caller must hold socket lock, but not port lock.
1494 *
1495 * Returns 0
1496 */
4f4482dc 1497static int tipc_backlog_rcv(struct sock *sk, struct sk_buff *buf)
0c3141e9 1498{
e4de5fab 1499 int rc;
8db1bae3 1500 u32 onode;
4f4482dc 1501 struct tipc_sock *tsk = tipc_sk(sk);
02c00c2a 1502 uint truesize = buf->truesize;
0c3141e9 1503
e4de5fab 1504 rc = filter_rcv(sk, buf);
4f4482dc 1505
ac0074ee
JPM
1506 if (likely(!rc)) {
1507 if (atomic_read(&tsk->dupl_rcvcnt) < TIPC_CONN_OVERLOAD_LIMIT)
1508 atomic_add(truesize, &tsk->dupl_rcvcnt);
1509 return 0;
1510 }
1511
1512 if ((rc < 0) && !tipc_msg_reverse(buf, &onode, -rc))
1513 return 0;
1514
1515 tipc_link_xmit2(buf, onode, 0);
4f4482dc 1516
0c3141e9
AS
1517 return 0;
1518}
1519
1520/**
24be34b5 1521 * tipc_sk_rcv - handle incoming message
9816f061
JPM
1522 * @buf: buffer containing arriving message
1523 * Consumes buffer
1524 * Returns 0 if success, or errno: -EHOSTUNREACH
0c3141e9 1525 */
9816f061 1526int tipc_sk_rcv(struct sk_buff *buf)
0c3141e9 1527{
9816f061
JPM
1528 struct tipc_sock *tsk;
1529 struct tipc_port *port;
1530 struct sock *sk;
1531 u32 dport = msg_destport(buf_msg(buf));
e4de5fab 1532 int rc = TIPC_OK;
4f4482dc 1533 uint limit;
8db1bae3 1534 u32 dnode;
9816f061 1535
5a379074 1536 /* Validate destination and message */
9816f061
JPM
1537 port = tipc_port_lock(dport);
1538 if (unlikely(!port)) {
5a379074 1539 rc = tipc_msg_eval(buf, &dnode);
9816f061
JPM
1540 goto exit;
1541 }
1542
1543 tsk = tipc_port_to_sock(port);
1544 sk = &tsk->sk;
1545
1546 /* Queue message */
0c3141e9 1547 bh_lock_sock(sk);
9816f061 1548
0c3141e9 1549 if (!sock_owned_by_user(sk)) {
e4de5fab 1550 rc = filter_rcv(sk, buf);
0c3141e9 1551 } else {
4f4482dc
JPM
1552 if (sk->sk_backlog.len == 0)
1553 atomic_set(&tsk->dupl_rcvcnt, 0);
1554 limit = rcvbuf_limit(sk, buf) + atomic_read(&tsk->dupl_rcvcnt);
1555 if (sk_add_backlog(sk, buf, limit))
e4de5fab 1556 rc = -TIPC_ERR_OVERLOAD;
0c3141e9
AS
1557 }
1558 bh_unlock_sock(sk);
9816f061 1559 tipc_port_unlock(port);
0c3141e9 1560
e4de5fab 1561 if (likely(!rc))
9816f061
JPM
1562 return 0;
1563exit:
5a379074 1564 if ((rc < 0) && !tipc_msg_reverse(buf, &dnode, -rc))
8db1bae3 1565 return -EHOSTUNREACH;
5a379074 1566
8db1bae3 1567 tipc_link_xmit2(buf, dnode, 0);
5a379074 1568 return (rc < 0) ? -EHOSTUNREACH : 0;
b97bf3fd
PL
1569}
1570
78eb3a53
YX
1571static int tipc_wait_for_connect(struct socket *sock, long *timeo_p)
1572{
1573 struct sock *sk = sock->sk;
1574 DEFINE_WAIT(wait);
1575 int done;
1576
1577 do {
1578 int err = sock_error(sk);
1579 if (err)
1580 return err;
1581 if (!*timeo_p)
1582 return -ETIMEDOUT;
1583 if (signal_pending(current))
1584 return sock_intr_errno(*timeo_p);
1585
1586 prepare_to_wait(sk_sleep(sk), &wait, TASK_INTERRUPTIBLE);
1587 done = sk_wait_event(sk, timeo_p, sock->state != SS_CONNECTING);
1588 finish_wait(sk_sleep(sk), &wait);
1589 } while (!done);
1590 return 0;
1591}
1592
b97bf3fd 1593/**
247f0f3c 1594 * tipc_connect - establish a connection to another TIPC port
b97bf3fd
PL
1595 * @sock: socket structure
1596 * @dest: socket address for destination port
1597 * @destlen: size of socket address data structure
0c3141e9 1598 * @flags: file-related flags associated with socket
b97bf3fd
PL
1599 *
1600 * Returns 0 on success, errno otherwise
1601 */
247f0f3c
YX
1602static int tipc_connect(struct socket *sock, struct sockaddr *dest,
1603 int destlen, int flags)
b97bf3fd 1604{
0c3141e9 1605 struct sock *sk = sock->sk;
b89741a0
AS
1606 struct sockaddr_tipc *dst = (struct sockaddr_tipc *)dest;
1607 struct msghdr m = {NULL,};
78eb3a53
YX
1608 long timeout = (flags & O_NONBLOCK) ? 0 : tipc_sk(sk)->conn_timeout;
1609 socket_state previous;
b89741a0
AS
1610 int res;
1611
0c3141e9
AS
1612 lock_sock(sk);
1613
b89741a0 1614 /* For now, TIPC does not allow use of connect() with DGRAM/RDM types */
0c3141e9
AS
1615 if (sock->state == SS_READY) {
1616 res = -EOPNOTSUPP;
1617 goto exit;
1618 }
b89741a0 1619
b89741a0
AS
1620 /*
1621 * Reject connection attempt using multicast address
1622 *
1623 * Note: send_msg() validates the rest of the address fields,
1624 * so there's no need to do it here
1625 */
0c3141e9
AS
1626 if (dst->addrtype == TIPC_ADDR_MCAST) {
1627 res = -EINVAL;
1628 goto exit;
1629 }
1630
78eb3a53 1631 previous = sock->state;
584d24b3
YX
1632 switch (sock->state) {
1633 case SS_UNCONNECTED:
1634 /* Send a 'SYN-' to destination */
1635 m.msg_name = dest;
1636 m.msg_namelen = destlen;
1637
1638 /* If connect is in non-blocking case, set MSG_DONTWAIT to
1639 * indicate send_msg() is never blocked.
1640 */
1641 if (!timeout)
1642 m.msg_flags = MSG_DONTWAIT;
1643
247f0f3c 1644 res = tipc_sendmsg(NULL, sock, &m, 0);
584d24b3
YX
1645 if ((res < 0) && (res != -EWOULDBLOCK))
1646 goto exit;
1647
1648 /* Just entered SS_CONNECTING state; the only
1649 * difference is that return value in non-blocking
1650 * case is EINPROGRESS, rather than EALREADY.
1651 */
1652 res = -EINPROGRESS;
584d24b3 1653 case SS_CONNECTING:
78eb3a53
YX
1654 if (previous == SS_CONNECTING)
1655 res = -EALREADY;
1656 if (!timeout)
1657 goto exit;
1658 timeout = msecs_to_jiffies(timeout);
1659 /* Wait until an 'ACK' or 'RST' arrives, or a timeout occurs */
1660 res = tipc_wait_for_connect(sock, &timeout);
584d24b3
YX
1661 break;
1662 case SS_CONNECTED:
1663 res = -EISCONN;
1664 break;
1665 default:
1666 res = -EINVAL;
78eb3a53 1667 break;
b89741a0 1668 }
0c3141e9
AS
1669exit:
1670 release_sock(sk);
b89741a0 1671 return res;
b97bf3fd
PL
1672}
1673
c4307285 1674/**
247f0f3c 1675 * tipc_listen - allow socket to listen for incoming connections
b97bf3fd
PL
1676 * @sock: socket structure
1677 * @len: (unused)
c4307285 1678 *
b97bf3fd
PL
1679 * Returns 0 on success, errno otherwise
1680 */
247f0f3c 1681static int tipc_listen(struct socket *sock, int len)
b97bf3fd 1682{
0c3141e9
AS
1683 struct sock *sk = sock->sk;
1684 int res;
1685
1686 lock_sock(sk);
b97bf3fd 1687
245f3d34 1688 if (sock->state != SS_UNCONNECTED)
0c3141e9
AS
1689 res = -EINVAL;
1690 else {
1691 sock->state = SS_LISTENING;
1692 res = 0;
1693 }
1694
1695 release_sock(sk);
1696 return res;
b97bf3fd
PL
1697}
1698
6398e23c
YX
1699static int tipc_wait_for_accept(struct socket *sock, long timeo)
1700{
1701 struct sock *sk = sock->sk;
1702 DEFINE_WAIT(wait);
1703 int err;
1704
1705 /* True wake-one mechanism for incoming connections: only
1706 * one process gets woken up, not the 'whole herd'.
1707 * Since we do not 'race & poll' for established sockets
1708 * anymore, the common case will execute the loop only once.
1709 */
1710 for (;;) {
1711 prepare_to_wait_exclusive(sk_sleep(sk), &wait,
1712 TASK_INTERRUPTIBLE);
fe8e4649 1713 if (timeo && skb_queue_empty(&sk->sk_receive_queue)) {
6398e23c
YX
1714 release_sock(sk);
1715 timeo = schedule_timeout(timeo);
1716 lock_sock(sk);
1717 }
1718 err = 0;
1719 if (!skb_queue_empty(&sk->sk_receive_queue))
1720 break;
1721 err = -EINVAL;
1722 if (sock->state != SS_LISTENING)
1723 break;
1724 err = sock_intr_errno(timeo);
1725 if (signal_pending(current))
1726 break;
1727 err = -EAGAIN;
1728 if (!timeo)
1729 break;
1730 }
1731 finish_wait(sk_sleep(sk), &wait);
1732 return err;
1733}
1734
c4307285 1735/**
247f0f3c 1736 * tipc_accept - wait for connection request
b97bf3fd
PL
1737 * @sock: listening socket
1738 * @newsock: new socket that is to be connected
1739 * @flags: file-related flags associated with socket
c4307285 1740 *
b97bf3fd
PL
1741 * Returns 0 on success, errno otherwise
1742 */
247f0f3c 1743static int tipc_accept(struct socket *sock, struct socket *new_sock, int flags)
b97bf3fd 1744{
0fef8f20 1745 struct sock *new_sk, *sk = sock->sk;
b97bf3fd 1746 struct sk_buff *buf;
8826cde6 1747 struct tipc_port *new_port;
0fef8f20 1748 struct tipc_msg *msg;
f9fef18c 1749 struct tipc_portid peer;
0fef8f20 1750 u32 new_ref;
6398e23c 1751 long timeo;
0c3141e9 1752 int res;
b97bf3fd 1753
0c3141e9 1754 lock_sock(sk);
b97bf3fd 1755
0c3141e9
AS
1756 if (sock->state != SS_LISTENING) {
1757 res = -EINVAL;
b97bf3fd
PL
1758 goto exit;
1759 }
6398e23c
YX
1760 timeo = sock_rcvtimeo(sk, flags & O_NONBLOCK);
1761 res = tipc_wait_for_accept(sock, timeo);
1762 if (res)
1763 goto exit;
0c3141e9
AS
1764
1765 buf = skb_peek(&sk->sk_receive_queue);
1766
c5fa7b3c 1767 res = tipc_sk_create(sock_net(sock->sk), new_sock, 0, 1);
0fef8f20
PG
1768 if (res)
1769 goto exit;
b97bf3fd 1770
0fef8f20 1771 new_sk = new_sock->sk;
58ed9442 1772 new_port = &tipc_sk(new_sk)->port;
8826cde6 1773 new_ref = new_port->ref;
0fef8f20 1774 msg = buf_msg(buf);
b97bf3fd 1775
0fef8f20
PG
1776 /* we lock on new_sk; but lockdep sees the lock on sk */
1777 lock_sock_nested(new_sk, SINGLE_DEPTH_NESTING);
1778
1779 /*
1780 * Reject any stray messages received by new socket
1781 * before the socket lock was taken (very, very unlikely)
1782 */
1783 reject_rx_queue(new_sk);
1784
1785 /* Connect new socket to it's peer */
f9fef18c
JPM
1786 peer.ref = msg_origport(msg);
1787 peer.node = msg_orignode(msg);
1788 tipc_port_connect(new_ref, &peer);
0fef8f20
PG
1789 new_sock->state = SS_CONNECTED;
1790
3b4f302d 1791 tipc_port_set_importance(new_port, msg_importance(msg));
0fef8f20 1792 if (msg_named(msg)) {
8826cde6
JPM
1793 new_port->conn_type = msg_nametype(msg);
1794 new_port->conn_instance = msg_nameinst(msg);
b97bf3fd 1795 }
0fef8f20
PG
1796
1797 /*
1798 * Respond to 'SYN-' by discarding it & returning 'ACK'-.
1799 * Respond to 'SYN+' by queuing it on new socket.
1800 */
1801 if (!msg_data_sz(msg)) {
1802 struct msghdr m = {NULL,};
1803
1804 advance_rx_queue(sk);
247f0f3c 1805 tipc_send_packet(NULL, new_sock, &m, 0);
0fef8f20
PG
1806 } else {
1807 __skb_dequeue(&sk->sk_receive_queue);
1808 __skb_queue_head(&new_sk->sk_receive_queue, buf);
aba79f33 1809 skb_set_owner_r(buf, new_sk);
0fef8f20
PG
1810 }
1811 release_sock(new_sk);
b97bf3fd 1812exit:
0c3141e9 1813 release_sock(sk);
b97bf3fd
PL
1814 return res;
1815}
1816
1817/**
247f0f3c 1818 * tipc_shutdown - shutdown socket connection
b97bf3fd 1819 * @sock: socket structure
e247a8f5 1820 * @how: direction to close (must be SHUT_RDWR)
b97bf3fd
PL
1821 *
1822 * Terminates connection (if necessary), then purges socket's receive queue.
c4307285 1823 *
b97bf3fd
PL
1824 * Returns 0 on success, errno otherwise
1825 */
247f0f3c 1826static int tipc_shutdown(struct socket *sock, int how)
b97bf3fd 1827{
0c3141e9 1828 struct sock *sk = sock->sk;
58ed9442
JPM
1829 struct tipc_sock *tsk = tipc_sk(sk);
1830 struct tipc_port *port = &tsk->port;
b97bf3fd 1831 struct sk_buff *buf;
8db1bae3 1832 u32 peer;
b97bf3fd
PL
1833 int res;
1834
e247a8f5
AS
1835 if (how != SHUT_RDWR)
1836 return -EINVAL;
b97bf3fd 1837
0c3141e9 1838 lock_sock(sk);
b97bf3fd
PL
1839
1840 switch (sock->state) {
0c3141e9 1841 case SS_CONNECTING:
b97bf3fd
PL
1842 case SS_CONNECTED:
1843
b97bf3fd 1844restart:
617d3c7a 1845 /* Disconnect and send a 'FIN+' or 'FIN-' message to peer */
0c3141e9
AS
1846 buf = __skb_dequeue(&sk->sk_receive_queue);
1847 if (buf) {
40682432 1848 if (TIPC_SKB_CB(buf)->handle != NULL) {
5f6d9123 1849 kfree_skb(buf);
b97bf3fd
PL
1850 goto restart;
1851 }
58ed9442 1852 tipc_port_disconnect(port->ref);
8db1bae3
JPM
1853 if (tipc_msg_reverse(buf, &peer, TIPC_CONN_SHUTDOWN))
1854 tipc_link_xmit2(buf, peer, 0);
0c3141e9 1855 } else {
58ed9442 1856 tipc_port_shutdown(port->ref);
b97bf3fd 1857 }
0c3141e9
AS
1858
1859 sock->state = SS_DISCONNECTING;
b97bf3fd
PL
1860
1861 /* fall through */
1862
1863 case SS_DISCONNECTING:
1864
75031151 1865 /* Discard any unreceived messages */
57467e56 1866 __skb_queue_purge(&sk->sk_receive_queue);
75031151
YX
1867
1868 /* Wake up anyone sleeping in poll */
1869 sk->sk_state_change(sk);
b97bf3fd
PL
1870 res = 0;
1871 break;
1872
1873 default:
1874 res = -ENOTCONN;
1875 }
1876
0c3141e9 1877 release_sock(sk);
b97bf3fd
PL
1878 return res;
1879}
1880
1881/**
247f0f3c 1882 * tipc_setsockopt - set socket option
b97bf3fd
PL
1883 * @sock: socket structure
1884 * @lvl: option level
1885 * @opt: option identifier
1886 * @ov: pointer to new option value
1887 * @ol: length of option value
c4307285
YH
1888 *
1889 * For stream sockets only, accepts and ignores all IPPROTO_TCP options
b97bf3fd 1890 * (to ease compatibility).
c4307285 1891 *
b97bf3fd
PL
1892 * Returns 0 on success, errno otherwise
1893 */
247f0f3c
YX
1894static int tipc_setsockopt(struct socket *sock, int lvl, int opt,
1895 char __user *ov, unsigned int ol)
b97bf3fd 1896{
0c3141e9 1897 struct sock *sk = sock->sk;
58ed9442
JPM
1898 struct tipc_sock *tsk = tipc_sk(sk);
1899 struct tipc_port *port = &tsk->port;
b97bf3fd
PL
1900 u32 value;
1901 int res;
1902
c4307285
YH
1903 if ((lvl == IPPROTO_TCP) && (sock->type == SOCK_STREAM))
1904 return 0;
b97bf3fd
PL
1905 if (lvl != SOL_TIPC)
1906 return -ENOPROTOOPT;
1907 if (ol < sizeof(value))
1908 return -EINVAL;
2db9983a
AS
1909 res = get_user(value, (u32 __user *)ov);
1910 if (res)
b97bf3fd
PL
1911 return res;
1912
0c3141e9 1913 lock_sock(sk);
c4307285 1914
b97bf3fd
PL
1915 switch (opt) {
1916 case TIPC_IMPORTANCE:
58ed9442 1917 tipc_port_set_importance(port, value);
b97bf3fd
PL
1918 break;
1919 case TIPC_SRC_DROPPABLE:
1920 if (sock->type != SOCK_STREAM)
58ed9442 1921 tipc_port_set_unreliable(port, value);
c4307285 1922 else
b97bf3fd
PL
1923 res = -ENOPROTOOPT;
1924 break;
1925 case TIPC_DEST_DROPPABLE:
58ed9442 1926 tipc_port_set_unreturnable(port, value);
b97bf3fd
PL
1927 break;
1928 case TIPC_CONN_TIMEOUT:
a0f40f02 1929 tipc_sk(sk)->conn_timeout = value;
0c3141e9 1930 /* no need to set "res", since already 0 at this point */
b97bf3fd
PL
1931 break;
1932 default:
1933 res = -EINVAL;
1934 }
1935
0c3141e9
AS
1936 release_sock(sk);
1937
b97bf3fd
PL
1938 return res;
1939}
1940
1941/**
247f0f3c 1942 * tipc_getsockopt - get socket option
b97bf3fd
PL
1943 * @sock: socket structure
1944 * @lvl: option level
1945 * @opt: option identifier
1946 * @ov: receptacle for option value
1947 * @ol: receptacle for length of option value
c4307285
YH
1948 *
1949 * For stream sockets only, returns 0 length result for all IPPROTO_TCP options
b97bf3fd 1950 * (to ease compatibility).
c4307285 1951 *
b97bf3fd
PL
1952 * Returns 0 on success, errno otherwise
1953 */
247f0f3c
YX
1954static int tipc_getsockopt(struct socket *sock, int lvl, int opt,
1955 char __user *ov, int __user *ol)
b97bf3fd 1956{
0c3141e9 1957 struct sock *sk = sock->sk;
58ed9442
JPM
1958 struct tipc_sock *tsk = tipc_sk(sk);
1959 struct tipc_port *port = &tsk->port;
c4307285 1960 int len;
b97bf3fd 1961 u32 value;
c4307285 1962 int res;
b97bf3fd 1963
c4307285
YH
1964 if ((lvl == IPPROTO_TCP) && (sock->type == SOCK_STREAM))
1965 return put_user(0, ol);
b97bf3fd
PL
1966 if (lvl != SOL_TIPC)
1967 return -ENOPROTOOPT;
2db9983a
AS
1968 res = get_user(len, ol);
1969 if (res)
c4307285 1970 return res;
b97bf3fd 1971
0c3141e9 1972 lock_sock(sk);
b97bf3fd
PL
1973
1974 switch (opt) {
1975 case TIPC_IMPORTANCE:
58ed9442 1976 value = tipc_port_importance(port);
b97bf3fd
PL
1977 break;
1978 case TIPC_SRC_DROPPABLE:
58ed9442 1979 value = tipc_port_unreliable(port);
b97bf3fd
PL
1980 break;
1981 case TIPC_DEST_DROPPABLE:
58ed9442 1982 value = tipc_port_unreturnable(port);
b97bf3fd
PL
1983 break;
1984 case TIPC_CONN_TIMEOUT:
a0f40f02 1985 value = tipc_sk(sk)->conn_timeout;
0c3141e9 1986 /* no need to set "res", since already 0 at this point */
b97bf3fd 1987 break;
0e65967e 1988 case TIPC_NODE_RECVQ_DEPTH:
9da3d475 1989 value = 0; /* was tipc_queue_size, now obsolete */
6650613d 1990 break;
0e65967e 1991 case TIPC_SOCK_RECVQ_DEPTH:
6650613d 1992 value = skb_queue_len(&sk->sk_receive_queue);
1993 break;
b97bf3fd
PL
1994 default:
1995 res = -EINVAL;
1996 }
1997
0c3141e9
AS
1998 release_sock(sk);
1999
25860c3b
PG
2000 if (res)
2001 return res; /* "get" failed */
b97bf3fd 2002
25860c3b
PG
2003 if (len < sizeof(value))
2004 return -EINVAL;
2005
2006 if (copy_to_user(ov, &value, sizeof(value)))
2007 return -EFAULT;
2008
2009 return put_user(sizeof(value), ol);
b97bf3fd
PL
2010}
2011
78acb1f9
EH
2012int tipc_ioctl(struct socket *sk, unsigned int cmd, unsigned long arg)
2013{
2014 struct tipc_sioc_ln_req lnr;
2015 void __user *argp = (void __user *)arg;
2016
2017 switch (cmd) {
2018 case SIOCGETLINKNAME:
2019 if (copy_from_user(&lnr, argp, sizeof(lnr)))
2020 return -EFAULT;
2021 if (!tipc_node_get_linkname(lnr.bearer_id, lnr.peer,
2022 lnr.linkname, TIPC_MAX_LINK_NAME)) {
2023 if (copy_to_user(argp, &lnr, sizeof(lnr)))
2024 return -EFAULT;
2025 return 0;
2026 }
2027 return -EADDRNOTAVAIL;
2028 break;
2029 default:
2030 return -ENOIOCTLCMD;
2031 }
2032}
2033
ae86b9e3
BH
2034/* Protocol switches for the various types of TIPC sockets */
2035
bca65eae 2036static const struct proto_ops msg_ops = {
0e65967e 2037 .owner = THIS_MODULE,
b97bf3fd 2038 .family = AF_TIPC,
247f0f3c
YX
2039 .release = tipc_release,
2040 .bind = tipc_bind,
2041 .connect = tipc_connect,
5eee6a6d 2042 .socketpair = sock_no_socketpair,
245f3d34 2043 .accept = sock_no_accept,
247f0f3c
YX
2044 .getname = tipc_getname,
2045 .poll = tipc_poll,
78acb1f9 2046 .ioctl = tipc_ioctl,
245f3d34 2047 .listen = sock_no_listen,
247f0f3c
YX
2048 .shutdown = tipc_shutdown,
2049 .setsockopt = tipc_setsockopt,
2050 .getsockopt = tipc_getsockopt,
2051 .sendmsg = tipc_sendmsg,
2052 .recvmsg = tipc_recvmsg,
8238745a
YH
2053 .mmap = sock_no_mmap,
2054 .sendpage = sock_no_sendpage
b97bf3fd
PL
2055};
2056
bca65eae 2057static const struct proto_ops packet_ops = {
0e65967e 2058 .owner = THIS_MODULE,
b97bf3fd 2059 .family = AF_TIPC,
247f0f3c
YX
2060 .release = tipc_release,
2061 .bind = tipc_bind,
2062 .connect = tipc_connect,
5eee6a6d 2063 .socketpair = sock_no_socketpair,
247f0f3c
YX
2064 .accept = tipc_accept,
2065 .getname = tipc_getname,
2066 .poll = tipc_poll,
78acb1f9 2067 .ioctl = tipc_ioctl,
247f0f3c
YX
2068 .listen = tipc_listen,
2069 .shutdown = tipc_shutdown,
2070 .setsockopt = tipc_setsockopt,
2071 .getsockopt = tipc_getsockopt,
2072 .sendmsg = tipc_send_packet,
2073 .recvmsg = tipc_recvmsg,
8238745a
YH
2074 .mmap = sock_no_mmap,
2075 .sendpage = sock_no_sendpage
b97bf3fd
PL
2076};
2077
bca65eae 2078static const struct proto_ops stream_ops = {
0e65967e 2079 .owner = THIS_MODULE,
b97bf3fd 2080 .family = AF_TIPC,
247f0f3c
YX
2081 .release = tipc_release,
2082 .bind = tipc_bind,
2083 .connect = tipc_connect,
5eee6a6d 2084 .socketpair = sock_no_socketpair,
247f0f3c
YX
2085 .accept = tipc_accept,
2086 .getname = tipc_getname,
2087 .poll = tipc_poll,
78acb1f9 2088 .ioctl = tipc_ioctl,
247f0f3c
YX
2089 .listen = tipc_listen,
2090 .shutdown = tipc_shutdown,
2091 .setsockopt = tipc_setsockopt,
2092 .getsockopt = tipc_getsockopt,
2093 .sendmsg = tipc_send_stream,
2094 .recvmsg = tipc_recv_stream,
8238745a
YH
2095 .mmap = sock_no_mmap,
2096 .sendpage = sock_no_sendpage
b97bf3fd
PL
2097};
2098
bca65eae 2099static const struct net_proto_family tipc_family_ops = {
0e65967e 2100 .owner = THIS_MODULE,
b97bf3fd 2101 .family = AF_TIPC,
c5fa7b3c 2102 .create = tipc_sk_create
b97bf3fd
PL
2103};
2104
2105static struct proto tipc_proto = {
2106 .name = "TIPC",
2107 .owner = THIS_MODULE,
cc79dd1b
YX
2108 .obj_size = sizeof(struct tipc_sock),
2109 .sysctl_rmem = sysctl_tipc_rmem
b97bf3fd
PL
2110};
2111
c5fa7b3c
YX
2112static struct proto tipc_proto_kern = {
2113 .name = "TIPC",
2114 .obj_size = sizeof(struct tipc_sock),
2115 .sysctl_rmem = sysctl_tipc_rmem
2116};
2117
b97bf3fd 2118/**
4323add6 2119 * tipc_socket_init - initialize TIPC socket interface
c4307285 2120 *
b97bf3fd
PL
2121 * Returns 0 on success, errno otherwise
2122 */
4323add6 2123int tipc_socket_init(void)
b97bf3fd
PL
2124{
2125 int res;
2126
c4307285 2127 res = proto_register(&tipc_proto, 1);
b97bf3fd 2128 if (res) {
2cf8aa19 2129 pr_err("Failed to register TIPC protocol type\n");
b97bf3fd
PL
2130 goto out;
2131 }
2132
2133 res = sock_register(&tipc_family_ops);
2134 if (res) {
2cf8aa19 2135 pr_err("Failed to register TIPC socket type\n");
b97bf3fd
PL
2136 proto_unregister(&tipc_proto);
2137 goto out;
2138 }
b97bf3fd
PL
2139 out:
2140 return res;
2141}
2142
2143/**
4323add6 2144 * tipc_socket_stop - stop TIPC socket interface
b97bf3fd 2145 */
4323add6 2146void tipc_socket_stop(void)
b97bf3fd 2147{
b97bf3fd
PL
2148 sock_unregister(tipc_family_ops.family);
2149 proto_unregister(&tipc_proto);
2150}
This page took 0.840786 seconds and 5 git commands to generate.