net/ipv6/tcp_ipv6.c
1 /*
2 * TCP over IPv6
3 * Linux INET6 implementation
4 *
5 * Authors:
6 * Pedro Roque <roque@di.fc.ul.pt>
7 *
8 * Based on:
9 * linux/net/ipv4/tcp.c
10 * linux/net/ipv4/tcp_input.c
11 * linux/net/ipv4/tcp_output.c
12 *
13 * Fixes:
14 * Hideaki YOSHIFUJI : sin6_scope_id support
15 * YOSHIFUJI Hideaki @USAGI and: Support IPV6_V6ONLY socket option, which
16 * Alexey Kuznetsov allows both IPv4 and IPv6 sockets to bind
17 * a single port at the same time.
18 * YOSHIFUJI Hideaki @USAGI: convert /proc/net/tcp6 to seq_file.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 */
25
26 #include <linux/module.h>
27 #include <linux/errno.h>
28 #include <linux/types.h>
29 #include <linux/socket.h>
30 #include <linux/sockios.h>
31 #include <linux/net.h>
32 #include <linux/jiffies.h>
33 #include <linux/in.h>
34 #include <linux/in6.h>
35 #include <linux/netdevice.h>
36 #include <linux/init.h>
37 #include <linux/jhash.h>
38 #include <linux/ipsec.h>
39 #include <linux/times.h>
40
41 #include <linux/ipv6.h>
42 #include <linux/icmpv6.h>
43 #include <linux/random.h>
44
45 #include <net/tcp.h>
46 #include <net/ndisc.h>
47 #include <net/inet6_hashtables.h>
48 #include <net/inet6_connection_sock.h>
49 #include <net/ipv6.h>
50 #include <net/transp_v6.h>
51 #include <net/addrconf.h>
52 #include <net/ip6_route.h>
53 #include <net/ip6_checksum.h>
54 #include <net/inet_ecn.h>
55 #include <net/protocol.h>
56 #include <net/xfrm.h>
57 #include <net/snmp.h>
58 #include <net/dsfield.h>
59 #include <net/timewait_sock.h>
60 #include <net/netdma.h>
61 #include <net/inet_common.h>
62
63 #include <asm/uaccess.h>
64
65 #include <linux/proc_fs.h>
66 #include <linux/seq_file.h>
67
68 #include <linux/crypto.h>
69 #include <linux/scatterlist.h>
70
71 static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
72 static void tcp_v6_reqsk_send_ack(struct sk_buff *skb, struct request_sock *req);
73 static void tcp_v6_send_check(struct sock *sk, int len,
74 struct sk_buff *skb);
75
76 static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
77
78 static struct inet_connection_sock_af_ops ipv6_mapped;
79 static struct inet_connection_sock_af_ops ipv6_specific;
80 #ifdef CONFIG_TCP_MD5SIG
81 static struct tcp_sock_af_ops tcp_sock_ipv6_specific;
82 static struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
83 #else
84 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
85 struct in6_addr *addr)
86 {
87 return NULL;
88 }
89 #endif
90
91 static void tcp_v6_hash(struct sock *sk)
92 {
93 if (sk->sk_state != TCP_CLOSE) {
94 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
95 tcp_prot.hash(sk);
96 return;
97 }
98 local_bh_disable();
99 __inet6_hash(sk);
100 local_bh_enable();
101 }
102 }
103
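/* Fold the IPv6 pseudo-header (source/destination address, payload length,
 * IPPROTO_TCP) into the partial checksum 'base', as RFC 2460 requires for
 * upper-layer checksums. */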
104 static __inline__ __sum16 tcp_v6_check(struct tcphdr *th, int len,
105 struct in6_addr *saddr,
106 struct in6_addr *daddr,
107 __wsum base)
108 {
109 return csum_ipv6_magic(saddr, daddr, len, IPPROTO_TCP, base);
110 }
111
112 static __u32 tcp_v6_init_sequence(struct sk_buff *skb)
113 {
114 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
115 ipv6_hdr(skb)->saddr.s6_addr32,
116 tcp_hdr(skb)->dest,
117 tcp_hdr(skb)->source);
118 }
119
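/* Active open. Resolves the route, picks a source address and an initial
 * sequence number, then sends the SYN via tcp_connect(). A v4-mapped
 * destination is handed to tcp_v4_connect() with icsk_af_ops switched to
 * ipv6_mapped. */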
120 static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
121 int addr_len)
122 {
123 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
124 struct inet_sock *inet = inet_sk(sk);
125 struct inet_connection_sock *icsk = inet_csk(sk);
126 struct ipv6_pinfo *np = inet6_sk(sk);
127 struct tcp_sock *tp = tcp_sk(sk);
128 struct in6_addr *saddr = NULL, *final_p = NULL, final;
129 struct flowi fl;
130 struct dst_entry *dst;
131 int addr_type;
132 int err;
133
134 if (addr_len < SIN6_LEN_RFC2133)
135 return -EINVAL;
136
137 if (usin->sin6_family != AF_INET6)
138 return -EAFNOSUPPORT;
139
140 memset(&fl, 0, sizeof(fl));
141
142 if (np->sndflow) {
143 fl.fl6_flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
144 IP6_ECN_flow_init(fl.fl6_flowlabel);
145 if (fl.fl6_flowlabel&IPV6_FLOWLABEL_MASK) {
146 struct ip6_flowlabel *flowlabel;
147 flowlabel = fl6_sock_lookup(sk, fl.fl6_flowlabel);
148 if (flowlabel == NULL)
149 return -EINVAL;
150 ipv6_addr_copy(&usin->sin6_addr, &flowlabel->dst);
151 fl6_sock_release(flowlabel);
152 }
153 }
154
155 /*
156 * connect() to INADDR_ANY means loopback (BSD'ism).
157 */
158
159 if (ipv6_addr_any(&usin->sin6_addr))
160 usin->sin6_addr.s6_addr[15] = 0x1;
161
162 addr_type = ipv6_addr_type(&usin->sin6_addr);
163
164 if (addr_type & IPV6_ADDR_MULTICAST)
165 return -ENETUNREACH;
166
167 if (addr_type&IPV6_ADDR_LINKLOCAL) {
168 if (addr_len >= sizeof(struct sockaddr_in6) &&
169 usin->sin6_scope_id) {
170 /* If interface is set while binding, indices
171 * must coincide.
172 */
173 if (sk->sk_bound_dev_if &&
174 sk->sk_bound_dev_if != usin->sin6_scope_id)
175 return -EINVAL;
176
177 sk->sk_bound_dev_if = usin->sin6_scope_id;
178 }
179
180 /* Connect to link-local address requires an interface */
181 if (!sk->sk_bound_dev_if)
182 return -EINVAL;
183 }
184
185 if (tp->rx_opt.ts_recent_stamp &&
186 !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
187 tp->rx_opt.ts_recent = 0;
188 tp->rx_opt.ts_recent_stamp = 0;
189 tp->write_seq = 0;
190 }
191
192 ipv6_addr_copy(&np->daddr, &usin->sin6_addr);
193 np->flow_label = fl.fl6_flowlabel;
194
195 /*
196 * TCP over IPv4
197 */
198
199 if (addr_type == IPV6_ADDR_MAPPED) {
200 u32 exthdrlen = icsk->icsk_ext_hdr_len;
201 struct sockaddr_in sin;
202
203 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
204
205 if (__ipv6_only_sock(sk))
206 return -ENETUNREACH;
207
208 sin.sin_family = AF_INET;
209 sin.sin_port = usin->sin6_port;
210 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
211
212 icsk->icsk_af_ops = &ipv6_mapped;
213 sk->sk_backlog_rcv = tcp_v4_do_rcv;
214 #ifdef CONFIG_TCP_MD5SIG
215 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
216 #endif
217
218 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
219
220 if (err) {
221 icsk->icsk_ext_hdr_len = exthdrlen;
222 icsk->icsk_af_ops = &ipv6_specific;
223 sk->sk_backlog_rcv = tcp_v6_do_rcv;
224 #ifdef CONFIG_TCP_MD5SIG
225 tp->af_specific = &tcp_sock_ipv6_specific;
226 #endif
227 goto failure;
228 } else {
229 ipv6_addr_set(&np->saddr, 0, 0, htonl(0x0000FFFF),
230 inet->saddr);
231 ipv6_addr_set(&np->rcv_saddr, 0, 0, htonl(0x0000FFFF),
232 inet->rcv_saddr);
233 }
234
235 return err;
236 }
237
238 if (!ipv6_addr_any(&np->rcv_saddr))
239 saddr = &np->rcv_saddr;
240
241 fl.proto = IPPROTO_TCP;
242 ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
243 ipv6_addr_copy(&fl.fl6_src,
244 (saddr ? saddr : &np->saddr));
245 fl.oif = sk->sk_bound_dev_if;
246 fl.fl_ip_dport = usin->sin6_port;
247 fl.fl_ip_sport = inet->sport;
248
249 if (np->opt && np->opt->srcrt) {
250 struct rt0_hdr *rt0 = (struct rt0_hdr *)np->opt->srcrt;
251 ipv6_addr_copy(&final, &fl.fl6_dst);
252 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
253 final_p = &final;
254 }
255
256 security_sk_classify_flow(sk, &fl);
257
258 err = ip6_dst_lookup(sk, &dst, &fl);
259 if (err)
260 goto failure;
261 if (final_p)
262 ipv6_addr_copy(&fl.fl6_dst, final_p);
263
264 if ((err = __xfrm_lookup(&dst, &fl, sk, XFRM_LOOKUP_WAIT)) < 0) {
265 if (err == -EREMOTE)
266 err = ip6_dst_blackhole(sk, &dst, &fl);
267 if (err < 0)
268 goto failure;
269 }
270
271 if (saddr == NULL) {
272 saddr = &fl.fl6_src;
273 ipv6_addr_copy(&np->rcv_saddr, saddr);
274 }
275
276 /* set the source address */
277 ipv6_addr_copy(&np->saddr, saddr);
278 inet->rcv_saddr = LOOPBACK4_IPV6;
279
280 sk->sk_gso_type = SKB_GSO_TCPV6;
281 __ip6_dst_store(sk, dst, NULL, NULL);
282
283 icsk->icsk_ext_hdr_len = 0;
284 if (np->opt)
285 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
286 np->opt->opt_nflen);
287
288 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
289
290 inet->dport = usin->sin6_port;
291
292 tcp_set_state(sk, TCP_SYN_SENT);
293 err = inet6_hash_connect(&tcp_death_row, sk);
294 if (err)
295 goto late_failure;
296
297 if (!tp->write_seq)
298 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
299 np->daddr.s6_addr32,
300 inet->sport,
301 inet->dport);
302
303 err = tcp_connect(sk);
304 if (err)
305 goto late_failure;
306
307 return 0;
308
309 late_failure:
310 tcp_set_state(sk, TCP_CLOSE);
311 __sk_dst_reset(sk);
312 failure:
313 inet->dport = 0;
314 sk->sk_route_caps = 0;
315 return err;
316 }
317
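/* ICMPv6 error handler. ICMPV6_PKT_TOOBIG feeds path-MTU discovery via
 * tcp_sync_mss(); all other errors are converted with icmpv6_err_convert()
 * and reported to the socket (or the matching request_sock) according to
 * its state. */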
318 static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
319 int type, int code, int offset, __be32 info)
320 {
321 struct ipv6hdr *hdr = (struct ipv6hdr*)skb->data;
322 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
323 struct ipv6_pinfo *np;
324 struct sock *sk;
325 int err;
326 struct tcp_sock *tp;
327 __u32 seq;
328
329 sk = inet6_lookup(dev_net(skb->dev), &tcp_hashinfo, &hdr->daddr,
330 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
331
332 if (sk == NULL) {
333 ICMP6_INC_STATS_BH(__in6_dev_get(skb->dev), ICMP6_MIB_INERRORS);
334 return;
335 }
336
337 if (sk->sk_state == TCP_TIME_WAIT) {
338 inet_twsk_put(inet_twsk(sk));
339 return;
340 }
341
342 bh_lock_sock(sk);
343 if (sock_owned_by_user(sk))
344 NET_INC_STATS_BH(LINUX_MIB_LOCKDROPPEDICMPS);
345
346 if (sk->sk_state == TCP_CLOSE)
347 goto out;
348
349 tp = tcp_sk(sk);
350 seq = ntohl(th->seq);
351 if (sk->sk_state != TCP_LISTEN &&
352 !between(seq, tp->snd_una, tp->snd_nxt)) {
353 NET_INC_STATS_BH(LINUX_MIB_OUTOFWINDOWICMPS);
354 goto out;
355 }
356
357 np = inet6_sk(sk);
358
359 if (type == ICMPV6_PKT_TOOBIG) {
360 struct dst_entry *dst = NULL;
361
362 if (sock_owned_by_user(sk))
363 goto out;
364 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
365 goto out;
366
367 /* icmp should have updated the destination cache entry */
368 dst = __sk_dst_check(sk, np->dst_cookie);
369
370 if (dst == NULL) {
371 struct inet_sock *inet = inet_sk(sk);
372 struct flowi fl;
373
374 /* BUGGG_FUTURE: Again, it is not clear how
375 to handle rthdr case. Ignore this complexity
376 for now.
377 */
378 memset(&fl, 0, sizeof(fl));
379 fl.proto = IPPROTO_TCP;
380 ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
381 ipv6_addr_copy(&fl.fl6_src, &np->saddr);
382 fl.oif = sk->sk_bound_dev_if;
383 fl.fl_ip_dport = inet->dport;
384 fl.fl_ip_sport = inet->sport;
385 security_skb_classify_flow(skb, &fl);
386
387 if ((err = ip6_dst_lookup(sk, &dst, &fl))) {
388 sk->sk_err_soft = -err;
389 goto out;
390 }
391
392 if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0) {
393 sk->sk_err_soft = -err;
394 goto out;
395 }
396
397 } else
398 dst_hold(dst);
399
400 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
401 tcp_sync_mss(sk, dst_mtu(dst));
402 tcp_simple_retransmit(sk);
403 } /* else let the usual retransmit timer handle it */
404 dst_release(dst);
405 goto out;
406 }
407
408 icmpv6_err_convert(type, code, &err);
409
410 /* Might be for a request_sock */
411 switch (sk->sk_state) {
412 struct request_sock *req, **prev;
413 case TCP_LISTEN:
414 if (sock_owned_by_user(sk))
415 goto out;
416
417 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
418 &hdr->saddr, inet6_iif(skb));
419 if (!req)
420 goto out;
421
422 /* ICMPs are not backlogged, hence we cannot get
423 * an established socket here.
424 */
425 BUG_TRAP(req->sk == NULL);
426
427 if (seq != tcp_rsk(req)->snt_isn) {
428 NET_INC_STATS_BH(LINUX_MIB_OUTOFWINDOWICMPS);
429 goto out;
430 }
431
432 inet_csk_reqsk_queue_drop(sk, req, prev);
433 goto out;
434
435 case TCP_SYN_SENT:
436 case TCP_SYN_RECV: /* Cannot happen.
437 It can, if SYNs are crossed. --ANK */
438 if (!sock_owned_by_user(sk)) {
439 sk->sk_err = err;
440 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
441
442 tcp_done(sk);
443 } else
444 sk->sk_err_soft = err;
445 goto out;
446 }
447
448 if (!sock_owned_by_user(sk) && np->recverr) {
449 sk->sk_err = err;
450 sk->sk_error_report(sk);
451 } else
452 sk->sk_err_soft = err;
453
454 out:
455 bh_unlock_sock(sk);
456 sock_put(sk);
457 }
458
459
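/* Build and send a SYN|ACK for a pending connection request, routing the
 * reply through any source route found in the listener's IPv6 options. */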
460 static int tcp_v6_send_synack(struct sock *sk, struct request_sock *req)
461 {
462 struct inet6_request_sock *treq = inet6_rsk(req);
463 struct ipv6_pinfo *np = inet6_sk(sk);
464 struct sk_buff * skb;
465 struct ipv6_txoptions *opt = NULL;
466 struct in6_addr * final_p = NULL, final;
467 struct flowi fl;
468 struct dst_entry *dst;
469 int err = -1;
470
471 memset(&fl, 0, sizeof(fl));
472 fl.proto = IPPROTO_TCP;
473 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
474 ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
475 fl.fl6_flowlabel = 0;
476 fl.oif = treq->iif;
477 fl.fl_ip_dport = inet_rsk(req)->rmt_port;
478 fl.fl_ip_sport = inet_sk(sk)->sport;
479 security_req_classify_flow(req, &fl);
480
481 opt = np->opt;
482 if (opt && opt->srcrt) {
483 struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
484 ipv6_addr_copy(&final, &fl.fl6_dst);
485 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
486 final_p = &final;
487 }
488
489 err = ip6_dst_lookup(sk, &dst, &fl);
490 if (err)
491 goto done;
492 if (final_p)
493 ipv6_addr_copy(&fl.fl6_dst, final_p);
494 if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
495 goto done;
496
497 skb = tcp_make_synack(sk, dst, req);
498 if (skb) {
499 struct tcphdr *th = tcp_hdr(skb);
500
501 th->check = tcp_v6_check(th, skb->len,
502 &treq->loc_addr, &treq->rmt_addr,
503 csum_partial((char *)th, skb->len, skb->csum));
504
505 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
506 err = ip6_xmit(sk, skb, &fl, opt, 0);
507 err = net_xmit_eval(err);
508 }
509
510 done:
511 if (opt && opt != np->opt)
512 sock_kfree_s(sk, opt, opt->tot_len);
513 dst_release(dst);
514 return err;
515 }
516
517 static inline void syn_flood_warning(struct sk_buff *skb)
518 {
519 #ifdef CONFIG_SYN_COOKIES
520 if (sysctl_tcp_syncookies)
521 printk(KERN_INFO
522 "TCPv6: Possible SYN flooding on port %d. "
523 "Sending cookies.\n", ntohs(tcp_hdr(skb)->dest));
524 else
525 #endif
526 printk(KERN_INFO
527 "TCPv6: Possible SYN flooding on port %d. "
528 "Dropping request.\n", ntohs(tcp_hdr(skb)->dest));
529 }
530
531 static void tcp_v6_reqsk_destructor(struct request_sock *req)
532 {
533 if (inet6_rsk(req)->pktopts)
534 kfree_skb(inet6_rsk(req)->pktopts);
535 }
536
537 #ifdef CONFIG_TCP_MD5SIG
538 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
539 struct in6_addr *addr)
540 {
541 struct tcp_sock *tp = tcp_sk(sk);
542 int i;
543
544 BUG_ON(tp == NULL);
545
546 if (!tp->md5sig_info || !tp->md5sig_info->entries6)
547 return NULL;
548
549 for (i = 0; i < tp->md5sig_info->entries6; i++) {
550 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, addr))
551 return &tp->md5sig_info->keys6[i].base;
552 }
553 return NULL;
554 }
555
556 static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
557 struct sock *addr_sk)
558 {
559 return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
560 }
561
562 static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
563 struct request_sock *req)
564 {
565 return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
566 }
567
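/* Add or update an RFC 2385 TCP-MD5 key for 'peer'. On success the key
 * table takes ownership of 'newkey'; on failure 'newkey' is freed here. */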
568 static int tcp_v6_md5_do_add(struct sock *sk, struct in6_addr *peer,
569 char *newkey, u8 newkeylen)
570 {
571 /* Add key to the list */
572 struct tcp_md5sig_key *key;
573 struct tcp_sock *tp = tcp_sk(sk);
574 struct tcp6_md5sig_key *keys;
575
576 key = tcp_v6_md5_do_lookup(sk, peer);
577 if (key) {
578 /* modify existing entry - just update that one */
579 kfree(key->key);
580 key->key = newkey;
581 key->keylen = newkeylen;
582 } else {
583 /* reallocate new list if current one is full. */
584 if (!tp->md5sig_info) {
585 tp->md5sig_info = kzalloc(sizeof(*tp->md5sig_info), GFP_ATOMIC);
586 if (!tp->md5sig_info) {
587 kfree(newkey);
588 return -ENOMEM;
589 }
590 sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
591 }
592 if (tcp_alloc_md5sig_pool() == NULL) {
593 kfree(newkey);
594 return -ENOMEM;
595 }
596 if (tp->md5sig_info->alloced6 == tp->md5sig_info->entries6) {
597 keys = kmalloc((sizeof (tp->md5sig_info->keys6[0]) *
598 (tp->md5sig_info->entries6 + 1)), GFP_ATOMIC);
599
600 if (!keys) {
601 tcp_free_md5sig_pool();
602 kfree(newkey);
603 return -ENOMEM;
604 }
605
606 if (tp->md5sig_info->entries6)
607 memmove(keys, tp->md5sig_info->keys6,
608 (sizeof (tp->md5sig_info->keys6[0]) *
609 tp->md5sig_info->entries6));
610
611 kfree(tp->md5sig_info->keys6);
612 tp->md5sig_info->keys6 = keys;
613 tp->md5sig_info->alloced6++;
614 }
615
616 ipv6_addr_copy(&tp->md5sig_info->keys6[tp->md5sig_info->entries6].addr,
617 peer);
618 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.key = newkey;
619 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.keylen = newkeylen;
620
621 tp->md5sig_info->entries6++;
622 }
623 return 0;
624 }
625
626 static int tcp_v6_md5_add_func(struct sock *sk, struct sock *addr_sk,
627 u8 *newkey, __u8 newkeylen)
628 {
629 return tcp_v6_md5_do_add(sk, &inet6_sk(addr_sk)->daddr,
630 newkey, newkeylen);
631 }
632
633 static int tcp_v6_md5_do_del(struct sock *sk, struct in6_addr *peer)
634 {
635 struct tcp_sock *tp = tcp_sk(sk);
636 int i;
637
638 for (i = 0; i < tp->md5sig_info->entries6; i++) {
639 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, peer)) {
640 /* Free the key */
641 kfree(tp->md5sig_info->keys6[i].base.key);
642 tp->md5sig_info->entries6--;
643
644 if (tp->md5sig_info->entries6 == 0) {
645 kfree(tp->md5sig_info->keys6);
646 tp->md5sig_info->keys6 = NULL;
647 tp->md5sig_info->alloced6 = 0;
648 } else {
649 /* shrink the database */
650 if (tp->md5sig_info->entries6 != i)
651 memmove(&tp->md5sig_info->keys6[i],
652 &tp->md5sig_info->keys6[i+1],
653 (tp->md5sig_info->entries6 - i)
654 * sizeof (tp->md5sig_info->keys6[0]));
655 }
656 tcp_free_md5sig_pool();
657 return 0;
658 }
659 }
660 return -ENOENT;
661 }
662
663 static void tcp_v6_clear_md5_list(struct sock *sk)
664 {
665 struct tcp_sock *tp = tcp_sk(sk);
666 int i;
667
668 if (tp->md5sig_info->entries6) {
669 for (i = 0; i < tp->md5sig_info->entries6; i++)
670 kfree(tp->md5sig_info->keys6[i].base.key);
671 tp->md5sig_info->entries6 = 0;
672 tcp_free_md5sig_pool();
673 }
674
675 kfree(tp->md5sig_info->keys6);
676 tp->md5sig_info->keys6 = NULL;
677 tp->md5sig_info->alloced6 = 0;
678
679 if (tp->md5sig_info->entries4) {
680 for (i = 0; i < tp->md5sig_info->entries4; i++)
681 kfree(tp->md5sig_info->keys4[i].base.key);
682 tp->md5sig_info->entries4 = 0;
683 tcp_free_md5sig_pool();
684 }
685
686 kfree(tp->md5sig_info->keys4);
687 tp->md5sig_info->keys4 = NULL;
688 tp->md5sig_info->alloced4 = 0;
689 }
690
691 static int tcp_v6_parse_md5_keys(struct sock *sk, char __user *optval,
692 int optlen)
693 {
694 struct tcp_md5sig cmd;
695 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
696 u8 *newkey;
697
698 if (optlen < sizeof(cmd))
699 return -EINVAL;
700
701 if (copy_from_user(&cmd, optval, sizeof(cmd)))
702 return -EFAULT;
703
704 if (sin6->sin6_family != AF_INET6)
705 return -EINVAL;
706
707 if (!cmd.tcpm_keylen) {
708 if (!tcp_sk(sk)->md5sig_info)
709 return -ENOENT;
710 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
711 return tcp_v4_md5_do_del(sk, sin6->sin6_addr.s6_addr32[3]);
712 return tcp_v6_md5_do_del(sk, &sin6->sin6_addr);
713 }
714
715 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
716 return -EINVAL;
717
718 if (!tcp_sk(sk)->md5sig_info) {
719 struct tcp_sock *tp = tcp_sk(sk);
720 struct tcp_md5sig_info *p;
721
722 p = kzalloc(sizeof(struct tcp_md5sig_info), GFP_KERNEL);
723 if (!p)
724 return -ENOMEM;
725
726 tp->md5sig_info = p;
727 sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
728 }
729
730 newkey = kmemdup(cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
731 if (!newkey)
732 return -ENOMEM;
733 if (ipv6_addr_v4mapped(&sin6->sin6_addr)) {
734 return tcp_v4_md5_do_add(sk, sin6->sin6_addr.s6_addr32[3],
735 newkey, cmd.tcpm_keylen);
736 }
737 return tcp_v6_md5_do_add(sk, &sin6->sin6_addr, newkey, cmd.tcpm_keylen);
738 }
739
740 static int tcp_v6_do_calc_md5_hash(char *md5_hash, struct tcp_md5sig_key *key,
741 struct in6_addr *saddr,
742 struct in6_addr *daddr,
743 struct tcphdr *th, unsigned int tcplen)
744 {
745 struct tcp_md5sig_pool *hp;
746 struct tcp6_pseudohdr *bp;
747 int err;
748
749 hp = tcp_get_md5sig_pool();
750 if (!hp) {
751 printk(KERN_WARNING "%s(): hash pool not found...\n", __func__);
752 goto clear_hash_noput;
753 }
754
755 bp = &hp->md5_blk.ip6;
756
757 /* 1. TCP pseudo-header (RFC2460) */
758 ipv6_addr_copy(&bp->saddr, saddr);
759 ipv6_addr_copy(&bp->daddr, daddr);
760 bp->len = htonl(tcplen);
761 bp->protocol = htonl(IPPROTO_TCP);
762
763 err = tcp_calc_md5_hash(md5_hash, key, sizeof(*bp),
764 th, tcplen, hp);
765
766 if (err)
767 goto clear_hash;
768
769 /* Free up the crypto pool */
770 tcp_put_md5sig_pool();
771 out:
772 return 0;
773 clear_hash:
774 tcp_put_md5sig_pool();
775 clear_hash_noput:
776 memset(md5_hash, 0, 16);
777 goto out;
778 }
779
780 static int tcp_v6_calc_md5_hash(char *md5_hash, struct tcp_md5sig_key *key,
781 struct sock *sk,
782 struct dst_entry *dst,
783 struct request_sock *req,
784 struct tcphdr *th, unsigned int tcplen)
785 {
786 struct in6_addr *saddr, *daddr;
787
788 if (sk) {
789 saddr = &inet6_sk(sk)->saddr;
790 daddr = &inet6_sk(sk)->daddr;
791 } else {
792 saddr = &inet6_rsk(req)->loc_addr;
793 daddr = &inet6_rsk(req)->rmt_addr;
794 }
795 return tcp_v6_do_calc_md5_hash(md5_hash, key,
796 saddr, daddr,
797 th, tcplen);
798 }
799
800 static int tcp_v6_inbound_md5_hash(struct sock *sk, struct sk_buff *skb)
801 {
802 __u8 *hash_location = NULL;
803 struct tcp_md5sig_key *hash_expected;
804 struct ipv6hdr *ip6h = ipv6_hdr(skb);
805 struct tcphdr *th = tcp_hdr(skb);
806 int genhash;
807 u8 newhash[16];
808
809 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
810 hash_location = tcp_parse_md5sig_option(th);
811
812 /* do we have a hash as expected? */
813 if (!hash_expected) {
814 if (!hash_location)
815 return 0;
816 if (net_ratelimit()) {
817 printk(KERN_INFO "MD5 Hash NOT expected but found "
818 "(" NIP6_FMT ", %u)->"
819 "(" NIP6_FMT ", %u)\n",
820 NIP6(ip6h->saddr), ntohs(th->source),
821 NIP6(ip6h->daddr), ntohs(th->dest));
822 }
823 return 1;
824 }
825
826 if (!hash_location) {
827 if (net_ratelimit()) {
828 printk(KERN_INFO "MD5 Hash expected but NOT found "
829 "(" NIP6_FMT ", %u)->"
830 "(" NIP6_FMT ", %u)\n",
831 NIP6(ip6h->saddr), ntohs(th->source),
832 NIP6(ip6h->daddr), ntohs(th->dest));
833 }
834 return 1;
835 }
836
837 /* check the signature */
838 genhash = tcp_v6_do_calc_md5_hash(newhash,
839 hash_expected,
840 &ip6h->saddr, &ip6h->daddr,
841 th, skb->len);
842 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
843 if (net_ratelimit()) {
844 printk(KERN_INFO "MD5 Hash %s for "
845 "(" NIP6_FMT ", %u)->"
846 "(" NIP6_FMT ", %u)\n",
847 genhash ? "failed" : "mismatch",
848 NIP6(ip6h->saddr), ntohs(th->source),
849 NIP6(ip6h->daddr), ntohs(th->dest));
850 }
851 return 1;
852 }
853 return 0;
854 }
855 #endif
856
857 struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
858 .family = AF_INET6,
859 .obj_size = sizeof(struct tcp6_request_sock),
860 .rtx_syn_ack = tcp_v6_send_synack,
861 .send_ack = tcp_v6_reqsk_send_ack,
862 .destructor = tcp_v6_reqsk_destructor,
863 .send_reset = tcp_v6_send_reset
864 };
865
866 #ifdef CONFIG_TCP_MD5SIG
867 static struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
868 .md5_lookup = tcp_v6_reqsk_md5_lookup,
869 };
870 #endif
871
872 static struct timewait_sock_ops tcp6_timewait_sock_ops = {
873 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
874 .twsk_unique = tcp_twsk_unique,
875 .twsk_destructor= tcp_twsk_destructor,
876 };
877
878 static void tcp_v6_send_check(struct sock *sk, int len, struct sk_buff *skb)
879 {
880 struct ipv6_pinfo *np = inet6_sk(sk);
881 struct tcphdr *th = tcp_hdr(skb);
882
883 if (skb->ip_summed == CHECKSUM_PARTIAL) {
884 th->check = ~csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP, 0);
885 skb->csum_start = skb_transport_header(skb) - skb->head;
886 skb->csum_offset = offsetof(struct tcphdr, check);
887 } else {
888 th->check = csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP,
889 csum_partial((char *)th, th->doff<<2,
890 skb->csum));
891 }
892 }
893
894 static int tcp_v6_gso_send_check(struct sk_buff *skb)
895 {
896 struct ipv6hdr *ipv6h;
897 struct tcphdr *th;
898
899 if (!pskb_may_pull(skb, sizeof(*th)))
900 return -EINVAL;
901
902 ipv6h = ipv6_hdr(skb);
903 th = tcp_hdr(skb);
904
905 th->check = 0;
906 th->check = ~csum_ipv6_magic(&ipv6h->saddr, &ipv6h->daddr, skb->len,
907 IPPROTO_TCP, 0);
908 skb->csum_start = skb_transport_header(skb) - skb->head;
909 skb->csum_offset = offsetof(struct tcphdr, check);
910 skb->ip_summed = CHECKSUM_PARTIAL;
911 return 0;
912 }
913
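/* Reply to 'skb' with a RST. The segment is built by hand on a fresh skb,
 * MD5-signed when a key is configured for the peer, and transmitted via the
 * per-namespace control socket so no local socket state is required. */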
914 static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
915 {
916 struct tcphdr *th = tcp_hdr(skb), *t1;
917 struct sk_buff *buff;
918 struct flowi fl;
919 struct net *net = dev_net(skb->dst->dev);
920 struct sock *ctl_sk = net->ipv6.tcp_sk;
921 unsigned int tot_len = sizeof(*th);
922 #ifdef CONFIG_TCP_MD5SIG
923 struct tcp_md5sig_key *key;
924 #endif
925
926 if (th->rst)
927 return;
928
929 if (!ipv6_unicast_destination(skb))
930 return;
931
932 #ifdef CONFIG_TCP_MD5SIG
933 if (sk)
934 key = tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr);
935 else
936 key = NULL;
937
938 if (key)
939 tot_len += TCPOLEN_MD5SIG_ALIGNED;
940 #endif
941
942 /*
943 * We need to grab some memory, and put together an RST,
944 * and then put it into the queue to be sent.
945 */
946
947 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
948 GFP_ATOMIC);
949 if (buff == NULL)
950 return;
951
952 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
953
954 t1 = (struct tcphdr *) skb_push(buff, tot_len);
955
956 /* Swap the send and the receive. */
957 memset(t1, 0, sizeof(*t1));
958 t1->dest = th->source;
959 t1->source = th->dest;
960 t1->doff = tot_len / 4;
961 t1->rst = 1;
962
963 if (th->ack) {
964 t1->seq = th->ack_seq;
965 } else {
966 t1->ack = 1;
967 t1->ack_seq = htonl(ntohl(th->seq) + th->syn + th->fin
968 + skb->len - (th->doff<<2));
969 }
970
971 #ifdef CONFIG_TCP_MD5SIG
972 if (key) {
973 __be32 *opt = (__be32*)(t1 + 1);
974 opt[0] = htonl((TCPOPT_NOP << 24) |
975 (TCPOPT_NOP << 16) |
976 (TCPOPT_MD5SIG << 8) |
977 TCPOLEN_MD5SIG);
978 tcp_v6_do_calc_md5_hash((__u8 *)&opt[1], key,
979 &ipv6_hdr(skb)->daddr,
980 &ipv6_hdr(skb)->saddr,
981 t1, tot_len);
982 }
983 #endif
984
985 buff->csum = csum_partial((char *)t1, sizeof(*t1), 0);
986
987 memset(&fl, 0, sizeof(fl));
988 ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
989 ipv6_addr_copy(&fl.fl6_src, &ipv6_hdr(skb)->daddr);
990
991 t1->check = csum_ipv6_magic(&fl.fl6_src, &fl.fl6_dst,
992 sizeof(*t1), IPPROTO_TCP,
993 buff->csum);
994
995 fl.proto = IPPROTO_TCP;
996 fl.oif = inet6_iif(skb);
997 fl.fl_ip_dport = t1->dest;
998 fl.fl_ip_sport = t1->source;
999 security_skb_classify_flow(skb, &fl);
1000
1001 /* Pass a socket to ip6_dst_lookup even when it is for an RST;
1002 * the underlying function will use it to retrieve the network
1003 * namespace.
1004 */
1005 if (!ip6_dst_lookup(ctl_sk, &buff->dst, &fl)) {
1006
1007 if (xfrm_lookup(&buff->dst, &fl, NULL, 0) >= 0) {
1008 ip6_xmit(ctl_sk, buff, &fl, NULL, 0);
1009 TCP_INC_STATS_BH(TCP_MIB_OUTSEGS);
1010 TCP_INC_STATS_BH(TCP_MIB_OUTRSTS);
1011 return;
1012 }
1013 }
1014
1015 kfree_skb(buff);
1016 }
1017
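/* Send a pure ACK (used for TIME_WAIT and request_sock replies), optionally
 * carrying a timestamp echo and an MD5 signature option. */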
1018 static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack, u32 win, u32 ts,
1019 struct tcp_md5sig_key *key)
1020 {
1021 struct tcphdr *th = tcp_hdr(skb), *t1;
1022 struct sk_buff *buff;
1023 struct flowi fl;
1024 struct net *net = dev_net(skb->dev);
1025 struct sock *ctl_sk = net->ipv6.tcp_sk;
1026 unsigned int tot_len = sizeof(struct tcphdr);
1027 __be32 *topt;
1028
1029 if (ts)
1030 tot_len += TCPOLEN_TSTAMP_ALIGNED;
1031 #ifdef CONFIG_TCP_MD5SIG
1032 if (key)
1033 tot_len += TCPOLEN_MD5SIG_ALIGNED;
1034 #endif
1035
1036 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
1037 GFP_ATOMIC);
1038 if (buff == NULL)
1039 return;
1040
1041 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1042
1043 t1 = (struct tcphdr *) skb_push(buff, tot_len);
1044
1045 /* Swap the send and the receive. */
1046 memset(t1, 0, sizeof(*t1));
1047 t1->dest = th->source;
1048 t1->source = th->dest;
1049 t1->doff = tot_len / 4;
1050 t1->seq = htonl(seq);
1051 t1->ack_seq = htonl(ack);
1052 t1->ack = 1;
1053 t1->window = htons(win);
1054
1055 topt = (__be32 *)(t1 + 1);
1056
1057 if (ts) {
1058 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1059 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
1060 *topt++ = htonl(tcp_time_stamp);
1061 *topt = htonl(ts);
1062 }
1063
1064 #ifdef CONFIG_TCP_MD5SIG
1065 if (key) {
1066 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1067 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
1068 tcp_v6_do_calc_md5_hash((__u8 *)topt, key,
1069 &ipv6_hdr(skb)->daddr,
1070 &ipv6_hdr(skb)->saddr,
1071 t1, tot_len);
1072 }
1073 #endif
1074
1075 buff->csum = csum_partial((char *)t1, tot_len, 0);
1076
1077 memset(&fl, 0, sizeof(fl));
1078 ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
1079 ipv6_addr_copy(&fl.fl6_src, &ipv6_hdr(skb)->daddr);
1080
1081 t1->check = csum_ipv6_magic(&fl.fl6_src, &fl.fl6_dst,
1082 tot_len, IPPROTO_TCP,
1083 buff->csum);
1084
1085 fl.proto = IPPROTO_TCP;
1086 fl.oif = inet6_iif(skb);
1087 fl.fl_ip_dport = t1->dest;
1088 fl.fl_ip_sport = t1->source;
1089 security_skb_classify_flow(skb, &fl);
1090
1091 if (!ip6_dst_lookup(ctl_sk, &buff->dst, &fl)) {
1092 if (xfrm_lookup(&buff->dst, &fl, NULL, 0) >= 0) {
1093 ip6_xmit(ctl_sk, buff, &fl, NULL, 0);
1094 TCP_INC_STATS_BH(TCP_MIB_OUTSEGS);
1095 return;
1096 }
1097 }
1098
1099 kfree_skb(buff);
1100 }
1101
1102 static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
1103 {
1104 struct inet_timewait_sock *tw = inet_twsk(sk);
1105 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1106
1107 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
1108 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
1109 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw));
1110
1111 inet_twsk_put(tw);
1112 }
1113
1114 static void tcp_v6_reqsk_send_ack(struct sk_buff *skb, struct request_sock *req)
1115 {
1116 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1, req->rcv_wnd, req->ts_recent,
1117 tcp_v6_md5_do_lookup(skb->sk, &ipv6_hdr(skb)->daddr));
1118 }
1119
1120
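/* Match an incoming segment on a listener against the pending-request table
 * and the established hash; fall back to SYN-cookie validation for bare
 * ACKs when cookies are enabled. */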
1121 static struct sock *tcp_v6_hnd_req(struct sock *sk, struct sk_buff *skb)
1122 {
1123 struct request_sock *req, **prev;
1124 const struct tcphdr *th = tcp_hdr(skb);
1125 struct sock *nsk;
1126
1127 /* Find possible connection requests. */
1128 req = inet6_csk_search_req(sk, &prev, th->source,
1129 &ipv6_hdr(skb)->saddr,
1130 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1131 if (req)
1132 return tcp_check_req(sk, skb, req, prev);
1133
1134 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
1135 &ipv6_hdr(skb)->saddr, th->source,
1136 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1137
1138 if (nsk) {
1139 if (nsk->sk_state != TCP_TIME_WAIT) {
1140 bh_lock_sock(nsk);
1141 return nsk;
1142 }
1143 inet_twsk_put(inet_twsk(nsk));
1144 return NULL;
1145 }
1146
1147 #ifdef CONFIG_SYN_COOKIES
1148 if (!th->rst && !th->syn && th->ack)
1149 sk = cookie_v6_check(sk, skb);
1150 #endif
1151 return sk;
1152 }
1153
1154 /* FIXME: this is substantially similar to the ipv4 code.
1155 * Can some kind of merge be done? -- erics
1156 */
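/* Handle a SYN on a listening socket: allocate the request_sock, parse the
 * TCP options, stash pktoptions if the user asked for them, choose the ISN
 * (or encode a SYN cookie under queue pressure) and answer with a SYN|ACK. */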
1157 static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
1158 {
1159 struct inet6_request_sock *treq;
1160 struct ipv6_pinfo *np = inet6_sk(sk);
1161 struct tcp_options_received tmp_opt;
1162 struct tcp_sock *tp = tcp_sk(sk);
1163 struct request_sock *req = NULL;
1164 __u32 isn = TCP_SKB_CB(skb)->when;
1165 #ifdef CONFIG_SYN_COOKIES
1166 int want_cookie = 0;
1167 #else
1168 #define want_cookie 0
1169 #endif
1170
1171 if (skb->protocol == htons(ETH_P_IP))
1172 return tcp_v4_conn_request(sk, skb);
1173
1174 if (!ipv6_unicast_destination(skb))
1175 goto drop;
1176
1177 if (inet_csk_reqsk_queue_is_full(sk) && !isn) {
1178 if (net_ratelimit())
1179 syn_flood_warning(skb);
1180 #ifdef CONFIG_SYN_COOKIES
1181 if (sysctl_tcp_syncookies)
1182 want_cookie = 1;
1183 else
1184 #endif
1185 goto drop;
1186 }
1187
1188 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1)
1189 goto drop;
1190
1191 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1192 if (req == NULL)
1193 goto drop;
1194
1195 #ifdef CONFIG_TCP_MD5SIG
1196 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
1197 #endif
1198
1199 tcp_clear_options(&tmp_opt);
1200 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1201 tmp_opt.user_mss = tp->rx_opt.user_mss;
1202
1203 tcp_parse_options(skb, &tmp_opt, 0);
1204
1205 if (want_cookie && !tmp_opt.saw_tstamp)
1206 tcp_clear_options(&tmp_opt);
1207
1208 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1209 tcp_openreq_init(req, &tmp_opt, skb);
1210
1211 treq = inet6_rsk(req);
1212 ipv6_addr_copy(&treq->rmt_addr, &ipv6_hdr(skb)->saddr);
1213 ipv6_addr_copy(&treq->loc_addr, &ipv6_hdr(skb)->daddr);
1214 treq->pktopts = NULL;
1215 if (!want_cookie)
1216 TCP_ECN_create_request(req, tcp_hdr(skb));
1217
1218 if (want_cookie) {
1219 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1220 req->cookie_ts = tmp_opt.tstamp_ok;
1221 } else if (!isn) {
1222 if (ipv6_opt_accepted(sk, skb) ||
1223 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1224 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1225 atomic_inc(&skb->users);
1226 treq->pktopts = skb;
1227 }
1228 treq->iif = sk->sk_bound_dev_if;
1229
1230 /* So that link locals have meaning */
1231 if (!sk->sk_bound_dev_if &&
1232 ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1233 treq->iif = inet6_iif(skb);
1234
1235 isn = tcp_v6_init_sequence(skb);
1236 }
1237
1238 tcp_rsk(req)->snt_isn = isn;
1239
1240 security_inet_conn_request(sk, skb, req);
1241
1242 if (tcp_v6_send_synack(sk, req))
1243 goto drop;
1244
1245 if (!want_cookie) {
1246 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1247 return 0;
1248 }
1249
1250 drop:
1251 if (req)
1252 reqsk_free(req);
1253
1254 return 0; /* don't send reset */
1255 }
1256
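/* Create the child socket once the handshake completes. A SYN that arrived
 * over IPv4 produces a v4-mapped child; otherwise addresses, options and any
 * MD5 key are copied over from the request and the listener. */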
1257 static struct sock *tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
1258 struct request_sock *req,
1259 struct dst_entry *dst)
1260 {
1261 struct inet6_request_sock *treq = inet6_rsk(req);
1262 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1263 struct tcp6_sock *newtcp6sk;
1264 struct inet_sock *newinet;
1265 struct tcp_sock *newtp;
1266 struct sock *newsk;
1267 struct ipv6_txoptions *opt;
1268 #ifdef CONFIG_TCP_MD5SIG
1269 struct tcp_md5sig_key *key;
1270 #endif
1271
1272 if (skb->protocol == htons(ETH_P_IP)) {
1273 /*
1274 * v6 mapped
1275 */
1276
1277 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1278
1279 if (newsk == NULL)
1280 return NULL;
1281
1282 newtcp6sk = (struct tcp6_sock *)newsk;
1283 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1284
1285 newinet = inet_sk(newsk);
1286 newnp = inet6_sk(newsk);
1287 newtp = tcp_sk(newsk);
1288
1289 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1290
1291 ipv6_addr_set(&newnp->daddr, 0, 0, htonl(0x0000FFFF),
1292 newinet->daddr);
1293
1294 ipv6_addr_set(&newnp->saddr, 0, 0, htonl(0x0000FFFF),
1295 newinet->saddr);
1296
1297 ipv6_addr_copy(&newnp->rcv_saddr, &newnp->saddr);
1298
1299 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1300 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
1301 #ifdef CONFIG_TCP_MD5SIG
1302 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1303 #endif
1304
1305 newnp->pktoptions = NULL;
1306 newnp->opt = NULL;
1307 newnp->mcast_oif = inet6_iif(skb);
1308 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1309
1310 /*
1311 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1312 * here, tcp_create_openreq_child now does this for us, see the comment in
1313 * that function for the gory details. -acme
1314 */
1315
1316 /* This is a tricky place. Until this moment the IPv4 tcp code
1317 worked with the IPv6 icsk.icsk_af_ops.
1318 Sync it now.
1319 */
1320 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1321
1322 return newsk;
1323 }
1324
1325 opt = np->opt;
1326
1327 if (sk_acceptq_is_full(sk))
1328 goto out_overflow;
1329
1330 if (dst == NULL) {
1331 struct in6_addr *final_p = NULL, final;
1332 struct flowi fl;
1333
1334 memset(&fl, 0, sizeof(fl));
1335 fl.proto = IPPROTO_TCP;
1336 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
1337 if (opt && opt->srcrt) {
1338 struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
1339 ipv6_addr_copy(&final, &fl.fl6_dst);
1340 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
1341 final_p = &final;
1342 }
1343 ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
1344 fl.oif = sk->sk_bound_dev_if;
1345 fl.fl_ip_dport = inet_rsk(req)->rmt_port;
1346 fl.fl_ip_sport = inet_sk(sk)->sport;
1347 security_req_classify_flow(req, &fl);
1348
1349 if (ip6_dst_lookup(sk, &dst, &fl))
1350 goto out;
1351
1352 if (final_p)
1353 ipv6_addr_copy(&fl.fl6_dst, final_p);
1354
1355 if ((xfrm_lookup(&dst, &fl, sk, 0)) < 0)
1356 goto out;
1357 }
1358
1359 newsk = tcp_create_openreq_child(sk, req, skb);
1360 if (newsk == NULL)
1361 goto out;
1362
1363 /*
1364 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1365 * count here, tcp_create_openreq_child now does this for us, see the
1366 * comment in that function for the gory details. -acme
1367 */
1368
1369 newsk->sk_gso_type = SKB_GSO_TCPV6;
1370 __ip6_dst_store(newsk, dst, NULL, NULL);
1371
1372 newtcp6sk = (struct tcp6_sock *)newsk;
1373 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1374
1375 newtp = tcp_sk(newsk);
1376 newinet = inet_sk(newsk);
1377 newnp = inet6_sk(newsk);
1378
1379 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1380
1381 ipv6_addr_copy(&newnp->daddr, &treq->rmt_addr);
1382 ipv6_addr_copy(&newnp->saddr, &treq->loc_addr);
1383 ipv6_addr_copy(&newnp->rcv_saddr, &treq->loc_addr);
1384 newsk->sk_bound_dev_if = treq->iif;
1385
1386 /* Now IPv6 options...
1387
1388 First: no IPv4 options.
1389 */
1390 newinet->opt = NULL;
1391 newnp->ipv6_fl_list = NULL;
1392
1393 /* Clone RX bits */
1394 newnp->rxopt.all = np->rxopt.all;
1395
1396 /* Clone pktoptions received with SYN */
1397 newnp->pktoptions = NULL;
1398 if (treq->pktopts != NULL) {
1399 newnp->pktoptions = skb_clone(treq->pktopts, GFP_ATOMIC);
1400 kfree_skb(treq->pktopts);
1401 treq->pktopts = NULL;
1402 if (newnp->pktoptions)
1403 skb_set_owner_r(newnp->pktoptions, newsk);
1404 }
1405 newnp->opt = NULL;
1406 newnp->mcast_oif = inet6_iif(skb);
1407 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1408
1409 /* Clone native IPv6 options from the listening socket (if any).
1410 
1411 Yes, keeping a reference count would be much more clever,
1412 but we do one more thing here: reattach optmem
1413 to newsk.
1414 */
1415 if (opt) {
1416 newnp->opt = ipv6_dup_options(newsk, opt);
1417 if (opt != np->opt)
1418 sock_kfree_s(sk, opt, opt->tot_len);
1419 }
1420
1421 inet_csk(newsk)->icsk_ext_hdr_len = 0;
1422 if (newnp->opt)
1423 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1424 newnp->opt->opt_flen);
1425
1426 tcp_mtup_init(newsk);
1427 tcp_sync_mss(newsk, dst_mtu(dst));
1428 newtp->advmss = dst_metric(dst, RTAX_ADVMSS);
1429 tcp_initialize_rcv_mss(newsk);
1430
1431 newinet->daddr = newinet->saddr = newinet->rcv_saddr = LOOPBACK4_IPV6;
1432
1433 #ifdef CONFIG_TCP_MD5SIG
1434 /* Copy over the MD5 key from the original socket */
1435 if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1436 /* We're using one, so create a matching key
1437 * on the newsk structure. If we fail to get
1438 * memory, then we end up not copying the key
1439 * across. Shucks.
1440 */
1441 char *newkey = kmemdup(key->key, key->keylen, GFP_ATOMIC);
1442 if (newkey != NULL)
1443 tcp_v6_md5_do_add(newsk, &inet6_sk(sk)->daddr,
1444 newkey, key->keylen);
1445 }
1446 #endif
1447
1448 __inet6_hash(newsk);
1449 __inet_inherit_port(sk, newsk);
1450
1451 return newsk;
1452
1453 out_overflow:
1454 NET_INC_STATS_BH(LINUX_MIB_LISTENOVERFLOWS);
1455 out:
1456 NET_INC_STATS_BH(LINUX_MIB_LISTENDROPS);
1457 if (opt && opt != np->opt)
1458 sock_kfree_s(sk, opt, opt->tot_len);
1459 dst_release(dst);
1460 return NULL;
1461 }
1462
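/* Receive-side checksum setup: verify CHECKSUM_COMPLETE packets against the
 * pseudo-header, checksum short packets (<= 76 bytes) immediately, and leave
 * the rest for later copy-and-checksum. */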
1463 static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1464 {
1465 if (skb->ip_summed == CHECKSUM_COMPLETE) {
1466 if (!tcp_v6_check(tcp_hdr(skb), skb->len, &ipv6_hdr(skb)->saddr,
1467 &ipv6_hdr(skb)->daddr, skb->csum)) {
1468 skb->ip_summed = CHECKSUM_UNNECESSARY;
1469 return 0;
1470 }
1471 }
1472
1473 skb->csum = ~csum_unfold(tcp_v6_check(tcp_hdr(skb), skb->len,
1474 &ipv6_hdr(skb)->saddr,
1475 &ipv6_hdr(skb)->daddr, 0));
1476
1477 if (skb->len <= 76) {
1478 return __skb_checksum_complete(skb);
1479 }
1480 return 0;
1481 }
1482
1483 /* The socket must have its spinlock held when we get
1484 * here.
1485 *
1486 * We have a potential double-lock case here, so even when
1487 * doing backlog processing we use the BH locking scheme.
1488 * This is because we cannot sleep with the original spinlock
1489 * held.
1490 */
1491 static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1492 {
1493 struct ipv6_pinfo *np = inet6_sk(sk);
1494 struct tcp_sock *tp;
1495 struct sk_buff *opt_skb = NULL;
1496
1497 /* Imagine: socket is IPv6. IPv4 packet arrives,
1498 goes to IPv4 receive handler and backlogged.
1499 From backlog it always goes here. Kerboom...
1500 Fortunately, tcp_rcv_established and rcv_established
1501 handle them correctly, but that is not the case with
1502 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1503 */
1504
1505 if (skb->protocol == htons(ETH_P_IP))
1506 return tcp_v4_do_rcv(sk, skb);
1507
1508 #ifdef CONFIG_TCP_MD5SIG
1509 if (tcp_v6_inbound_md5_hash(sk, skb))
1510 goto discard;
1511 #endif
1512
1513 if (sk_filter(sk, skb))
1514 goto discard;
1515
1516 /*
1517 * socket locking is here for SMP purposes as backlog rcv
1518 * is currently called with bh processing disabled.
1519 */
1520
1521 /* Do Stevens' IPV6_PKTOPTIONS.
1522
1523 Yes, guys, it is the only place in our code, where we
1524 may make it not affecting IPv4.
1525 The rest of code is protocol independent,
1526 and I do not like idea to uglify IPv4.
1527
1528 Actually, the whole idea behind IPV6_PKTOPTIONS
1529 looks not very well thought out. For now we latch the
1530 options received in the last packet enqueued
1531 by tcp. Feel free to propose a better solution.
1532 --ANK (980728)
1533 */
1534 if (np->rxopt.all)
1535 opt_skb = skb_clone(skb, GFP_ATOMIC);
1536
1537 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
1538 TCP_CHECK_TIMER(sk);
1539 if (tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len))
1540 goto reset;
1541 TCP_CHECK_TIMER(sk);
1542 if (opt_skb)
1543 goto ipv6_pktoptions;
1544 return 0;
1545 }
1546
1547 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1548 goto csum_err;
1549
1550 if (sk->sk_state == TCP_LISTEN) {
1551 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1552 if (!nsk)
1553 goto discard;
1554
1555 /*
1556 * Queue it on the new socket if the new socket is active,
1557 * otherwise we just short-circuit this and continue with
1558 * the new socket.
1559 */
1560 if (nsk != sk) {
1561 if (tcp_child_process(sk, nsk, skb))
1562 goto reset;
1563 if (opt_skb)
1564 __kfree_skb(opt_skb);
1565 return 0;
1566 }
1567 }
1568
1569 TCP_CHECK_TIMER(sk);
1570 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1571 goto reset;
1572 TCP_CHECK_TIMER(sk);
1573 if (opt_skb)
1574 goto ipv6_pktoptions;
1575 return 0;
1576
1577 reset:
1578 tcp_v6_send_reset(sk, skb);
1579 discard:
1580 if (opt_skb)
1581 __kfree_skb(opt_skb);
1582 kfree_skb(skb);
1583 return 0;
1584 csum_err:
1585 TCP_INC_STATS_BH(TCP_MIB_INERRS);
1586 goto discard;
1587
1588
1589 ipv6_pktoptions:
1590 /* You may ask, what is this?
1591
1592 1. skb was enqueued by tcp.
1593 2. skb is added to tail of read queue, rather than out of order.
1594 3. socket is not in passive state.
1595 4. Finally, it really contains options, which user wants to receive.
1596 */
1597 tp = tcp_sk(sk);
1598 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1599 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
1600 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
1601 np->mcast_oif = inet6_iif(opt_skb);
1602 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
1603 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
1604 if (ipv6_opt_accepted(sk, opt_skb)) {
1605 skb_set_owner_r(opt_skb, sk);
1606 opt_skb = xchg(&np->pktoptions, opt_skb);
1607 } else {
1608 __kfree_skb(opt_skb);
1609 opt_skb = xchg(&np->pktoptions, NULL);
1610 }
1611 }
1612
1613 if (opt_skb)
1614 kfree_skb(opt_skb);
1615 return 0;
1616 }
1617
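/* Protocol receive entry point (registered as tcpv6_protocol below):
 * sanity-check the header and checksum, fill TCP_SKB_CB(), look the socket
 * up in tcp_hashinfo and then process, prequeue or backlog the segment
 * depending on whether the socket is owned by user context. */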
1618 static int tcp_v6_rcv(struct sk_buff *skb)
1619 {
1620 struct tcphdr *th;
1621 struct sock *sk;
1622 int ret;
1623
1624 if (skb->pkt_type != PACKET_HOST)
1625 goto discard_it;
1626
1627 /*
1628 * Count it even if it's bad.
1629 */
1630 TCP_INC_STATS_BH(TCP_MIB_INSEGS);
1631
1632 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1633 goto discard_it;
1634
1635 th = tcp_hdr(skb);
1636
1637 if (th->doff < sizeof(struct tcphdr)/4)
1638 goto bad_packet;
1639 if (!pskb_may_pull(skb, th->doff*4))
1640 goto discard_it;
1641
1642 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
1643 goto bad_packet;
1644
1645 th = tcp_hdr(skb);
1646 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1647 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1648 skb->len - th->doff*4);
1649 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1650 TCP_SKB_CB(skb)->when = 0;
1651 TCP_SKB_CB(skb)->flags = ipv6_get_dsfield(ipv6_hdr(skb));
1652 TCP_SKB_CB(skb)->sacked = 0;
1653
1654 sk = __inet6_lookup(dev_net(skb->dev), &tcp_hashinfo,
1655 &ipv6_hdr(skb)->saddr, th->source,
1656 &ipv6_hdr(skb)->daddr, ntohs(th->dest),
1657 inet6_iif(skb));
1658
1659 if (!sk)
1660 goto no_tcp_socket;
1661
1662 process:
1663 if (sk->sk_state == TCP_TIME_WAIT)
1664 goto do_time_wait;
1665
1666 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1667 goto discard_and_relse;
1668
1669 if (sk_filter(sk, skb))
1670 goto discard_and_relse;
1671
1672 skb->dev = NULL;
1673
1674 bh_lock_sock_nested(sk);
1675 ret = 0;
1676 if (!sock_owned_by_user(sk)) {
1677 #ifdef CONFIG_NET_DMA
1678 struct tcp_sock *tp = tcp_sk(sk);
1679 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
1680 tp->ucopy.dma_chan = get_softnet_dma();
1681 if (tp->ucopy.dma_chan)
1682 ret = tcp_v6_do_rcv(sk, skb);
1683 else
1684 #endif
1685 {
1686 if (!tcp_prequeue(sk, skb))
1687 ret = tcp_v6_do_rcv(sk, skb);
1688 }
1689 } else
1690 sk_add_backlog(sk, skb);
1691 bh_unlock_sock(sk);
1692
1693 sock_put(sk);
1694 return ret ? -1 : 0;
1695
1696 no_tcp_socket:
1697 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1698 goto discard_it;
1699
1700 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1701 bad_packet:
1702 TCP_INC_STATS_BH(TCP_MIB_INERRS);
1703 } else {
1704 tcp_v6_send_reset(NULL, skb);
1705 }
1706
1707 discard_it:
1708
1709 /*
1710 * Discard frame
1711 */
1712
1713 kfree_skb(skb);
1714 return 0;
1715
1716 discard_and_relse:
1717 sock_put(sk);
1718 goto discard_it;
1719
1720 do_time_wait:
1721 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
1722 inet_twsk_put(inet_twsk(sk));
1723 goto discard_it;
1724 }
1725
1726 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1727 TCP_INC_STATS_BH(TCP_MIB_INERRS);
1728 inet_twsk_put(inet_twsk(sk));
1729 goto discard_it;
1730 }
1731
1732 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1733 case TCP_TW_SYN:
1734 {
1735 struct sock *sk2;
1736
1737 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
1738 &ipv6_hdr(skb)->daddr,
1739 ntohs(th->dest), inet6_iif(skb));
1740 if (sk2 != NULL) {
1741 struct inet_timewait_sock *tw = inet_twsk(sk);
1742 inet_twsk_deschedule(tw, &tcp_death_row);
1743 inet_twsk_put(tw);
1744 sk = sk2;
1745 goto process;
1746 }
1747 /* Fall through to ACK */
1748 }
1749 case TCP_TW_ACK:
1750 tcp_v6_timewait_ack(sk, skb);
1751 break;
1752 case TCP_TW_RST:
1753 goto no_tcp_socket;
1754 case TCP_TW_SUCCESS:;
1755 }
1756 goto discard_it;
1757 }
1758
1759 static int tcp_v6_remember_stamp(struct sock *sk)
1760 {
1761 /* Alas, not yet... */
1762 return 0;
1763 }
1764
1765 static struct inet_connection_sock_af_ops ipv6_specific = {
1766 .queue_xmit = inet6_csk_xmit,
1767 .send_check = tcp_v6_send_check,
1768 .rebuild_header = inet6_sk_rebuild_header,
1769 .conn_request = tcp_v6_conn_request,
1770 .syn_recv_sock = tcp_v6_syn_recv_sock,
1771 .remember_stamp = tcp_v6_remember_stamp,
1772 .net_header_len = sizeof(struct ipv6hdr),
1773 .setsockopt = ipv6_setsockopt,
1774 .getsockopt = ipv6_getsockopt,
1775 .addr2sockaddr = inet6_csk_addr2sockaddr,
1776 .sockaddr_len = sizeof(struct sockaddr_in6),
1777 .bind_conflict = inet6_csk_bind_conflict,
1778 #ifdef CONFIG_COMPAT
1779 .compat_setsockopt = compat_ipv6_setsockopt,
1780 .compat_getsockopt = compat_ipv6_getsockopt,
1781 #endif
1782 };
1783
1784 #ifdef CONFIG_TCP_MD5SIG
1785 static struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
1786 .md5_lookup = tcp_v6_md5_lookup,
1787 .calc_md5_hash = tcp_v6_calc_md5_hash,
1788 .md5_add = tcp_v6_md5_add_func,
1789 .md5_parse = tcp_v6_parse_md5_keys,
1790 };
1791 #endif
1792
1793 /*
1794 * TCP over IPv4 via INET6 API
1795 */
1796
1797 static struct inet_connection_sock_af_ops ipv6_mapped = {
1798 .queue_xmit = ip_queue_xmit,
1799 .send_check = tcp_v4_send_check,
1800 .rebuild_header = inet_sk_rebuild_header,
1801 .conn_request = tcp_v6_conn_request,
1802 .syn_recv_sock = tcp_v6_syn_recv_sock,
1803 .remember_stamp = tcp_v4_remember_stamp,
1804 .net_header_len = sizeof(struct iphdr),
1805 .setsockopt = ipv6_setsockopt,
1806 .getsockopt = ipv6_getsockopt,
1807 .addr2sockaddr = inet6_csk_addr2sockaddr,
1808 .sockaddr_len = sizeof(struct sockaddr_in6),
1809 .bind_conflict = inet6_csk_bind_conflict,
1810 #ifdef CONFIG_COMPAT
1811 .compat_setsockopt = compat_ipv6_setsockopt,
1812 .compat_getsockopt = compat_ipv6_getsockopt,
1813 #endif
1814 };
1815
1816 #ifdef CONFIG_TCP_MD5SIG
1817 static struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
1818 .md5_lookup = tcp_v4_md5_lookup,
1819 .calc_md5_hash = tcp_v4_calc_md5_hash,
1820 .md5_add = tcp_v6_md5_add_func,
1821 .md5_parse = tcp_v6_parse_md5_keys,
1822 };
1823 #endif
1824
1825 /* NOTE: A lot of things are set to zero explicitly by the call to
1826 * sk_alloc(), so they need not be done here.
1827 */
1828 static int tcp_v6_init_sock(struct sock *sk)
1829 {
1830 struct inet_connection_sock *icsk = inet_csk(sk);
1831 struct tcp_sock *tp = tcp_sk(sk);
1832
1833 skb_queue_head_init(&tp->out_of_order_queue);
1834 tcp_init_xmit_timers(sk);
1835 tcp_prequeue_init(tp);
1836
1837 icsk->icsk_rto = TCP_TIMEOUT_INIT;
1838 tp->mdev = TCP_TIMEOUT_INIT;
1839
1840 /* So many TCP implementations out there (incorrectly) count the
1841 * initial SYN frame in their delayed-ACK and congestion control
1842 * algorithms that we must have the following bandaid to talk
1843 * efficiently to them. -DaveM
1844 */
1845 tp->snd_cwnd = 2;
1846
1847 /* See draft-stevens-tcpca-spec-01 for discussion of the
1848 * initialization of these values.
1849 */
1850 tp->snd_ssthresh = 0x7fffffff;
1851 tp->snd_cwnd_clamp = ~0;
1852 tp->mss_cache = 536;
1853
1854 tp->reordering = sysctl_tcp_reordering;
1855
1856 sk->sk_state = TCP_CLOSE;
1857
1858 icsk->icsk_af_ops = &ipv6_specific;
1859 icsk->icsk_ca_ops = &tcp_init_congestion_ops;
1860 icsk->icsk_sync_mss = tcp_sync_mss;
1861 sk->sk_write_space = sk_stream_write_space;
1862 sock_set_flag(sk, SOCK_USE_WRITE_QUEUE);
1863
1864 #ifdef CONFIG_TCP_MD5SIG
1865 tp->af_specific = &tcp_sock_ipv6_specific;
1866 #endif
1867
1868 sk->sk_sndbuf = sysctl_tcp_wmem[1];
1869 sk->sk_rcvbuf = sysctl_tcp_rmem[1];
1870
1871 atomic_inc(&tcp_sockets_allocated);
1872
1873 return 0;
1874 }
1875
1876 static int tcp_v6_destroy_sock(struct sock *sk)
1877 {
1878 #ifdef CONFIG_TCP_MD5SIG
1879 /* Clean up the MD5 key list */
1880 if (tcp_sk(sk)->md5sig_info)
1881 tcp_v6_clear_md5_list(sk);
1882 #endif
1883 tcp_v4_destroy_sock(sk);
1884 return inet6_destroy_sock(sk);
1885 }
1886
1887 #ifdef CONFIG_PROC_FS
1888 /* Proc filesystem TCPv6 sock list dumping. */
1889 static void get_openreq6(struct seq_file *seq,
1890 struct sock *sk, struct request_sock *req, int i, int uid)
1891 {
1892 int ttd = req->expires - jiffies;
1893 struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1894 struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
1895
1896 if (ttd < 0)
1897 ttd = 0;
1898
1899 seq_printf(seq,
1900 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1901 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
1902 i,
1903 src->s6_addr32[0], src->s6_addr32[1],
1904 src->s6_addr32[2], src->s6_addr32[3],
1905 ntohs(inet_sk(sk)->sport),
1906 dest->s6_addr32[0], dest->s6_addr32[1],
1907 dest->s6_addr32[2], dest->s6_addr32[3],
1908 ntohs(inet_rsk(req)->rmt_port),
1909 TCP_SYN_RECV,
1910 0, 0, /* could print option size, but that is af dependent. */
1911 1, /* timers active (only the expire timer) */
1912 jiffies_to_clock_t(ttd),
1913 req->retrans,
1914 uid,
1915 0, /* non standard timer */
1916 0, /* open_requests have no inode */
1917 0, req);
1918 }
1919
1920 static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1921 {
1922 struct in6_addr *dest, *src;
1923 __u16 destp, srcp;
1924 int timer_active;
1925 unsigned long timer_expires;
1926 struct inet_sock *inet = inet_sk(sp);
1927 struct tcp_sock *tp = tcp_sk(sp);
1928 const struct inet_connection_sock *icsk = inet_csk(sp);
1929 struct ipv6_pinfo *np = inet6_sk(sp);
1930
1931 dest = &np->daddr;
1932 src = &np->rcv_saddr;
1933 destp = ntohs(inet->dport);
1934 srcp = ntohs(inet->sport);
1935
1936 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1937 timer_active = 1;
1938 timer_expires = icsk->icsk_timeout;
1939 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1940 timer_active = 4;
1941 timer_expires = icsk->icsk_timeout;
1942 } else if (timer_pending(&sp->sk_timer)) {
1943 timer_active = 2;
1944 timer_expires = sp->sk_timer.expires;
1945 } else {
1946 timer_active = 0;
1947 timer_expires = jiffies;
1948 }
1949
1950 seq_printf(seq,
1951 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1952 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %p %u %u %u %u %d\n",
1953 i,
1954 src->s6_addr32[0], src->s6_addr32[1],
1955 src->s6_addr32[2], src->s6_addr32[3], srcp,
1956 dest->s6_addr32[0], dest->s6_addr32[1],
1957 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1958 sp->sk_state,
1959 tp->write_seq - tp->snd_una,
1960 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1961 timer_active,
1962 jiffies_to_clock_t(timer_expires - jiffies),
1963 icsk->icsk_retransmits,
1964 sock_i_uid(sp),
1965 icsk->icsk_probes_out,
1966 sock_i_ino(sp),
1967 atomic_read(&sp->sk_refcnt), sp,
1968 icsk->icsk_rto,
1969 icsk->icsk_ack.ato,
1970 (icsk->icsk_ack.quick << 1) | icsk->icsk_ack.pingpong,
1971 tp->snd_cwnd, tp->snd_ssthresh >= 0xFFFF ? -1 : tp->snd_ssthresh
1972 );
1973 }
1974
1975 static void get_timewait6_sock(struct seq_file *seq,
1976 struct inet_timewait_sock *tw, int i)
1977 {
1978 struct in6_addr *dest, *src;
1979 __u16 destp, srcp;
1980 struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
1981 int ttd = tw->tw_ttd - jiffies;
1982
1983 if (ttd < 0)
1984 ttd = 0;
1985
1986 dest = &tw6->tw_v6_daddr;
1987 src = &tw6->tw_v6_rcv_saddr;
1988 destp = ntohs(tw->tw_dport);
1989 srcp = ntohs(tw->tw_sport);
1990
1991 seq_printf(seq,
1992 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1993 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
1994 i,
1995 src->s6_addr32[0], src->s6_addr32[1],
1996 src->s6_addr32[2], src->s6_addr32[3], srcp,
1997 dest->s6_addr32[0], dest->s6_addr32[1],
1998 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1999 tw->tw_substate, 0, 0,
2000 3, jiffies_to_clock_t(ttd), 0, 0, 0, 0,
2001 atomic_read(&tw->tw_refcnt), tw);
2002 }
2003
2004 static int tcp6_seq_show(struct seq_file *seq, void *v)
2005 {
2006 struct tcp_iter_state *st;
2007
2008 if (v == SEQ_START_TOKEN) {
2009 seq_puts(seq,
2010 " sl "
2011 "local_address "
2012 "remote_address "
2013 "st tx_queue rx_queue tr tm->when retrnsmt"
2014 " uid timeout inode\n");
2015 goto out;
2016 }
2017 st = seq->private;
2018
2019 switch (st->state) {
2020 case TCP_SEQ_STATE_LISTENING:
2021 case TCP_SEQ_STATE_ESTABLISHED:
2022 get_tcp6_sock(seq, v, st->num);
2023 break;
2024 case TCP_SEQ_STATE_OPENREQ:
2025 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
2026 break;
2027 case TCP_SEQ_STATE_TIME_WAIT:
2028 get_timewait6_sock(seq, v, st->num);
2029 break;
2030 }
2031 out:
2032 return 0;
2033 }
2034
2035 static struct tcp_seq_afinfo tcp6_seq_afinfo = {
2036 .name = "tcp6",
2037 .family = AF_INET6,
2038 .seq_fops = {
2039 .owner = THIS_MODULE,
2040 },
2041 .seq_ops = {
2042 .show = tcp6_seq_show,
2043 },
2044 };
2045
2046 int tcp6_proc_init(struct net *net)
2047 {
2048 return tcp_proc_register(net, &tcp6_seq_afinfo);
2049 }
2050
2051 void tcp6_proc_exit(struct net *net)
2052 {
2053 tcp_proc_unregister(net, &tcp6_seq_afinfo);
2054 }
2055 #endif
2056
2057 struct proto tcpv6_prot = {
2058 .name = "TCPv6",
2059 .owner = THIS_MODULE,
2060 .close = tcp_close,
2061 .connect = tcp_v6_connect,
2062 .disconnect = tcp_disconnect,
2063 .accept = inet_csk_accept,
2064 .ioctl = tcp_ioctl,
2065 .init = tcp_v6_init_sock,
2066 .destroy = tcp_v6_destroy_sock,
2067 .shutdown = tcp_shutdown,
2068 .setsockopt = tcp_setsockopt,
2069 .getsockopt = tcp_getsockopt,
2070 .recvmsg = tcp_recvmsg,
2071 .backlog_rcv = tcp_v6_do_rcv,
2072 .hash = tcp_v6_hash,
2073 .unhash = inet_unhash,
2074 .get_port = inet_csk_get_port,
2075 .enter_memory_pressure = tcp_enter_memory_pressure,
2076 .sockets_allocated = &tcp_sockets_allocated,
2077 .memory_allocated = &tcp_memory_allocated,
2078 .memory_pressure = &tcp_memory_pressure,
2079 .orphan_count = &tcp_orphan_count,
2080 .sysctl_mem = sysctl_tcp_mem,
2081 .sysctl_wmem = sysctl_tcp_wmem,
2082 .sysctl_rmem = sysctl_tcp_rmem,
2083 .max_header = MAX_TCP_HEADER,
2084 .obj_size = sizeof(struct tcp6_sock),
2085 .twsk_prot = &tcp6_timewait_sock_ops,
2086 .rsk_prot = &tcp6_request_sock_ops,
2087 .h.hashinfo = &tcp_hashinfo,
2088 #ifdef CONFIG_COMPAT
2089 .compat_setsockopt = compat_tcp_setsockopt,
2090 .compat_getsockopt = compat_tcp_getsockopt,
2091 #endif
2092 };
2093
2094 static struct inet6_protocol tcpv6_protocol = {
2095 .handler = tcp_v6_rcv,
2096 .err_handler = tcp_v6_err,
2097 .gso_send_check = tcp_v6_gso_send_check,
2098 .gso_segment = tcp_tso_segment,
2099 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
2100 };
2101
2102 static struct inet_protosw tcpv6_protosw = {
2103 .type = SOCK_STREAM,
2104 .protocol = IPPROTO_TCP,
2105 .prot = &tcpv6_prot,
2106 .ops = &inet6_stream_ops,
2107 .capability = -1,
2108 .no_check = 0,
2109 .flags = INET_PROTOSW_PERMANENT |
2110 INET_PROTOSW_ICSK,
2111 };
2112
2113 static int tcpv6_net_init(struct net *net)
2114 {
2115 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
2116 SOCK_RAW, IPPROTO_TCP, net);
2117 }
2118
2119 static void tcpv6_net_exit(struct net *net)
2120 {
2121 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
2122 }
2123
2124 static struct pernet_operations tcpv6_net_ops = {
2125 .init = tcpv6_net_init,
2126 .exit = tcpv6_net_exit,
2127 };
2128
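/* Register the protocol handler, the protosw entry and the per-namespace
 * control socket; on failure, unwind in the reverse order of registration. */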
2129 int __init tcpv6_init(void)
2130 {
2131 int ret;
2132
2133 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2134 if (ret)
2135 goto out;
2136
2137 /* register inet6 protocol */
2138 ret = inet6_register_protosw(&tcpv6_protosw);
2139 if (ret)
2140 goto out_tcpv6_protocol;
2141
2142 ret = register_pernet_subsys(&tcpv6_net_ops);
2143 if (ret)
2144 goto out_tcpv6_protosw;
2145 out:
2146 return ret;
2147
2148 out_tcpv6_protosw:
2149 	inet6_unregister_protosw(&tcpv6_protosw);
2150 out_tcpv6_protocol:
2151 	inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2152 	goto out;
2153 }
2154
2155 void tcpv6_exit(void)
2156 {
2157 unregister_pernet_subsys(&tcpv6_net_ops);
2158 inet6_unregister_protosw(&tcpv6_protosw);
2159 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2160 }