Merge branch 'master' of master.kernel.org:/pub/scm/linux/kernel/git/davem/net-2.6
[deliverable/linux.git] / net / ipv6 / tcp_ipv6.c
1 /*
2 * TCP over IPv6
3 * Linux INET6 implementation
4 *
5 * Authors:
6 * Pedro Roque <roque@di.fc.ul.pt>
7 *
8 * Based on:
9 * linux/net/ipv4/tcp.c
10 * linux/net/ipv4/tcp_input.c
11 * linux/net/ipv4/tcp_output.c
12 *
13 * Fixes:
14 * Hideaki YOSHIFUJI : sin6_scope_id support
15 * YOSHIFUJI Hideaki @USAGI and: Support IPV6_V6ONLY socket option, which
16 * Alexey Kuznetsov allow both IPv4 and IPv6 sockets to bind
17 * a single port at the same time.
18 * YOSHIFUJI Hideaki @USAGI: convert /proc/net/tcp6 to seq_file.
19 *
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
24 */
25
26 #include <linux/module.h>
27 #include <linux/errno.h>
28 #include <linux/types.h>
29 #include <linux/socket.h>
30 #include <linux/sockios.h>
31 #include <linux/net.h>
32 #include <linux/jiffies.h>
33 #include <linux/in.h>
34 #include <linux/in6.h>
35 #include <linux/netdevice.h>
36 #include <linux/init.h>
37 #include <linux/jhash.h>
38 #include <linux/ipsec.h>
39 #include <linux/times.h>
40
41 #include <linux/ipv6.h>
42 #include <linux/icmpv6.h>
43 #include <linux/random.h>
44
45 #include <net/tcp.h>
46 #include <net/ndisc.h>
47 #include <net/inet6_hashtables.h>
48 #include <net/inet6_connection_sock.h>
49 #include <net/ipv6.h>
50 #include <net/transp_v6.h>
51 #include <net/addrconf.h>
52 #include <net/ip6_route.h>
53 #include <net/ip6_checksum.h>
54 #include <net/inet_ecn.h>
55 #include <net/protocol.h>
56 #include <net/xfrm.h>
57 #include <net/snmp.h>
58 #include <net/dsfield.h>
59 #include <net/timewait_sock.h>
60 #include <net/netdma.h>
61 #include <net/inet_common.h>
62
63 #include <asm/uaccess.h>
64
65 #include <linux/proc_fs.h>
66 #include <linux/seq_file.h>
67
68 #include <linux/crypto.h>
69 #include <linux/scatterlist.h>
70
71 static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
72 static void tcp_v6_reqsk_send_ack(struct sk_buff *skb, struct request_sock *req);
73
74 static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
75
76 static struct inet_connection_sock_af_ops ipv6_mapped;
77 static struct inet_connection_sock_af_ops ipv6_specific;
78 #ifdef CONFIG_TCP_MD5SIG
79 static struct tcp_sock_af_ops tcp_sock_ipv6_specific;
80 static struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
81 #else
82 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
83 struct in6_addr *addr)
84 {
85 return NULL;
86 }
87 #endif
88
89 static void tcp_v6_hash(struct sock *sk)
90 {
91 if (sk->sk_state != TCP_CLOSE) {
92 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
93 tcp_prot.hash(sk);
94 return;
95 }
96 local_bh_disable();
97 __inet6_hash(sk);
98 local_bh_enable();
99 }
100 }
101
102 static __inline__ __sum16 tcp_v6_check(struct tcphdr *th, int len,
103 struct in6_addr *saddr,
104 struct in6_addr *daddr,
105 __wsum base)
106 {
107 return csum_ipv6_magic(saddr, daddr, len, IPPROTO_TCP, base);
108 }
109
110 static __u32 tcp_v6_init_sequence(struct sk_buff *skb)
111 {
112 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
113 ipv6_hdr(skb)->saddr.s6_addr32,
114 tcp_hdr(skb)->dest,
115 tcp_hdr(skb)->source);
116 }
117
118 static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
119 int addr_len)
120 {
121 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
122 struct inet_sock *inet = inet_sk(sk);
123 struct inet_connection_sock *icsk = inet_csk(sk);
124 struct ipv6_pinfo *np = inet6_sk(sk);
125 struct tcp_sock *tp = tcp_sk(sk);
126 struct in6_addr *saddr = NULL, *final_p = NULL, final;
127 struct flowi fl;
128 struct dst_entry *dst;
129 int addr_type;
130 int err;
131
132 if (addr_len < SIN6_LEN_RFC2133)
133 return -EINVAL;
134
135 if (usin->sin6_family != AF_INET6)
136 return(-EAFNOSUPPORT);
137
138 memset(&fl, 0, sizeof(fl));
139
140 if (np->sndflow) {
141 fl.fl6_flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
142 IP6_ECN_flow_init(fl.fl6_flowlabel);
143 if (fl.fl6_flowlabel&IPV6_FLOWLABEL_MASK) {
144 struct ip6_flowlabel *flowlabel;
145 flowlabel = fl6_sock_lookup(sk, fl.fl6_flowlabel);
146 if (flowlabel == NULL)
147 return -EINVAL;
148 ipv6_addr_copy(&usin->sin6_addr, &flowlabel->dst);
149 fl6_sock_release(flowlabel);
150 }
151 }
152
153 /*
154 * connect() to INADDR_ANY means loopback (BSD'ism).
155 */
156
157 if(ipv6_addr_any(&usin->sin6_addr))
158 usin->sin6_addr.s6_addr[15] = 0x1;
159
160 addr_type = ipv6_addr_type(&usin->sin6_addr);
161
162 if(addr_type & IPV6_ADDR_MULTICAST)
163 return -ENETUNREACH;
164
165 if (addr_type&IPV6_ADDR_LINKLOCAL) {
166 if (addr_len >= sizeof(struct sockaddr_in6) &&
167 usin->sin6_scope_id) {
168 /* If interface is set while binding, indices
169 * must coincide.
170 */
171 if (sk->sk_bound_dev_if &&
172 sk->sk_bound_dev_if != usin->sin6_scope_id)
173 return -EINVAL;
174
175 sk->sk_bound_dev_if = usin->sin6_scope_id;
176 }
177
178 /* Connect to link-local address requires an interface */
179 if (!sk->sk_bound_dev_if)
180 return -EINVAL;
181 }
182
183 if (tp->rx_opt.ts_recent_stamp &&
184 !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
185 tp->rx_opt.ts_recent = 0;
186 tp->rx_opt.ts_recent_stamp = 0;
187 tp->write_seq = 0;
188 }
189
190 ipv6_addr_copy(&np->daddr, &usin->sin6_addr);
191 np->flow_label = fl.fl6_flowlabel;
192
193 /*
194 * TCP over IPv4
195 */
196
197 if (addr_type == IPV6_ADDR_MAPPED) {
198 u32 exthdrlen = icsk->icsk_ext_hdr_len;
199 struct sockaddr_in sin;
200
201 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
202
203 if (__ipv6_only_sock(sk))
204 return -ENETUNREACH;
205
206 sin.sin_family = AF_INET;
207 sin.sin_port = usin->sin6_port;
208 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
209
210 icsk->icsk_af_ops = &ipv6_mapped;
211 sk->sk_backlog_rcv = tcp_v4_do_rcv;
212 #ifdef CONFIG_TCP_MD5SIG
213 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
214 #endif
215
216 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
217
218 if (err) {
219 icsk->icsk_ext_hdr_len = exthdrlen;
220 icsk->icsk_af_ops = &ipv6_specific;
221 sk->sk_backlog_rcv = tcp_v6_do_rcv;
222 #ifdef CONFIG_TCP_MD5SIG
223 tp->af_specific = &tcp_sock_ipv6_specific;
224 #endif
225 goto failure;
226 } else {
227 ipv6_addr_set(&np->saddr, 0, 0, htonl(0x0000FFFF),
228 inet->saddr);
229 ipv6_addr_set(&np->rcv_saddr, 0, 0, htonl(0x0000FFFF),
230 inet->rcv_saddr);
231 }
232
233 return err;
234 }
235
236 if (!ipv6_addr_any(&np->rcv_saddr))
237 saddr = &np->rcv_saddr;
238
239 fl.proto = IPPROTO_TCP;
240 ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
241 ipv6_addr_copy(&fl.fl6_src,
242 (saddr ? saddr : &np->saddr));
243 fl.oif = sk->sk_bound_dev_if;
244 fl.fl_ip_dport = usin->sin6_port;
245 fl.fl_ip_sport = inet->sport;
246
247 if (np->opt && np->opt->srcrt) {
248 struct rt0_hdr *rt0 = (struct rt0_hdr *)np->opt->srcrt;
249 ipv6_addr_copy(&final, &fl.fl6_dst);
250 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
251 final_p = &final;
252 }
253
254 security_sk_classify_flow(sk, &fl);
255
256 err = ip6_dst_lookup(sk, &dst, &fl);
257 if (err)
258 goto failure;
259 if (final_p)
260 ipv6_addr_copy(&fl.fl6_dst, final_p);
261
262 if ((err = __xfrm_lookup(&dst, &fl, sk, XFRM_LOOKUP_WAIT)) < 0) {
263 if (err == -EREMOTE)
264 err = ip6_dst_blackhole(sk, &dst, &fl);
265 if (err < 0)
266 goto failure;
267 }
268
269 if (saddr == NULL) {
270 saddr = &fl.fl6_src;
271 ipv6_addr_copy(&np->rcv_saddr, saddr);
272 }
273
274 /* set the source address */
275 ipv6_addr_copy(&np->saddr, saddr);
276 inet->rcv_saddr = LOOPBACK4_IPV6;
277
278 sk->sk_gso_type = SKB_GSO_TCPV6;
279 __ip6_dst_store(sk, dst, NULL, NULL);
280
281 icsk->icsk_ext_hdr_len = 0;
282 if (np->opt)
283 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
284 np->opt->opt_nflen);
285
286 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
287
288 inet->dport = usin->sin6_port;
289
290 tcp_set_state(sk, TCP_SYN_SENT);
291 err = inet6_hash_connect(&tcp_death_row, sk);
292 if (err)
293 goto late_failure;
294
295 if (!tp->write_seq)
296 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
297 np->daddr.s6_addr32,
298 inet->sport,
299 inet->dport);
300
301 err = tcp_connect(sk);
302 if (err)
303 goto late_failure;
304
305 return 0;
306
307 late_failure:
308 tcp_set_state(sk, TCP_CLOSE);
309 __sk_dst_reset(sk);
310 failure:
311 inet->dport = 0;
312 sk->sk_route_caps = 0;
313 return err;
314 }
315
316 static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
317 int type, int code, int offset, __be32 info)
318 {
319 struct ipv6hdr *hdr = (struct ipv6hdr*)skb->data;
320 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
321 struct ipv6_pinfo *np;
322 struct sock *sk;
323 int err;
324 struct tcp_sock *tp;
325 __u32 seq;
326
327 sk = inet6_lookup(dev_net(skb->dev), &tcp_hashinfo, &hdr->daddr,
328 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
329
330 if (sk == NULL) {
331 ICMP6_INC_STATS_BH(__in6_dev_get(skb->dev), ICMP6_MIB_INERRORS);
332 return;
333 }
334
335 if (sk->sk_state == TCP_TIME_WAIT) {
336 inet_twsk_put(inet_twsk(sk));
337 return;
338 }
339
340 bh_lock_sock(sk);
341 if (sock_owned_by_user(sk))
342 NET_INC_STATS_BH(LINUX_MIB_LOCKDROPPEDICMPS);
343
344 if (sk->sk_state == TCP_CLOSE)
345 goto out;
346
347 tp = tcp_sk(sk);
348 seq = ntohl(th->seq);
349 if (sk->sk_state != TCP_LISTEN &&
350 !between(seq, tp->snd_una, tp->snd_nxt)) {
351 NET_INC_STATS_BH(LINUX_MIB_OUTOFWINDOWICMPS);
352 goto out;
353 }
354
355 np = inet6_sk(sk);
356
357 if (type == ICMPV6_PKT_TOOBIG) {
358 struct dst_entry *dst = NULL;
359
360 if (sock_owned_by_user(sk))
361 goto out;
362 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
363 goto out;
364
365 /* icmp should have updated the destination cache entry */
366 dst = __sk_dst_check(sk, np->dst_cookie);
367
368 if (dst == NULL) {
369 struct inet_sock *inet = inet_sk(sk);
370 struct flowi fl;
371
372 /* BUGGG_FUTURE: Again, it is not clear how
373 to handle rthdr case. Ignore this complexity
374 for now.
375 */
376 memset(&fl, 0, sizeof(fl));
377 fl.proto = IPPROTO_TCP;
378 ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
379 ipv6_addr_copy(&fl.fl6_src, &np->saddr);
380 fl.oif = sk->sk_bound_dev_if;
381 fl.fl_ip_dport = inet->dport;
382 fl.fl_ip_sport = inet->sport;
383 security_skb_classify_flow(skb, &fl);
384
385 if ((err = ip6_dst_lookup(sk, &dst, &fl))) {
386 sk->sk_err_soft = -err;
387 goto out;
388 }
389
390 if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0) {
391 sk->sk_err_soft = -err;
392 goto out;
393 }
394
395 } else
396 dst_hold(dst);
397
398 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
399 tcp_sync_mss(sk, dst_mtu(dst));
400 tcp_simple_retransmit(sk);
401 } /* else let the usual retransmit timer handle it */
402 dst_release(dst);
403 goto out;
404 }
405
406 icmpv6_err_convert(type, code, &err);
407
408 /* Might be for an request_sock */
409 switch (sk->sk_state) {
410 struct request_sock *req, **prev;
411 case TCP_LISTEN:
412 if (sock_owned_by_user(sk))
413 goto out;
414
415 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
416 &hdr->saddr, inet6_iif(skb));
417 if (!req)
418 goto out;
419
420 /* ICMPs are not backlogged, hence we cannot get
421 * an established socket here.
422 */
423 BUG_TRAP(req->sk == NULL);
424
425 if (seq != tcp_rsk(req)->snt_isn) {
426 NET_INC_STATS_BH(LINUX_MIB_OUTOFWINDOWICMPS);
427 goto out;
428 }
429
430 inet_csk_reqsk_queue_drop(sk, req, prev);
431 goto out;
432
433 case TCP_SYN_SENT:
434 case TCP_SYN_RECV: /* Cannot happen.
435 It can, it SYNs are crossed. --ANK */
436 if (!sock_owned_by_user(sk)) {
437 sk->sk_err = err;
438 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
439
440 tcp_done(sk);
441 } else
442 sk->sk_err_soft = err;
443 goto out;
444 }
445
446 if (!sock_owned_by_user(sk) && np->recverr) {
447 sk->sk_err = err;
448 sk->sk_error_report(sk);
449 } else
450 sk->sk_err_soft = err;
451
452 out:
453 bh_unlock_sock(sk);
454 sock_put(sk);
455 }
456
457
458 static int tcp_v6_send_synack(struct sock *sk, struct request_sock *req)
459 {
460 struct inet6_request_sock *treq = inet6_rsk(req);
461 struct ipv6_pinfo *np = inet6_sk(sk);
462 struct sk_buff * skb;
463 struct ipv6_txoptions *opt = NULL;
464 struct in6_addr * final_p = NULL, final;
465 struct flowi fl;
466 struct dst_entry *dst;
467 int err = -1;
468
469 memset(&fl, 0, sizeof(fl));
470 fl.proto = IPPROTO_TCP;
471 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
472 ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
473 fl.fl6_flowlabel = 0;
474 fl.oif = treq->iif;
475 fl.fl_ip_dport = inet_rsk(req)->rmt_port;
476 fl.fl_ip_sport = inet_sk(sk)->sport;
477 security_req_classify_flow(req, &fl);
478
479 opt = np->opt;
480 if (opt && opt->srcrt) {
481 struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
482 ipv6_addr_copy(&final, &fl.fl6_dst);
483 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
484 final_p = &final;
485 }
486
487 err = ip6_dst_lookup(sk, &dst, &fl);
488 if (err)
489 goto done;
490 if (final_p)
491 ipv6_addr_copy(&fl.fl6_dst, final_p);
492 if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
493 goto done;
494
495 skb = tcp_make_synack(sk, dst, req);
496 if (skb) {
497 struct tcphdr *th = tcp_hdr(skb);
498
499 th->check = tcp_v6_check(th, skb->len,
500 &treq->loc_addr, &treq->rmt_addr,
501 csum_partial((char *)th, skb->len, skb->csum));
502
503 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
504 err = ip6_xmit(sk, skb, &fl, opt, 0);
505 err = net_xmit_eval(err);
506 }
507
508 done:
509 if (opt && opt != np->opt)
510 sock_kfree_s(sk, opt, opt->tot_len);
511 dst_release(dst);
512 return err;
513 }
514
515 static inline void syn_flood_warning(struct sk_buff *skb)
516 {
517 #ifdef CONFIG_SYN_COOKIES
518 if (sysctl_tcp_syncookies)
519 printk(KERN_INFO
520 "TCPv6: Possible SYN flooding on port %d. "
521 "Sending cookies.\n", ntohs(tcp_hdr(skb)->dest));
522 else
523 #endif
524 printk(KERN_INFO
525 "TCPv6: Possible SYN flooding on port %d. "
526 "Dropping request.\n", ntohs(tcp_hdr(skb)->dest));
527 }
528
529 static void tcp_v6_reqsk_destructor(struct request_sock *req)
530 {
531 if (inet6_rsk(req)->pktopts)
532 kfree_skb(inet6_rsk(req)->pktopts);
533 }
534
535 #ifdef CONFIG_TCP_MD5SIG
536 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
537 struct in6_addr *addr)
538 {
539 struct tcp_sock *tp = tcp_sk(sk);
540 int i;
541
542 BUG_ON(tp == NULL);
543
544 if (!tp->md5sig_info || !tp->md5sig_info->entries6)
545 return NULL;
546
547 for (i = 0; i < tp->md5sig_info->entries6; i++) {
548 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, addr))
549 return &tp->md5sig_info->keys6[i].base;
550 }
551 return NULL;
552 }
553
554 static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
555 struct sock *addr_sk)
556 {
557 return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
558 }
559
560 static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
561 struct request_sock *req)
562 {
563 return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
564 }
565
566 static int tcp_v6_md5_do_add(struct sock *sk, struct in6_addr *peer,
567 char *newkey, u8 newkeylen)
568 {
569 /* Add key to the list */
570 struct tcp_md5sig_key *key;
571 struct tcp_sock *tp = tcp_sk(sk);
572 struct tcp6_md5sig_key *keys;
573
574 key = tcp_v6_md5_do_lookup(sk, peer);
575 if (key) {
576 /* modify existing entry - just update that one */
577 kfree(key->key);
578 key->key = newkey;
579 key->keylen = newkeylen;
580 } else {
581 /* reallocate new list if current one is full. */
582 if (!tp->md5sig_info) {
583 tp->md5sig_info = kzalloc(sizeof(*tp->md5sig_info), GFP_ATOMIC);
584 if (!tp->md5sig_info) {
585 kfree(newkey);
586 return -ENOMEM;
587 }
588 sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
589 }
590 if (tcp_alloc_md5sig_pool() == NULL) {
591 kfree(newkey);
592 return -ENOMEM;
593 }
594 if (tp->md5sig_info->alloced6 == tp->md5sig_info->entries6) {
595 keys = kmalloc((sizeof (tp->md5sig_info->keys6[0]) *
596 (tp->md5sig_info->entries6 + 1)), GFP_ATOMIC);
597
598 if (!keys) {
599 tcp_free_md5sig_pool();
600 kfree(newkey);
601 return -ENOMEM;
602 }
603
604 if (tp->md5sig_info->entries6)
605 memmove(keys, tp->md5sig_info->keys6,
606 (sizeof (tp->md5sig_info->keys6[0]) *
607 tp->md5sig_info->entries6));
608
609 kfree(tp->md5sig_info->keys6);
610 tp->md5sig_info->keys6 = keys;
611 tp->md5sig_info->alloced6++;
612 }
613
614 ipv6_addr_copy(&tp->md5sig_info->keys6[tp->md5sig_info->entries6].addr,
615 peer);
616 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.key = newkey;
617 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.keylen = newkeylen;
618
619 tp->md5sig_info->entries6++;
620 }
621 return 0;
622 }
623
624 static int tcp_v6_md5_add_func(struct sock *sk, struct sock *addr_sk,
625 u8 *newkey, __u8 newkeylen)
626 {
627 return tcp_v6_md5_do_add(sk, &inet6_sk(addr_sk)->daddr,
628 newkey, newkeylen);
629 }
630
631 static int tcp_v6_md5_do_del(struct sock *sk, struct in6_addr *peer)
632 {
633 struct tcp_sock *tp = tcp_sk(sk);
634 int i;
635
636 for (i = 0; i < tp->md5sig_info->entries6; i++) {
637 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, peer)) {
638 /* Free the key */
639 kfree(tp->md5sig_info->keys6[i].base.key);
640 tp->md5sig_info->entries6--;
641
642 if (tp->md5sig_info->entries6 == 0) {
643 kfree(tp->md5sig_info->keys6);
644 tp->md5sig_info->keys6 = NULL;
645 tp->md5sig_info->alloced6 = 0;
646 } else {
647 /* shrink the database */
648 if (tp->md5sig_info->entries6 != i)
649 memmove(&tp->md5sig_info->keys6[i],
650 &tp->md5sig_info->keys6[i+1],
651 (tp->md5sig_info->entries6 - i)
652 * sizeof (tp->md5sig_info->keys6[0]));
653 }
654 tcp_free_md5sig_pool();
655 return 0;
656 }
657 }
658 return -ENOENT;
659 }
660
661 static void tcp_v6_clear_md5_list (struct sock *sk)
662 {
663 struct tcp_sock *tp = tcp_sk(sk);
664 int i;
665
666 if (tp->md5sig_info->entries6) {
667 for (i = 0; i < tp->md5sig_info->entries6; i++)
668 kfree(tp->md5sig_info->keys6[i].base.key);
669 tp->md5sig_info->entries6 = 0;
670 tcp_free_md5sig_pool();
671 }
672
673 kfree(tp->md5sig_info->keys6);
674 tp->md5sig_info->keys6 = NULL;
675 tp->md5sig_info->alloced6 = 0;
676
677 if (tp->md5sig_info->entries4) {
678 for (i = 0; i < tp->md5sig_info->entries4; i++)
679 kfree(tp->md5sig_info->keys4[i].base.key);
680 tp->md5sig_info->entries4 = 0;
681 tcp_free_md5sig_pool();
682 }
683
684 kfree(tp->md5sig_info->keys4);
685 tp->md5sig_info->keys4 = NULL;
686 tp->md5sig_info->alloced4 = 0;
687 }
688
689 static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
690 int optlen)
691 {
692 struct tcp_md5sig cmd;
693 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
694 u8 *newkey;
695
696 if (optlen < sizeof(cmd))
697 return -EINVAL;
698
699 if (copy_from_user(&cmd, optval, sizeof(cmd)))
700 return -EFAULT;
701
702 if (sin6->sin6_family != AF_INET6)
703 return -EINVAL;
704
705 if (!cmd.tcpm_keylen) {
706 if (!tcp_sk(sk)->md5sig_info)
707 return -ENOENT;
708 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
709 return tcp_v4_md5_do_del(sk, sin6->sin6_addr.s6_addr32[3]);
710 return tcp_v6_md5_do_del(sk, &sin6->sin6_addr);
711 }
712
713 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
714 return -EINVAL;
715
716 if (!tcp_sk(sk)->md5sig_info) {
717 struct tcp_sock *tp = tcp_sk(sk);
718 struct tcp_md5sig_info *p;
719
720 p = kzalloc(sizeof(struct tcp_md5sig_info), GFP_KERNEL);
721 if (!p)
722 return -ENOMEM;
723
724 tp->md5sig_info = p;
725 sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
726 }
727
728 newkey = kmemdup(cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
729 if (!newkey)
730 return -ENOMEM;
731 if (ipv6_addr_v4mapped(&sin6->sin6_addr)) {
732 return tcp_v4_md5_do_add(sk, sin6->sin6_addr.s6_addr32[3],
733 newkey, cmd.tcpm_keylen);
734 }
735 return tcp_v6_md5_do_add(sk, &sin6->sin6_addr, newkey, cmd.tcpm_keylen);
736 }
737
738 static int tcp_v6_do_calc_md5_hash(char *md5_hash, struct tcp_md5sig_key *key,
739 struct in6_addr *saddr,
740 struct in6_addr *daddr,
741 struct tcphdr *th, unsigned int tcplen)
742 {
743 struct tcp_md5sig_pool *hp;
744 struct tcp6_pseudohdr *bp;
745 int err;
746
747 hp = tcp_get_md5sig_pool();
748 if (!hp) {
749 printk(KERN_WARNING "%s(): hash pool not found...\n", __func__);
750 goto clear_hash_noput;
751 }
752
753 bp = &hp->md5_blk.ip6;
754
755 /* 1. TCP pseudo-header (RFC2460) */
756 ipv6_addr_copy(&bp->saddr, saddr);
757 ipv6_addr_copy(&bp->daddr, daddr);
758 bp->len = htonl(tcplen);
759 bp->protocol = htonl(IPPROTO_TCP);
760
761 err = tcp_calc_md5_hash(md5_hash, key, sizeof(*bp),
762 th, tcplen, hp);
763
764 if (err)
765 goto clear_hash;
766
767 /* Free up the crypto pool */
768 tcp_put_md5sig_pool();
769 out:
770 return 0;
771 clear_hash:
772 tcp_put_md5sig_pool();
773 clear_hash_noput:
774 memset(md5_hash, 0, 16);
775 goto out;
776 }
777
778 static int tcp_v6_calc_md5_hash(char *md5_hash, struct tcp_md5sig_key *key,
779 struct sock *sk,
780 struct dst_entry *dst,
781 struct request_sock *req,
782 struct tcphdr *th, unsigned int tcplen)
783 {
784 struct in6_addr *saddr, *daddr;
785
786 if (sk) {
787 saddr = &inet6_sk(sk)->saddr;
788 daddr = &inet6_sk(sk)->daddr;
789 } else {
790 saddr = &inet6_rsk(req)->loc_addr;
791 daddr = &inet6_rsk(req)->rmt_addr;
792 }
793 return tcp_v6_do_calc_md5_hash(md5_hash, key,
794 saddr, daddr,
795 th, tcplen);
796 }
797
798 static int tcp_v6_inbound_md5_hash (struct sock *sk, struct sk_buff *skb)
799 {
800 __u8 *hash_location = NULL;
801 struct tcp_md5sig_key *hash_expected;
802 struct ipv6hdr *ip6h = ipv6_hdr(skb);
803 struct tcphdr *th = tcp_hdr(skb);
804 int genhash;
805 u8 newhash[16];
806
807 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
808 hash_location = tcp_parse_md5sig_option(th);
809
810 /* do we have a hash as expected? */
811 if (!hash_expected) {
812 if (!hash_location)
813 return 0;
814 if (net_ratelimit()) {
815 printk(KERN_INFO "MD5 Hash NOT expected but found "
816 "(" NIP6_FMT ", %u)->"
817 "(" NIP6_FMT ", %u)\n",
818 NIP6(ip6h->saddr), ntohs(th->source),
819 NIP6(ip6h->daddr), ntohs(th->dest));
820 }
821 return 1;
822 }
823
824 if (!hash_location) {
825 if (net_ratelimit()) {
826 printk(KERN_INFO "MD5 Hash expected but NOT found "
827 "(" NIP6_FMT ", %u)->"
828 "(" NIP6_FMT ", %u)\n",
829 NIP6(ip6h->saddr), ntohs(th->source),
830 NIP6(ip6h->daddr), ntohs(th->dest));
831 }
832 return 1;
833 }
834
835 /* check the signature */
836 genhash = tcp_v6_do_calc_md5_hash(newhash,
837 hash_expected,
838 &ip6h->saddr, &ip6h->daddr,
839 th, skb->len);
840 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
841 if (net_ratelimit()) {
842 printk(KERN_INFO "MD5 Hash %s for "
843 "(" NIP6_FMT ", %u)->"
844 "(" NIP6_FMT ", %u)\n",
845 genhash ? "failed" : "mismatch",
846 NIP6(ip6h->saddr), ntohs(th->source),
847 NIP6(ip6h->daddr), ntohs(th->dest));
848 }
849 return 1;
850 }
851 return 0;
852 }
853 #endif
854
855 struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
856 .family = AF_INET6,
857 .obj_size = sizeof(struct tcp6_request_sock),
858 .rtx_syn_ack = tcp_v6_send_synack,
859 .send_ack = tcp_v6_reqsk_send_ack,
860 .destructor = tcp_v6_reqsk_destructor,
861 .send_reset = tcp_v6_send_reset
862 };
863
864 #ifdef CONFIG_TCP_MD5SIG
865 static struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
866 .md5_lookup = tcp_v6_reqsk_md5_lookup,
867 };
868 #endif
869
870 static struct timewait_sock_ops tcp6_timewait_sock_ops = {
871 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
872 .twsk_unique = tcp_twsk_unique,
873 .twsk_destructor= tcp_twsk_destructor,
874 };
875
876 static void tcp_v6_send_check(struct sock *sk, int len, struct sk_buff *skb)
877 {
878 struct ipv6_pinfo *np = inet6_sk(sk);
879 struct tcphdr *th = tcp_hdr(skb);
880
881 if (skb->ip_summed == CHECKSUM_PARTIAL) {
882 th->check = ~csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP, 0);
883 skb->csum_start = skb_transport_header(skb) - skb->head;
884 skb->csum_offset = offsetof(struct tcphdr, check);
885 } else {
886 th->check = csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP,
887 csum_partial((char *)th, th->doff<<2,
888 skb->csum));
889 }
890 }
891
892 static int tcp_v6_gso_send_check(struct sk_buff *skb)
893 {
894 struct ipv6hdr *ipv6h;
895 struct tcphdr *th;
896
897 if (!pskb_may_pull(skb, sizeof(*th)))
898 return -EINVAL;
899
900 ipv6h = ipv6_hdr(skb);
901 th = tcp_hdr(skb);
902
903 th->check = 0;
904 th->check = ~csum_ipv6_magic(&ipv6h->saddr, &ipv6h->daddr, skb->len,
905 IPPROTO_TCP, 0);
906 skb->csum_start = skb_transport_header(skb) - skb->head;
907 skb->csum_offset = offsetof(struct tcphdr, check);
908 skb->ip_summed = CHECKSUM_PARTIAL;
909 return 0;
910 }
911
912 static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
913 {
914 struct tcphdr *th = tcp_hdr(skb), *t1;
915 struct sk_buff *buff;
916 struct flowi fl;
917 struct net *net = dev_net(skb->dst->dev);
918 struct sock *ctl_sk = net->ipv6.tcp_sk;
919 unsigned int tot_len = sizeof(*th);
920 #ifdef CONFIG_TCP_MD5SIG
921 struct tcp_md5sig_key *key;
922 #endif
923
924 if (th->rst)
925 return;
926
927 if (!ipv6_unicast_destination(skb))
928 return;
929
930 #ifdef CONFIG_TCP_MD5SIG
931 if (sk)
932 key = tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr);
933 else
934 key = NULL;
935
936 if (key)
937 tot_len += TCPOLEN_MD5SIG_ALIGNED;
938 #endif
939
940 /*
941 * We need to grab some memory, and put together an RST,
942 * and then put it into the queue to be sent.
943 */
944
945 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
946 GFP_ATOMIC);
947 if (buff == NULL)
948 return;
949
950 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
951
952 t1 = (struct tcphdr *) skb_push(buff, tot_len);
953
954 /* Swap the send and the receive. */
955 memset(t1, 0, sizeof(*t1));
956 t1->dest = th->source;
957 t1->source = th->dest;
958 t1->doff = tot_len / 4;
959 t1->rst = 1;
960
961 if(th->ack) {
962 t1->seq = th->ack_seq;
963 } else {
964 t1->ack = 1;
965 t1->ack_seq = htonl(ntohl(th->seq) + th->syn + th->fin
966 + skb->len - (th->doff<<2));
967 }
968
969 #ifdef CONFIG_TCP_MD5SIG
970 if (key) {
971 __be32 *opt = (__be32*)(t1 + 1);
972 opt[0] = htonl((TCPOPT_NOP << 24) |
973 (TCPOPT_NOP << 16) |
974 (TCPOPT_MD5SIG << 8) |
975 TCPOLEN_MD5SIG);
976 tcp_v6_do_calc_md5_hash((__u8 *)&opt[1], key,
977 &ipv6_hdr(skb)->daddr,
978 &ipv6_hdr(skb)->saddr,
979 t1, tot_len);
980 }
981 #endif
982
983 buff->csum = csum_partial((char *)t1, sizeof(*t1), 0);
984
985 memset(&fl, 0, sizeof(fl));
986 ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
987 ipv6_addr_copy(&fl.fl6_src, &ipv6_hdr(skb)->daddr);
988
989 t1->check = csum_ipv6_magic(&fl.fl6_src, &fl.fl6_dst,
990 sizeof(*t1), IPPROTO_TCP,
991 buff->csum);
992
993 fl.proto = IPPROTO_TCP;
994 fl.oif = inet6_iif(skb);
995 fl.fl_ip_dport = t1->dest;
996 fl.fl_ip_sport = t1->source;
997 security_skb_classify_flow(skb, &fl);
998
999 /* Pass a socket to ip6_dst_lookup either it is for RST
1000 * Underlying function will use this to retrieve the network
1001 * namespace
1002 */
1003 if (!ip6_dst_lookup(ctl_sk, &buff->dst, &fl)) {
1004
1005 if (xfrm_lookup(&buff->dst, &fl, NULL, 0) >= 0) {
1006 ip6_xmit(ctl_sk, buff, &fl, NULL, 0);
1007 TCP_INC_STATS_BH(TCP_MIB_OUTSEGS);
1008 TCP_INC_STATS_BH(TCP_MIB_OUTRSTS);
1009 return;
1010 }
1011 }
1012
1013 kfree_skb(buff);
1014 }
1015
1016 static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack, u32 win, u32 ts,
1017 struct tcp_md5sig_key *key)
1018 {
1019 struct tcphdr *th = tcp_hdr(skb), *t1;
1020 struct sk_buff *buff;
1021 struct flowi fl;
1022 struct net *net = dev_net(skb->dev);
1023 struct sock *ctl_sk = net->ipv6.tcp_sk;
1024 unsigned int tot_len = sizeof(struct tcphdr);
1025 __be32 *topt;
1026
1027 if (ts)
1028 tot_len += TCPOLEN_TSTAMP_ALIGNED;
1029 #ifdef CONFIG_TCP_MD5SIG
1030 if (key)
1031 tot_len += TCPOLEN_MD5SIG_ALIGNED;
1032 #endif
1033
1034 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
1035 GFP_ATOMIC);
1036 if (buff == NULL)
1037 return;
1038
1039 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1040
1041 t1 = (struct tcphdr *) skb_push(buff,tot_len);
1042
1043 /* Swap the send and the receive. */
1044 memset(t1, 0, sizeof(*t1));
1045 t1->dest = th->source;
1046 t1->source = th->dest;
1047 t1->doff = tot_len/4;
1048 t1->seq = htonl(seq);
1049 t1->ack_seq = htonl(ack);
1050 t1->ack = 1;
1051 t1->window = htons(win);
1052
1053 topt = (__be32 *)(t1 + 1);
1054
1055 if (ts) {
1056 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1057 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
1058 *topt++ = htonl(tcp_time_stamp);
1059 *topt = htonl(ts);
1060 }
1061
1062 #ifdef CONFIG_TCP_MD5SIG
1063 if (key) {
1064 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1065 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
1066 tcp_v6_do_calc_md5_hash((__u8 *)topt, key,
1067 &ipv6_hdr(skb)->daddr,
1068 &ipv6_hdr(skb)->saddr,
1069 t1, tot_len);
1070 }
1071 #endif
1072
1073 buff->csum = csum_partial((char *)t1, tot_len, 0);
1074
1075 memset(&fl, 0, sizeof(fl));
1076 ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
1077 ipv6_addr_copy(&fl.fl6_src, &ipv6_hdr(skb)->daddr);
1078
1079 t1->check = csum_ipv6_magic(&fl.fl6_src, &fl.fl6_dst,
1080 tot_len, IPPROTO_TCP,
1081 buff->csum);
1082
1083 fl.proto = IPPROTO_TCP;
1084 fl.oif = inet6_iif(skb);
1085 fl.fl_ip_dport = t1->dest;
1086 fl.fl_ip_sport = t1->source;
1087 security_skb_classify_flow(skb, &fl);
1088
1089 if (!ip6_dst_lookup(ctl_sk, &buff->dst, &fl)) {
1090 if (xfrm_lookup(&buff->dst, &fl, NULL, 0) >= 0) {
1091 ip6_xmit(ctl_sk, buff, &fl, NULL, 0);
1092 TCP_INC_STATS_BH(TCP_MIB_OUTSEGS);
1093 return;
1094 }
1095 }
1096
1097 kfree_skb(buff);
1098 }
1099
1100 static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
1101 {
1102 struct inet_timewait_sock *tw = inet_twsk(sk);
1103 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1104
1105 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
1106 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
1107 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw));
1108
1109 inet_twsk_put(tw);
1110 }
1111
1112 static void tcp_v6_reqsk_send_ack(struct sk_buff *skb, struct request_sock *req)
1113 {
1114 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1, req->rcv_wnd, req->ts_recent,
1115 tcp_v6_md5_do_lookup(skb->sk, &ipv6_hdr(skb)->daddr));
1116 }
1117
1118
1119 static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
1120 {
1121 struct request_sock *req, **prev;
1122 const struct tcphdr *th = tcp_hdr(skb);
1123 struct sock *nsk;
1124
1125 /* Find possible connection requests. */
1126 req = inet6_csk_search_req(sk, &prev, th->source,
1127 &ipv6_hdr(skb)->saddr,
1128 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1129 if (req)
1130 return tcp_check_req(sk, skb, req, prev);
1131
1132 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
1133 &ipv6_hdr(skb)->saddr, th->source,
1134 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1135
1136 if (nsk) {
1137 if (nsk->sk_state != TCP_TIME_WAIT) {
1138 bh_lock_sock(nsk);
1139 return nsk;
1140 }
1141 inet_twsk_put(inet_twsk(nsk));
1142 return NULL;
1143 }
1144
1145 #ifdef CONFIG_SYN_COOKIES
1146 if (!th->rst && !th->syn && th->ack)
1147 sk = cookie_v6_check(sk, skb);
1148 #endif
1149 return sk;
1150 }
1151
1152 /* FIXME: this is substantially similar to the ipv4 code.
1153 * Can some kind of merge be done? -- erics
1154 */
1155 static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
1156 {
1157 struct inet6_request_sock *treq;
1158 struct ipv6_pinfo *np = inet6_sk(sk);
1159 struct tcp_options_received tmp_opt;
1160 struct tcp_sock *tp = tcp_sk(sk);
1161 struct request_sock *req = NULL;
1162 __u32 isn = TCP_SKB_CB(skb)->when;
1163 #ifdef CONFIG_SYN_COOKIES
1164 int want_cookie = 0;
1165 #else
1166 #define want_cookie 0
1167 #endif
1168
1169 if (skb->protocol == htons(ETH_P_IP))
1170 return tcp_v4_conn_request(sk, skb);
1171
1172 if (!ipv6_unicast_destination(skb))
1173 goto drop;
1174
1175 if (inet_csk_reqsk_queue_is_full(sk) && !isn) {
1176 if (net_ratelimit())
1177 syn_flood_warning(skb);
1178 #ifdef CONFIG_SYN_COOKIES
1179 if (sysctl_tcp_syncookies)
1180 want_cookie = 1;
1181 else
1182 #endif
1183 goto drop;
1184 }
1185
1186 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1)
1187 goto drop;
1188
1189 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1190 if (req == NULL)
1191 goto drop;
1192
1193 #ifdef CONFIG_TCP_MD5SIG
1194 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
1195 #endif
1196
1197 tcp_clear_options(&tmp_opt);
1198 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1199 tmp_opt.user_mss = tp->rx_opt.user_mss;
1200
1201 tcp_parse_options(skb, &tmp_opt, 0);
1202
1203 if (want_cookie && !tmp_opt.saw_tstamp)
1204 tcp_clear_options(&tmp_opt);
1205
1206 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1207 tcp_openreq_init(req, &tmp_opt, skb);
1208
1209 treq = inet6_rsk(req);
1210 ipv6_addr_copy(&treq->rmt_addr, &ipv6_hdr(skb)->saddr);
1211 ipv6_addr_copy(&treq->loc_addr, &ipv6_hdr(skb)->daddr);
1212 if (!want_cookie)
1213 TCP_ECN_create_request(req, tcp_hdr(skb));
1214
1215 if (want_cookie) {
1216 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1217 req->cookie_ts = tmp_opt.tstamp_ok;
1218 } else if (!isn) {
1219 if (ipv6_opt_accepted(sk, skb) ||
1220 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1221 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1222 atomic_inc(&skb->users);
1223 treq->pktopts = skb;
1224 }
1225 treq->iif = sk->sk_bound_dev_if;
1226
1227 /* So that link locals have meaning */
1228 if (!sk->sk_bound_dev_if &&
1229 ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1230 treq->iif = inet6_iif(skb);
1231
1232 isn = tcp_v6_init_sequence(skb);
1233 }
1234
1235 tcp_rsk(req)->snt_isn = isn;
1236
1237 security_inet_conn_request(sk, skb, req);
1238
1239 if (tcp_v6_send_synack(sk, req))
1240 goto drop;
1241
1242 if (!want_cookie) {
1243 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1244 return 0;
1245 }
1246
1247 drop:
1248 if (req)
1249 reqsk_free(req);
1250
1251 return 0; /* don't send reset */
1252 }
1253
1254 static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
1255 struct request_sock *req,
1256 struct dst_entry *dst)
1257 {
1258 struct inet6_request_sock *treq = inet6_rsk(req);
1259 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1260 struct tcp6_sock *newtcp6sk;
1261 struct inet_sock *newinet;
1262 struct tcp_sock *newtp;
1263 struct sock *newsk;
1264 struct ipv6_txoptions *opt;
1265 #ifdef CONFIG_TCP_MD5SIG
1266 struct tcp_md5sig_key *key;
1267 #endif
1268
1269 if (skb->protocol == htons(ETH_P_IP)) {
1270 /*
1271 * v6 mapped
1272 */
1273
1274 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1275
1276 if (newsk == NULL)
1277 return NULL;
1278
1279 newtcp6sk = (struct tcp6_sock *)newsk;
1280 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1281
1282 newinet = inet_sk(newsk);
1283 newnp = inet6_sk(newsk);
1284 newtp = tcp_sk(newsk);
1285
1286 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1287
1288 ipv6_addr_set(&newnp->daddr, 0, 0, htonl(0x0000FFFF),
1289 newinet->daddr);
1290
1291 ipv6_addr_set(&newnp->saddr, 0, 0, htonl(0x0000FFFF),
1292 newinet->saddr);
1293
1294 ipv6_addr_copy(&newnp->rcv_saddr, &newnp->saddr);
1295
1296 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1297 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
1298 #ifdef CONFIG_TCP_MD5SIG
1299 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1300 #endif
1301
1302 newnp->pktoptions = NULL;
1303 newnp->opt = NULL;
1304 newnp->mcast_oif = inet6_iif(skb);
1305 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1306
1307 /*
1308 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1309 * here, tcp_create_openreq_child now does this for us, see the comment in
1310 * that function for the gory details. -acme
1311 */
1312
1313 /* It is tricky place. Until this moment IPv4 tcp
1314 worked with IPv6 icsk.icsk_af_ops.
1315 Sync it now.
1316 */
1317 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1318
1319 return newsk;
1320 }
1321
1322 opt = np->opt;
1323
1324 if (sk_acceptq_is_full(sk))
1325 goto out_overflow;
1326
1327 if (dst == NULL) {
1328 struct in6_addr *final_p = NULL, final;
1329 struct flowi fl;
1330
1331 memset(&fl, 0, sizeof(fl));
1332 fl.proto = IPPROTO_TCP;
1333 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
1334 if (opt && opt->srcrt) {
1335 struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
1336 ipv6_addr_copy(&final, &fl.fl6_dst);
1337 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
1338 final_p = &final;
1339 }
1340 ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
1341 fl.oif = sk->sk_bound_dev_if;
1342 fl.fl_ip_dport = inet_rsk(req)->rmt_port;
1343 fl.fl_ip_sport = inet_sk(sk)->sport;
1344 security_req_classify_flow(req, &fl);
1345
1346 if (ip6_dst_lookup(sk, &dst, &fl))
1347 goto out;
1348
1349 if (final_p)
1350 ipv6_addr_copy(&fl.fl6_dst, final_p);
1351
1352 if ((xfrm_lookup(&dst, &fl, sk, 0)) < 0)
1353 goto out;
1354 }
1355
1356 newsk = tcp_create_openreq_child(sk, req, skb);
1357 if (newsk == NULL)
1358 goto out;
1359
1360 /*
1361 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1362 * count here, tcp_create_openreq_child now does this for us, see the
1363 * comment in that function for the gory details. -acme
1364 */
1365
1366 newsk->sk_gso_type = SKB_GSO_TCPV6;
1367 __ip6_dst_store(newsk, dst, NULL, NULL);
1368
1369 newtcp6sk = (struct tcp6_sock *)newsk;
1370 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1371
1372 newtp = tcp_sk(newsk);
1373 newinet = inet_sk(newsk);
1374 newnp = inet6_sk(newsk);
1375
1376 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1377
1378 ipv6_addr_copy(&newnp->daddr, &treq->rmt_addr);
1379 ipv6_addr_copy(&newnp->saddr, &treq->loc_addr);
1380 ipv6_addr_copy(&newnp->rcv_saddr, &treq->loc_addr);
1381 newsk->sk_bound_dev_if = treq->iif;
1382
1383 /* Now IPv6 options...
1384
1385 First: no IPv4 options.
1386 */
1387 newinet->opt = NULL;
1388 newnp->ipv6_fl_list = NULL;
1389
1390 /* Clone RX bits */
1391 newnp->rxopt.all = np->rxopt.all;
1392
1393 /* Clone pktoptions received with SYN */
1394 newnp->pktoptions = NULL;
1395 if (treq->pktopts != NULL) {
1396 newnp->pktoptions = skb_clone(treq->pktopts, GFP_ATOMIC);
1397 kfree_skb(treq->pktopts);
1398 treq->pktopts = NULL;
1399 if (newnp->pktoptions)
1400 skb_set_owner_r(newnp->pktoptions, newsk);
1401 }
1402 newnp->opt = NULL;
1403 newnp->mcast_oif = inet6_iif(skb);
1404 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1405
1406 /* Clone native IPv6 options from listening socket (if any)
1407
1408 Yes, keeping reference count would be much more clever,
1409 but we make one more one thing there: reattach optmem
1410 to newsk.
1411 */
1412 if (opt) {
1413 newnp->opt = ipv6_dup_options(newsk, opt);
1414 if (opt != np->opt)
1415 sock_kfree_s(sk, opt, opt->tot_len);
1416 }
1417
1418 inet_csk(newsk)->icsk_ext_hdr_len = 0;
1419 if (newnp->opt)
1420 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1421 newnp->opt->opt_flen);
1422
1423 tcp_mtup_init(newsk);
1424 tcp_sync_mss(newsk, dst_mtu(dst));
1425 newtp->advmss = dst_metric(dst, RTAX_ADVMSS);
1426 tcp_initialize_rcv_mss(newsk);
1427
1428 newinet->daddr = newinet->saddr = newinet->rcv_saddr = LOOPBACK4_IPV6;
1429
1430 #ifdef CONFIG_TCP_MD5SIG
1431 /* Copy over the MD5 key from the original socket */
1432 if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1433 /* We're using one, so create a matching key
1434 * on the newsk structure. If we fail to get
1435 * memory, then we end up not copying the key
1436 * across. Shucks.
1437 */
1438 char *newkey = kmemdup(key->key, key->keylen, GFP_ATOMIC);
1439 if (newkey != NULL)
1440 tcp_v6_md5_do_add(newsk, &inet6_sk(sk)->daddr,
1441 newkey, key->keylen);
1442 }
1443 #endif
1444
1445 __inet6_hash(newsk);
1446 __inet_inherit_port(sk, newsk);
1447
1448 return newsk;
1449
1450 out_overflow:
1451 NET_INC_STATS_BH(LINUX_MIB_LISTENOVERFLOWS);
1452 out:
1453 NET_INC_STATS_BH(LINUX_MIB_LISTENDROPS);
1454 if (opt && opt != np->opt)
1455 sock_kfree_s(sk, opt, opt->tot_len);
1456 dst_release(dst);
1457 return NULL;
1458 }
1459
1460 static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1461 {
1462 if (skb->ip_summed == CHECKSUM_COMPLETE) {
1463 if (!tcp_v6_check(tcp_hdr(skb), skb->len, &ipv6_hdr(skb)->saddr,
1464 &ipv6_hdr(skb)->daddr, skb->csum)) {
1465 skb->ip_summed = CHECKSUM_UNNECESSARY;
1466 return 0;
1467 }
1468 }
1469
1470 skb->csum = ~csum_unfold(tcp_v6_check(tcp_hdr(skb), skb->len,
1471 &ipv6_hdr(skb)->saddr,
1472 &ipv6_hdr(skb)->daddr, 0));
1473
1474 if (skb->len <= 76) {
1475 return __skb_checksum_complete(skb);
1476 }
1477 return 0;
1478 }
1479
1480 /* The socket must have it's spinlock held when we get
1481 * here.
1482 *
1483 * We have a potential double-lock case here, so even when
1484 * doing backlog processing we use the BH locking scheme.
1485 * This is because we cannot sleep with the original spinlock
1486 * held.
1487 */
1488 static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1489 {
1490 struct ipv6_pinfo *np = inet6_sk(sk);
1491 struct tcp_sock *tp;
1492 struct sk_buff *opt_skb = NULL;
1493
1494 /* Imagine: socket is IPv6. IPv4 packet arrives,
1495 goes to IPv4 receive handler and backlogged.
1496 From backlog it always goes here. Kerboom...
1497 Fortunately, tcp_rcv_established and rcv_established
1498 handle them correctly, but it is not case with
1499 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1500 */
1501
1502 if (skb->protocol == htons(ETH_P_IP))
1503 return tcp_v4_do_rcv(sk, skb);
1504
1505 #ifdef CONFIG_TCP_MD5SIG
1506 if (tcp_v6_inbound_md5_hash (sk, skb))
1507 goto discard;
1508 #endif
1509
1510 if (sk_filter(sk, skb))
1511 goto discard;
1512
1513 /*
1514 * socket locking is here for SMP purposes as backlog rcv
1515 * is currently called with bh processing disabled.
1516 */
1517
1518 /* Do Stevens' IPV6_PKTOPTIONS.
1519
1520 Yes, guys, it is the only place in our code, where we
1521 may make it not affecting IPv4.
1522 The rest of code is protocol independent,
1523 and I do not like idea to uglify IPv4.
1524
1525 Actually, all the idea behind IPV6_PKTOPTIONS
1526 looks not very well thought. For now we latch
1527 options, received in the last packet, enqueued
1528 by tcp. Feel free to propose better solution.
1529 --ANK (980728)
1530 */
1531 if (np->rxopt.all)
1532 opt_skb = skb_clone(skb, GFP_ATOMIC);
1533
1534 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
1535 TCP_CHECK_TIMER(sk);
1536 if (tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len))
1537 goto reset;
1538 TCP_CHECK_TIMER(sk);
1539 if (opt_skb)
1540 goto ipv6_pktoptions;
1541 return 0;
1542 }
1543
1544 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1545 goto csum_err;
1546
1547 if (sk->sk_state == TCP_LISTEN) {
1548 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1549 if (!nsk)
1550 goto discard;
1551
1552 /*
1553 * Queue it on the new socket if the new socket is active,
1554 * otherwise we just shortcircuit this and continue with
1555 * the new socket..
1556 */
1557 if(nsk != sk) {
1558 if (tcp_child_process(sk, nsk, skb))
1559 goto reset;
1560 if (opt_skb)
1561 __kfree_skb(opt_skb);
1562 return 0;
1563 }
1564 }
1565
1566 TCP_CHECK_TIMER(sk);
1567 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1568 goto reset;
1569 TCP_CHECK_TIMER(sk);
1570 if (opt_skb)
1571 goto ipv6_pktoptions;
1572 return 0;
1573
1574 reset:
1575 tcp_v6_send_reset(sk, skb);
1576 discard:
1577 if (opt_skb)
1578 __kfree_skb(opt_skb);
1579 kfree_skb(skb);
1580 return 0;
1581 csum_err:
1582 TCP_INC_STATS_BH(TCP_MIB_INERRS);
1583 goto discard;
1584
1585
1586 ipv6_pktoptions:
1587 /* Do you ask, what is it?
1588
1589 1. skb was enqueued by tcp.
1590 2. skb is added to tail of read queue, rather than out of order.
1591 3. socket is not in passive state.
1592 4. Finally, it really contains options, which user wants to receive.
1593 */
1594 tp = tcp_sk(sk);
1595 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1596 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
1597 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
1598 np->mcast_oif = inet6_iif(opt_skb);
1599 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
1600 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
1601 if (ipv6_opt_accepted(sk, opt_skb)) {
1602 skb_set_owner_r(opt_skb, sk);
1603 opt_skb = xchg(&np->pktoptions, opt_skb);
1604 } else {
1605 __kfree_skb(opt_skb);
1606 opt_skb = xchg(&np->pktoptions, NULL);
1607 }
1608 }
1609
1610 if (opt_skb)
1611 kfree_skb(opt_skb);
1612 return 0;
1613 }
1614
1615 static int tcp_v6_rcv(struct sk_buff *skb)
1616 {
1617 struct tcphdr *th;
1618 struct sock *sk;
1619 int ret;
1620
1621 if (skb->pkt_type != PACKET_HOST)
1622 goto discard_it;
1623
1624 /*
1625 * Count it even if it's bad.
1626 */
1627 TCP_INC_STATS_BH(TCP_MIB_INSEGS);
1628
1629 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1630 goto discard_it;
1631
1632 th = tcp_hdr(skb);
1633
1634 if (th->doff < sizeof(struct tcphdr)/4)
1635 goto bad_packet;
1636 if (!pskb_may_pull(skb, th->doff*4))
1637 goto discard_it;
1638
1639 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
1640 goto bad_packet;
1641
1642 th = tcp_hdr(skb);
1643 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1644 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1645 skb->len - th->doff*4);
1646 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1647 TCP_SKB_CB(skb)->when = 0;
1648 TCP_SKB_CB(skb)->flags = ipv6_get_dsfield(ipv6_hdr(skb));
1649 TCP_SKB_CB(skb)->sacked = 0;
1650
1651 sk = __inet6_lookup(dev_net(skb->dev), &tcp_hashinfo,
1652 &ipv6_hdr(skb)->saddr, th->source,
1653 &ipv6_hdr(skb)->daddr, ntohs(th->dest),
1654 inet6_iif(skb));
1655
1656 if (!sk)
1657 goto no_tcp_socket;
1658
1659 process:
1660 if (sk->sk_state == TCP_TIME_WAIT)
1661 goto do_time_wait;
1662
1663 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1664 goto discard_and_relse;
1665
1666 if (sk_filter(sk, skb))
1667 goto discard_and_relse;
1668
1669 skb->dev = NULL;
1670
1671 bh_lock_sock_nested(sk);
1672 ret = 0;
1673 if (!sock_owned_by_user(sk)) {
1674 #ifdef CONFIG_NET_DMA
1675 struct tcp_sock *tp = tcp_sk(sk);
1676 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
1677 tp->ucopy.dma_chan = get_softnet_dma();
1678 if (tp->ucopy.dma_chan)
1679 ret = tcp_v6_do_rcv(sk, skb);
1680 else
1681 #endif
1682 {
1683 if (!tcp_prequeue(sk, skb))
1684 ret = tcp_v6_do_rcv(sk, skb);
1685 }
1686 } else
1687 sk_add_backlog(sk, skb);
1688 bh_unlock_sock(sk);
1689
1690 sock_put(sk);
1691 return ret ? -1 : 0;
1692
1693 no_tcp_socket:
1694 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1695 goto discard_it;
1696
1697 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1698 bad_packet:
1699 TCP_INC_STATS_BH(TCP_MIB_INERRS);
1700 } else {
1701 tcp_v6_send_reset(NULL, skb);
1702 }
1703
1704 discard_it:
1705
1706 /*
1707 * Discard frame
1708 */
1709
1710 kfree_skb(skb);
1711 return 0;
1712
1713 discard_and_relse:
1714 sock_put(sk);
1715 goto discard_it;
1716
1717 do_time_wait:
1718 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
1719 inet_twsk_put(inet_twsk(sk));
1720 goto discard_it;
1721 }
1722
1723 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1724 TCP_INC_STATS_BH(TCP_MIB_INERRS);
1725 inet_twsk_put(inet_twsk(sk));
1726 goto discard_it;
1727 }
1728
1729 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1730 case TCP_TW_SYN:
1731 {
1732 struct sock *sk2;
1733
1734 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
1735 &ipv6_hdr(skb)->daddr,
1736 ntohs(th->dest), inet6_iif(skb));
1737 if (sk2 != NULL) {
1738 struct inet_timewait_sock *tw = inet_twsk(sk);
1739 inet_twsk_deschedule(tw, &tcp_death_row);
1740 inet_twsk_put(tw);
1741 sk = sk2;
1742 goto process;
1743 }
1744 /* Fall through to ACK */
1745 }
1746 case TCP_TW_ACK:
1747 tcp_v6_timewait_ack(sk, skb);
1748 break;
1749 case TCP_TW_RST:
1750 goto no_tcp_socket;
1751 case TCP_TW_SUCCESS:;
1752 }
1753 goto discard_it;
1754 }
1755
1756 static int tcp_v6_remember_stamp(struct sock *sk)
1757 {
1758 /* Alas, not yet... */
1759 return 0;
1760 }
1761
1762 static struct inet_connection_sock_af_ops ipv6_specific = {
1763 .queue_xmit = inet6_csk_xmit,
1764 .send_check = tcp_v6_send_check,
1765 .rebuild_header = inet6_sk_rebuild_header,
1766 .conn_request = tcp_v6_conn_request,
1767 .syn_recv_sock = tcp_v6_syn_recv_sock,
1768 .remember_stamp = tcp_v6_remember_stamp,
1769 .net_header_len = sizeof(struct ipv6hdr),
1770 .setsockopt = ipv6_setsockopt,
1771 .getsockopt = ipv6_getsockopt,
1772 .addr2sockaddr = inet6_csk_addr2sockaddr,
1773 .sockaddr_len = sizeof(struct sockaddr_in6),
1774 .bind_conflict = inet6_csk_bind_conflict,
1775 #ifdef CONFIG_COMPAT
1776 .compat_setsockopt = compat_ipv6_setsockopt,
1777 .compat_getsockopt = compat_ipv6_getsockopt,
1778 #endif
1779 };
1780
1781 #ifdef CONFIG_TCP_MD5SIG
1782 static struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
1783 .md5_lookup = tcp_v6_md5_lookup,
1784 .calc_md5_hash = tcp_v6_calc_md5_hash,
1785 .md5_add = tcp_v6_md5_add_func,
1786 .md5_parse = tcp_v6_parse_md5_keys,
1787 };
1788 #endif
1789
1790 /*
1791 * TCP over IPv4 via INET6 API
1792 */
1793
1794 static struct inet_connection_sock_af_ops ipv6_mapped = {
1795 .queue_xmit = ip_queue_xmit,
1796 .send_check = tcp_v4_send_check,
1797 .rebuild_header = inet_sk_rebuild_header,
1798 .conn_request = tcp_v6_conn_request,
1799 .syn_recv_sock = tcp_v6_syn_recv_sock,
1800 .remember_stamp = tcp_v4_remember_stamp,
1801 .net_header_len = sizeof(struct iphdr),
1802 .setsockopt = ipv6_setsockopt,
1803 .getsockopt = ipv6_getsockopt,
1804 .addr2sockaddr = inet6_csk_addr2sockaddr,
1805 .sockaddr_len = sizeof(struct sockaddr_in6),
1806 .bind_conflict = inet6_csk_bind_conflict,
1807 #ifdef CONFIG_COMPAT
1808 .compat_setsockopt = compat_ipv6_setsockopt,
1809 .compat_getsockopt = compat_ipv6_getsockopt,
1810 #endif
1811 };
1812
1813 #ifdef CONFIG_TCP_MD5SIG
1814 static struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
1815 .md5_lookup = tcp_v4_md5_lookup,
1816 .calc_md5_hash = tcp_v4_calc_md5_hash,
1817 .md5_add = tcp_v6_md5_add_func,
1818 .md5_parse = tcp_v6_parse_md5_keys,
1819 };
1820 #endif
1821
1822 /* NOTE: A lot of things set to zero explicitly by call to
1823 * sk_alloc() so need not be done here.
1824 */
1825 static int tcp_v6_init_sock(struct sock *sk)
1826 {
1827 struct inet_connection_sock *icsk = inet_csk(sk);
1828 struct tcp_sock *tp = tcp_sk(sk);
1829
1830 skb_queue_head_init(&tp->out_of_order_queue);
1831 tcp_init_xmit_timers(sk);
1832 tcp_prequeue_init(tp);
1833
1834 icsk->icsk_rto = TCP_TIMEOUT_INIT;
1835 tp->mdev = TCP_TIMEOUT_INIT;
1836
1837 /* So many TCP implementations out there (incorrectly) count the
1838 * initial SYN frame in their delayed-ACK and congestion control
1839 * algorithms that we must have the following bandaid to talk
1840 * efficiently to them. -DaveM
1841 */
1842 tp->snd_cwnd = 2;
1843
1844 /* See draft-stevens-tcpca-spec-01 for discussion of the
1845 * initialization of these values.
1846 */
1847 tp->snd_ssthresh = 0x7fffffff;
1848 tp->snd_cwnd_clamp = ~0;
1849 tp->mss_cache = 536;
1850
1851 tp->reordering = sysctl_tcp_reordering;
1852
1853 sk->sk_state = TCP_CLOSE;
1854
1855 icsk->icsk_af_ops = &ipv6_specific;
1856 icsk->icsk_ca_ops = &tcp_init_congestion_ops;
1857 icsk->icsk_sync_mss = tcp_sync_mss;
1858 sk->sk_write_space = sk_stream_write_space;
1859 sock_set_flag(sk, SOCK_USE_WRITE_QUEUE);
1860
1861 #ifdef CONFIG_TCP_MD5SIG
1862 tp->af_specific = &tcp_sock_ipv6_specific;
1863 #endif
1864
1865 sk->sk_sndbuf = sysctl_tcp_wmem[1];
1866 sk->sk_rcvbuf = sysctl_tcp_rmem[1];
1867
1868 atomic_inc(&tcp_sockets_allocated);
1869
1870 return 0;
1871 }
1872
1873 static void tcp_v6_destroy_sock(struct sock *sk)
1874 {
1875 #ifdef CONFIG_TCP_MD5SIG
1876 /* Clean up the MD5 key list */
1877 if (tcp_sk(sk)->md5sig_info)
1878 tcp_v6_clear_md5_list(sk);
1879 #endif
1880 tcp_v4_destroy_sock(sk);
1881 inet6_destroy_sock(sk);
1882 }
1883
1884 #ifdef CONFIG_PROC_FS
1885 /* Proc filesystem TCPv6 sock list dumping. */
1886 static void get_openreq6(struct seq_file *seq,
1887 struct sock *sk, struct request_sock *req, int i, int uid)
1888 {
1889 int ttd = req->expires - jiffies;
1890 struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1891 struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
1892
1893 if (ttd < 0)
1894 ttd = 0;
1895
1896 seq_printf(seq,
1897 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1898 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
1899 i,
1900 src->s6_addr32[0], src->s6_addr32[1],
1901 src->s6_addr32[2], src->s6_addr32[3],
1902 ntohs(inet_sk(sk)->sport),
1903 dest->s6_addr32[0], dest->s6_addr32[1],
1904 dest->s6_addr32[2], dest->s6_addr32[3],
1905 ntohs(inet_rsk(req)->rmt_port),
1906 TCP_SYN_RECV,
1907 0,0, /* could print option size, but that is af dependent. */
1908 1, /* timers active (only the expire timer) */
1909 jiffies_to_clock_t(ttd),
1910 req->retrans,
1911 uid,
1912 0, /* non standard timer */
1913 0, /* open_requests have no inode */
1914 0, req);
1915 }
1916
1917 static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1918 {
1919 struct in6_addr *dest, *src;
1920 __u16 destp, srcp;
1921 int timer_active;
1922 unsigned long timer_expires;
1923 struct inet_sock *inet = inet_sk(sp);
1924 struct tcp_sock *tp = tcp_sk(sp);
1925 const struct inet_connection_sock *icsk = inet_csk(sp);
1926 struct ipv6_pinfo *np = inet6_sk(sp);
1927
1928 dest = &np->daddr;
1929 src = &np->rcv_saddr;
1930 destp = ntohs(inet->dport);
1931 srcp = ntohs(inet->sport);
1932
1933 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1934 timer_active = 1;
1935 timer_expires = icsk->icsk_timeout;
1936 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1937 timer_active = 4;
1938 timer_expires = icsk->icsk_timeout;
1939 } else if (timer_pending(&sp->sk_timer)) {
1940 timer_active = 2;
1941 timer_expires = sp->sk_timer.expires;
1942 } else {
1943 timer_active = 0;
1944 timer_expires = jiffies;
1945 }
1946
1947 seq_printf(seq,
1948 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1949 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %p %lu %lu %u %u %d\n",
1950 i,
1951 src->s6_addr32[0], src->s6_addr32[1],
1952 src->s6_addr32[2], src->s6_addr32[3], srcp,
1953 dest->s6_addr32[0], dest->s6_addr32[1],
1954 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1955 sp->sk_state,
1956 tp->write_seq-tp->snd_una,
1957 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1958 timer_active,
1959 jiffies_to_clock_t(timer_expires - jiffies),
1960 icsk->icsk_retransmits,
1961 sock_i_uid(sp),
1962 icsk->icsk_probes_out,
1963 sock_i_ino(sp),
1964 atomic_read(&sp->sk_refcnt), sp,
1965 jiffies_to_clock_t(icsk->icsk_rto),
1966 jiffies_to_clock_t(icsk->icsk_ack.ato),
1967 (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
1968 tp->snd_cwnd, tp->snd_ssthresh>=0xFFFF?-1:tp->snd_ssthresh
1969 );
1970 }
1971
1972 static void get_timewait6_sock(struct seq_file *seq,
1973 struct inet_timewait_sock *tw, int i)
1974 {
1975 struct in6_addr *dest, *src;
1976 __u16 destp, srcp;
1977 struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
1978 int ttd = tw->tw_ttd - jiffies;
1979
1980 if (ttd < 0)
1981 ttd = 0;
1982
1983 dest = &tw6->tw_v6_daddr;
1984 src = &tw6->tw_v6_rcv_saddr;
1985 destp = ntohs(tw->tw_dport);
1986 srcp = ntohs(tw->tw_sport);
1987
1988 seq_printf(seq,
1989 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1990 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
1991 i,
1992 src->s6_addr32[0], src->s6_addr32[1],
1993 src->s6_addr32[2], src->s6_addr32[3], srcp,
1994 dest->s6_addr32[0], dest->s6_addr32[1],
1995 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1996 tw->tw_substate, 0, 0,
1997 3, jiffies_to_clock_t(ttd), 0, 0, 0, 0,
1998 atomic_read(&tw->tw_refcnt), tw);
1999 }
2000
2001 static int tcp6_seq_show(struct seq_file *seq, void *v)
2002 {
2003 struct tcp_iter_state *st;
2004
2005 if (v == SEQ_START_TOKEN) {
2006 seq_puts(seq,
2007 " sl "
2008 "local_address "
2009 "remote_address "
2010 "st tx_queue rx_queue tr tm->when retrnsmt"
2011 " uid timeout inode\n");
2012 goto out;
2013 }
2014 st = seq->private;
2015
2016 switch (st->state) {
2017 case TCP_SEQ_STATE_LISTENING:
2018 case TCP_SEQ_STATE_ESTABLISHED:
2019 get_tcp6_sock(seq, v, st->num);
2020 break;
2021 case TCP_SEQ_STATE_OPENREQ:
2022 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
2023 break;
2024 case TCP_SEQ_STATE_TIME_WAIT:
2025 get_timewait6_sock(seq, v, st->num);
2026 break;
2027 }
2028 out:
2029 return 0;
2030 }
2031
2032 static struct tcp_seq_afinfo tcp6_seq_afinfo = {
2033 .name = "tcp6",
2034 .family = AF_INET6,
2035 .seq_fops = {
2036 .owner = THIS_MODULE,
2037 },
2038 .seq_ops = {
2039 .show = tcp6_seq_show,
2040 },
2041 };
2042
2043 int tcp6_proc_init(struct net *net)
2044 {
2045 return tcp_proc_register(net, &tcp6_seq_afinfo);
2046 }
2047
2048 void tcp6_proc_exit(struct net *net)
2049 {
2050 tcp_proc_unregister(net, &tcp6_seq_afinfo);
2051 }
2052 #endif
2053
2054 struct proto tcpv6_prot = {
2055 .name = "TCPv6",
2056 .owner = THIS_MODULE,
2057 .close = tcp_close,
2058 .connect = tcp_v6_connect,
2059 .disconnect = tcp_disconnect,
2060 .accept = inet_csk_accept,
2061 .ioctl = tcp_ioctl,
2062 .init = tcp_v6_init_sock,
2063 .destroy = tcp_v6_destroy_sock,
2064 .shutdown = tcp_shutdown,
2065 .setsockopt = tcp_setsockopt,
2066 .getsockopt = tcp_getsockopt,
2067 .recvmsg = tcp_recvmsg,
2068 .backlog_rcv = tcp_v6_do_rcv,
2069 .hash = tcp_v6_hash,
2070 .unhash = inet_unhash,
2071 .get_port = inet_csk_get_port,
2072 .enter_memory_pressure = tcp_enter_memory_pressure,
2073 .sockets_allocated = &tcp_sockets_allocated,
2074 .memory_allocated = &tcp_memory_allocated,
2075 .memory_pressure = &tcp_memory_pressure,
2076 .orphan_count = &tcp_orphan_count,
2077 .sysctl_mem = sysctl_tcp_mem,
2078 .sysctl_wmem = sysctl_tcp_wmem,
2079 .sysctl_rmem = sysctl_tcp_rmem,
2080 .max_header = MAX_TCP_HEADER,
2081 .obj_size = sizeof(struct tcp6_sock),
2082 .twsk_prot = &tcp6_timewait_sock_ops,
2083 .rsk_prot = &tcp6_request_sock_ops,
2084 .h.hashinfo = &tcp_hashinfo,
2085 #ifdef CONFIG_COMPAT
2086 .compat_setsockopt = compat_tcp_setsockopt,
2087 .compat_getsockopt = compat_tcp_getsockopt,
2088 #endif
2089 };
2090
2091 static struct inet6_protocol tcpv6_protocol = {
2092 .handler = tcp_v6_rcv,
2093 .err_handler = tcp_v6_err,
2094 .gso_send_check = tcp_v6_gso_send_check,
2095 .gso_segment = tcp_tso_segment,
2096 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
2097 };
2098
2099 static struct inet_protosw tcpv6_protosw = {
2100 .type = SOCK_STREAM,
2101 .protocol = IPPROTO_TCP,
2102 .prot = &tcpv6_prot,
2103 .ops = &inet6_stream_ops,
2104 .capability = -1,
2105 .no_check = 0,
2106 .flags = INET_PROTOSW_PERMANENT |
2107 INET_PROTOSW_ICSK,
2108 };
2109
2110 static int tcpv6_net_init(struct net *net)
2111 {
2112 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
2113 SOCK_RAW, IPPROTO_TCP, net);
2114 }
2115
2116 static void tcpv6_net_exit(struct net *net)
2117 {
2118 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
2119 }
2120
2121 static struct pernet_operations tcpv6_net_ops = {
2122 .init = tcpv6_net_init,
2123 .exit = tcpv6_net_exit,
2124 };
2125
2126 int __init tcpv6_init(void)
2127 {
2128 int ret;
2129
2130 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2131 if (ret)
2132 goto out;
2133
2134 /* register inet6 protocol */
2135 ret = inet6_register_protosw(&tcpv6_protosw);
2136 if (ret)
2137 goto out_tcpv6_protocol;
2138
2139 ret = register_pernet_subsys(&tcpv6_net_ops);
2140 if (ret)
2141 goto out_tcpv6_protosw;
2142 out:
2143 return ret;
2144
2145 out_tcpv6_protocol:
2146 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2147 out_tcpv6_protosw:
2148 inet6_unregister_protosw(&tcpv6_protosw);
2149 goto out;
2150 }
2151
2152 void tcpv6_exit(void)
2153 {
2154 unregister_pernet_subsys(&tcpv6_net_ops);
2155 inet6_unregister_protosw(&tcpv6_protosw);
2156 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2157 }
This page took 0.100062 seconds and 6 git commands to generate.