3 * Linux INET6 implementation
6 * Pedro Roque <roque@di.fc.ul.pt>
10 * linux/net/ipv4/tcp_input.c
11 * linux/net/ipv4/tcp_output.c
14 * Hideaki YOSHIFUJI : sin6_scope_id support
15 * YOSHIFUJI Hideaki @USAGI and: Support IPV6_V6ONLY socket option, which
16 * Alexey Kuznetsov allow both IPv4 and IPv6 sockets to bind
17 * a single port at the same time.
18 * YOSHIFUJI Hideaki @USAGI: convert /proc/net/tcp6 to seq_file.
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * as published by the Free Software Foundation; either version
23 * 2 of the License, or (at your option) any later version.
26 #include <linux/bottom_half.h>
27 #include <linux/module.h>
28 #include <linux/errno.h>
29 #include <linux/types.h>
30 #include <linux/socket.h>
31 #include <linux/sockios.h>
32 #include <linux/net.h>
33 #include <linux/jiffies.h>
35 #include <linux/in6.h>
36 #include <linux/netdevice.h>
37 #include <linux/init.h>
38 #include <linux/jhash.h>
39 #include <linux/ipsec.h>
40 #include <linux/times.h>
41 #include <linux/slab.h>
43 #include <linux/ipv6.h>
44 #include <linux/icmpv6.h>
45 #include <linux/random.h>
48 #include <net/ndisc.h>
49 #include <net/inet6_hashtables.h>
50 #include <net/inet6_connection_sock.h>
52 #include <net/transp_v6.h>
53 #include <net/addrconf.h>
54 #include <net/ip6_route.h>
55 #include <net/ip6_checksum.h>
56 #include <net/inet_ecn.h>
57 #include <net/protocol.h>
60 #include <net/dsfield.h>
61 #include <net/timewait_sock.h>
62 #include <net/netdma.h>
63 #include <net/inet_common.h>
64 #include <net/secure_seq.h>
66 #include <asm/uaccess.h>
68 #include <linux/proc_fs.h>
69 #include <linux/seq_file.h>
71 #include <linux/crypto.h>
72 #include <linux/scatterlist.h>
/*
 * Forward declarations for handlers and operation tables that are used
 * before their definitions appear, or whose definitions lie outside the
 * visible part of this listing.
 */
74 static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
75 static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
76 struct request_sock *req);
78 static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
79 static void __tcp_v6_send_check(struct sk_buff *skb,
80 const struct in6_addr *saddr,
81 const struct in6_addr *daddr);
/*
 * Address-family operation tables. tcp_v6_connect() installs ipv6_mapped
 * for v4-mapped destinations and ipv6_specific otherwise.
 */
83 static const struct inet_connection_sock_af_ops ipv6_mapped;
84 static const struct inet_connection_sock_af_ops ipv6_specific;
/* The MD5 signature tables exist only when CONFIG_TCP_MD5SIG is set. */
85 #ifdef CONFIG_TCP_MD5SIG
86 static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
87 static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
/*
 * NOTE(review): the lines following this signature are not visible in this
 * listing, so it cannot be told from here whether this is a declaration or
 * a stub definition - confirm against the full file.
 */
89 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
90 const struct in6_addr *addr)
/*
 * tcp_v6_hash - hash a TCP/IPv6 socket.
 * @sk: socket to hash
 *
 * Nothing is done for a socket in TCP_CLOSE. A socket whose af_ops is
 * ipv6_mapped takes a separate branch whose body is not visible in this
 * listing; the visible hashing call is __inet6_hash(sk, NULL).
 */
96 static void tcp_v6_hash(struct sock *sk)
98 if (sk->sk_state != TCP_CLOSE) {
99 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
104 __inet6_hash(sk, NULL);
/*
 * tcp_v6_check - TCP checksum helper for IPv6.
 * @len:   length passed on to csum_ipv6_magic()
 * @saddr: IPv6 source address
 * @daddr: IPv6 destination address
 *
 * Thin wrapper around csum_ipv6_magic() with the protocol fixed to
 * IPPROTO_TCP. The last argument (base) is declared on a line that is not
 * visible in this listing. Returns the resulting __sum16.
 */
109 static __inline__ __sum16 tcp_v6_check(int len,
110 const struct in6_addr *saddr,
111 const struct in6_addr *daddr,
114 return csum_ipv6_magic(saddr, daddr, len, IPPROTO_TCP, base);
/*
 * tcp_v6_init_sequence - pick an initial sequence number for a reply to @skb.
 * @skb: received segment
 *
 * Feeds the IPv6 destination and source addresses of @skb and its TCP
 * source port to secure_tcpv6_sequence_number(). One argument line of the
 * call is not visible in this listing.
 */
117 static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
119 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
120 ipv6_hdr(skb)->saddr.s6_addr32,
122 tcp_hdr(skb)->source);
/*
 * tcp_v6_connect - start an active open towards an IPv6 destination.
 * @sk:    connecting socket
 * @uaddr: destination, interpreted as struct sockaddr_in6
 * (a third parameter, addr_len, is used below but declared on a line that
 * is not visible in this listing)
 *
 * Visible steps, in order:
 *  - check addr_len against SIN6_LEN_RFC2133 and require AF_INET6
 *    (-EAFNOSUPPORT otherwise);
 *  - if the flow info carries a flow label, look it up with
 *    fl6_sock_lookup() and overwrite the destination with the label dst;
 *  - map the any-address to loopback by setting the last address byte to 1;
 *  - for link-local destinations take the interface from sin6_scope_id when
 *    supplied, and require a bound interface;
 *  - forget the remembered timestamp state when the destination changes;
 *  - for v4-mapped destinations switch the socket to the ipv6_mapped ops
 *    and delegate to tcp_v4_connect();
 *  - otherwise fill a flowi6, route it with ip6_dst_lookup_flow(), store
 *    the route, optionally seed ts_recent from the inet_peer entry when
 *    sysctl_tw_recycle is on, then enter TCP_SYN_SENT, call
 *    inet6_hash_connect(), choose write_seq and call tcp_connect().
 *
 * NOTE(review): several source lines (returns, labels, braces, some
 * declarations) are missing from this listing; error codes other than
 * -EAFNOSUPPORT cannot be confirmed from the visible text.
 */
125 static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
128 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
129 struct inet_sock *inet = inet_sk(sk);
130 struct inet_connection_sock *icsk = inet_csk(sk);
131 struct ipv6_pinfo *np = inet6_sk(sk);
132 struct tcp_sock *tp = tcp_sk(sk);
133 struct in6_addr *saddr = NULL, *final_p, final;
136 struct dst_entry *dst;
/* Validate the caller-supplied address length and family. */
140 if (addr_len < SIN6_LEN_RFC2133)
143 if (usin->sin6_family != AF_INET6)
144 return -EAFNOSUPPORT;
146 memset(&fl6, 0, sizeof(fl6));
/* Flow label handling: a labelled flow takes its destination from the label. */
149 fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
150 IP6_ECN_flow_init(fl6.flowlabel);
151 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
152 struct ip6_flowlabel *flowlabel;
153 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
154 if (flowlabel == NULL)
156 ipv6_addr_copy(&usin->sin6_addr, &flowlabel->dst);
157 fl6_sock_release(flowlabel);
162 * connect() to INADDR_ANY means loopback (BSD'ism).
165 if(ipv6_addr_any(&usin->sin6_addr))
166 usin->sin6_addr.s6_addr[15] = 0x1;
168 addr_type = ipv6_addr_type(&usin->sin6_addr);
170 if(addr_type & IPV6_ADDR_MULTICAST)
173 if (addr_type&IPV6_ADDR_LINKLOCAL) {
174 if (addr_len >= sizeof(struct sockaddr_in6) &&
175 usin->sin6_scope_id) {
176 /* If interface is set while binding, indices
179 if (sk->sk_bound_dev_if &&
180 sk->sk_bound_dev_if != usin->sin6_scope_id)
183 sk->sk_bound_dev_if = usin->sin6_scope_id;
186 /* Connect to link-local address requires an interface */
187 if (!sk->sk_bound_dev_if)
191 if (tp->rx_opt.ts_recent_stamp &&
192 !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
193 tp->rx_opt.ts_recent = 0;
194 tp->rx_opt.ts_recent_stamp = 0;
198 ipv6_addr_copy(&np->daddr, &usin->sin6_addr);
199 np->flow_label = fl6.flowlabel;
205 if (addr_type == IPV6_ADDR_MAPPED) {
206 u32 exthdrlen = icsk->icsk_ext_hdr_len;
207 struct sockaddr_in sin;
209 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
211 if (__ipv6_only_sock(sk))
214 sin.sin_family = AF_INET;
215 sin.sin_port = usin->sin6_port;
216 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
218 icsk->icsk_af_ops = &ipv6_mapped;
219 sk->sk_backlog_rcv = tcp_v4_do_rcv;
220 #ifdef CONFIG_TCP_MD5SIG
221 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
224 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
227 icsk->icsk_ext_hdr_len = exthdrlen;
228 icsk->icsk_af_ops = &ipv6_specific;
229 sk->sk_backlog_rcv = tcp_v6_do_rcv;
230 #ifdef CONFIG_TCP_MD5SIG
231 tp->af_specific = &tcp_sock_ipv6_specific;
235 ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
236 ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
243 if (!ipv6_addr_any(&np->rcv_saddr))
244 saddr = &np->rcv_saddr;
246 fl6.flowi6_proto = IPPROTO_TCP;
247 ipv6_addr_copy(&fl6.daddr, &np->daddr);
248 ipv6_addr_copy(&fl6.saddr,
249 (saddr ? saddr : &np->saddr));
250 fl6.flowi6_oif = sk->sk_bound_dev_if;
251 fl6.flowi6_mark = sk->sk_mark;
252 fl6.fl6_dport = usin->sin6_port;
253 fl6.fl6_sport = inet->inet_sport;
255 final_p = fl6_update_dst(&fl6, np->opt, &final);
257 security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
259 dst = ip6_dst_lookup_flow(sk, &fl6, final_p, true);
267 ipv6_addr_copy(&np->rcv_saddr, saddr);
270 /* set the source address */
271 ipv6_addr_copy(&np->saddr, saddr);
272 inet->inet_rcv_saddr = LOOPBACK4_IPV6;
274 sk->sk_gso_type = SKB_GSO_TCPV6;
275 __ip6_dst_store(sk, dst, NULL, NULL);
277 rt = (struct rt6_info *) dst;
278 if (tcp_death_row.sysctl_tw_recycle &&
279 !tp->rx_opt.ts_recent_stamp &&
280 ipv6_addr_equal(&rt->rt6i_dst.addr, &np->daddr)) {
281 struct inet_peer *peer = rt6_get_peer(rt);
283 * VJ's idea. We save last timestamp seen from
284 * the destination in peer table, when entering state
285 * TIME-WAIT * and initialize rx_opt.ts_recent from it,
286 * when trying new connection.
289 inet_peer_refcheck(peer);
290 if ((u32)get_seconds() - peer->tcp_ts_stamp <= TCP_PAWS_MSL) {
291 tp->rx_opt.ts_recent_stamp = peer->tcp_ts_stamp;
292 tp->rx_opt.ts_recent = peer->tcp_ts;
/*
 * Extension header length is either zero or derived from np->opt; the
 * condition selecting between the two is not visible in this listing.
 */
297 icsk->icsk_ext_hdr_len = 0;
299 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
/* Clamp the MSS to what fits in the minimum IPv6 MTU. */
302 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
304 inet->inet_dport = usin->sin6_port;
/* Enter SYN_SENT, hash the connecting socket, then send the SYN. */
306 tcp_set_state(sk, TCP_SYN_SENT);
307 err = inet6_hash_connect(&tcp_death_row, sk);
312 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
317 err = tcp_connect(sk);
/*
 * Presumably the failure path (its labels are not visible): the socket goes
 * back to TCP_CLOSE and the destination port and route caps are cleared.
 */
324 tcp_set_state(sk, TCP_CLOSE);
327 inet->inet_dport = 0;
328 sk->sk_route_caps = 0;
/*
 * tcp_v6_err - handle an ICMPv6 error that refers to a TCP segment.
 * @skb:    ICMPv6 payload; skb->data is read as the embedded IPv6 header
 * @opt:    not referenced in the visible lines
 * @type:   ICMPv6 type
 * @code:   ICMPv6 code
 * @offset: offset of the embedded TCP header inside skb->data
 * @info:   not referenced in the visible lines
 *
 * Visible behaviour:
 *  - the socket is found with inet6_lookup() using the embedded addresses
 *    and ports; a TIME_WAIT socket only has its reference dropped;
 *  - counters are bumped when the socket is owned by the user, when the hop
 *    limit is below min_hopcount, and when the embedded sequence number is
 *    outside snd_una..snd_nxt on a non-listening socket;
 *  - ICMPV6_PKT_TOOBIG re-validates or re-looks-up the route and, when the
 *    cached PMTU exceeds the route MTU, calls tcp_sync_mss() and
 *    tcp_simple_retransmit();
 *  - other types are converted with icmpv6_err_convert() and applied
 *    according to the socket state: a matching request sock on a listener
 *    is dropped, otherwise the error is reported or stored in sk_err_soft.
 *
 * NOTE(review): returns, gotos, labels and locking calls are on lines that
 * are missing from this listing.
 */
332 static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
333 u8 type, u8 code, int offset, __be32 info)
335 const struct ipv6hdr *hdr = (const struct ipv6hdr*)skb->data;
336 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
337 struct ipv6_pinfo *np;
342 struct net *net = dev_net(skb->dev);
/* Find the socket the offending segment belonged to. */
344 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
345 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
348 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
353 if (sk->sk_state == TCP_TIME_WAIT) {
354 inet_twsk_put(inet_twsk(sk));
359 if (sock_owned_by_user(sk))
360 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
362 if (sk->sk_state == TCP_CLOSE)
365 if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
366 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
/* The embedded sequence number must fall inside the unacknowledged window. */
371 seq = ntohl(th->seq);
372 if (sk->sk_state != TCP_LISTEN &&
373 !between(seq, tp->snd_una, tp->snd_nxt)) {
374 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
/* Path MTU handling. */
380 if (type == ICMPV6_PKT_TOOBIG) {
381 struct dst_entry *dst;
383 if (sock_owned_by_user(sk))
385 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
388 /* icmp should have updated the destination cache entry */
389 dst = __sk_dst_check(sk, np->dst_cookie);
392 struct inet_sock *inet = inet_sk(sk);
395 /* BUGGG_FUTURE: Again, it is not clear how
396 to handle rthdr case. Ignore this complexity
399 memset(&fl6, 0, sizeof(fl6));
400 fl6.flowi6_proto = IPPROTO_TCP;
401 ipv6_addr_copy(&fl6.daddr, &np->daddr);
402 ipv6_addr_copy(&fl6.saddr, &np->saddr);
403 fl6.flowi6_oif = sk->sk_bound_dev_if;
404 fl6.flowi6_mark = sk->sk_mark;
405 fl6.fl6_dport = inet->inet_dport;
406 fl6.fl6_sport = inet->inet_sport;
407 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
409 dst = ip6_dst_lookup_flow(sk, &fl6, NULL, false);
411 sk->sk_err_soft = -PTR_ERR(dst);
418 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
419 tcp_sync_mss(sk, dst_mtu(dst));
420 tcp_simple_retransmit(sk);
421 } /* else let the usual retransmit timer handle it */
/* Translate the ICMPv6 type and code into an errno value in err. */
426 icmpv6_err_convert(type, code, &err);
428 /* Might be for an request_sock */
429 switch (sk->sk_state) {
430 struct request_sock *req, **prev;
432 if (sock_owned_by_user(sk))
435 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
436 &hdr->saddr, inet6_iif(skb));
440 /* ICMPs are not backlogged, hence we cannot get
441 * an established socket here.
443 WARN_ON(req->sk != NULL);
445 if (seq != tcp_rsk(req)->snt_isn) {
446 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
450 inet_csk_reqsk_queue_drop(sk, req, prev);
454 case TCP_SYN_RECV: /* Cannot happen.
455 It can, it SYNs are crossed. --ANK */
/* Report the error at once only when no user context holds the socket. */
456 if (!sock_owned_by_user(sk)) {
458 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
462 sk->sk_err_soft = err;
/* Remaining states: report only if the socket asked for it via recverr. */
466 if (!sock_owned_by_user(sk) && np->recverr) {
468 sk->sk_error_report(sk);
470 sk->sk_err_soft = err;
/*
 * tcp_v6_send_synack - build and transmit a SYN-ACK for a pending request.
 * @sk:  listening socket
 * @req: connection request being answered
 * @rvp: extra values handed through to tcp_make_synack()
 *
 * Fills a flowi6 from the addresses, ports and interface stored in @req,
 * routes it with ip6_dst_lookup_flow(), builds the segment with
 * tcp_make_synack(), checksums it and sends it with ip6_xmit() using the
 * traffic class of @sk. The transmit result is normalised by
 * net_xmit_eval(). Tx options that differ from np->opt are freed at the end.
 *
 * NOTE(review): the declaration of err, the assignment of opt and the
 * return statement are on lines not visible in this listing.
 */
478 static int tcp_v6_send_synack(struct sock *sk, struct request_sock *req,
479 struct request_values *rvp)
481 struct inet6_request_sock *treq = inet6_rsk(req);
482 struct ipv6_pinfo *np = inet6_sk(sk);
483 struct sk_buff * skb;
484 struct ipv6_txoptions *opt = NULL;
485 struct in6_addr * final_p, final;
487 struct dst_entry *dst;
/* Describe the reply flow: remote address as destination, local as source. */
490 memset(&fl6, 0, sizeof(fl6));
491 fl6.flowi6_proto = IPPROTO_TCP;
492 ipv6_addr_copy(&fl6.daddr, &treq->rmt_addr);
493 ipv6_addr_copy(&fl6.saddr, &treq->loc_addr);
495 fl6.flowi6_oif = treq->iif;
496 fl6.flowi6_mark = sk->sk_mark;
497 fl6.fl6_dport = inet_rsk(req)->rmt_port;
498 fl6.fl6_sport = inet_rsk(req)->loc_port;
499 security_req_classify_flow(req, flowi6_to_flowi(&fl6));
502 final_p = fl6_update_dst(&fl6, opt, &final);
504 dst = ip6_dst_lookup_flow(sk, &fl6, final_p, false);
510 skb = tcp_make_synack(sk, dst, req, rvp);
513 __tcp_v6_send_check(skb, &treq->loc_addr, &treq->rmt_addr);
/* fl6.daddr is set to the remote address again before transmitting. */
515 ipv6_addr_copy(&fl6.daddr, &treq->rmt_addr);
516 err = ip6_xmit(sk, skb, &fl6, opt, np->tclass);
517 err = net_xmit_eval(err);
/* Only free options that are not the ones owned by the socket. */
521 if (opt && opt != np->opt)
522 sock_kfree_s(sk, opt, opt->tot_len);
/*
 * tcp_v6_rtx_synack - retransmit a SYN-ACK.
 * @sk:  listening socket
 * @req: connection request
 * @rvp: passed through unchanged
 *
 * Counts the retransmission in TCP_MIB_RETRANSSEGS and returns the result
 * of tcp_v6_send_synack().
 */
527 static int tcp_v6_rtx_synack(struct sock *sk, struct request_sock *req,
528 struct request_values *rvp)
530 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_RETRANSSEGS);
531 return tcp_v6_send_synack(sk, req, rvp);
/*
 * tcp_v6_reqsk_destructor - release per-request IPv6 state.
 * @req: request sock being destroyed
 *
 * Passes the pktopts skb held by the request to kfree_skb().
 */
534 static void tcp_v6_reqsk_destructor(struct request_sock *req)
536 kfree_skb(inet6_rsk(req)->pktopts);
539 #ifdef CONFIG_TCP_MD5SIG
/*
 * tcp_v6_md5_do_lookup - find the MD5 key configured for an IPv6 address.
 * @sk:   socket whose key table is searched
 * @addr: address to match
 *
 * Performs a linear scan over md5sig_info->keys6 and returns a pointer to
 * the base key of the first entry whose address equals @addr. The guard
 * for a missing or empty table and the fall-through return are on lines
 * not visible in this listing (presumably NULL - confirm).
 */
540 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
541 const struct in6_addr *addr)
543 struct tcp_sock *tp = tcp_sk(sk);
548 if (!tp->md5sig_info || !tp->md5sig_info->entries6)
551 for (i = 0; i < tp->md5sig_info->entries6; i++) {
552 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, addr))
553 return &tp->md5sig_info->keys6[i].base;
/*
 * tcp_v6_md5_lookup - look up the MD5 key for the peer of @addr_sk.
 * @sk:      socket whose key table is searched
 * @addr_sk: socket whose IPv6 destination address is the lookup key
 */
558 static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
559 struct sock *addr_sk)
561 return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
/*
 * tcp_v6_reqsk_md5_lookup - look up the MD5 key for a pending request.
 * @sk:  socket whose key table is searched
 * @req: request sock; its remote address is the lookup key
 */
564 static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
565 struct request_sock *req)
567 return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
/*
 * tcp_v6_md5_do_add - add or update the MD5 key for an IPv6 peer.
 * @sk:        socket owning the key table
 * @peer:      peer address the key applies to
 * @newkey:    key material; the pointer itself is stored in the table, the
 *             bytes are not copied by the visible code
 * @newkeylen: length of @newkey
 *
 * If an entry for @peer exists its length is updated in place. Otherwise
 * md5sig_info is allocated on first use (GFP_ATOMIC), GSO capabilities are
 * removed from the socket, the MD5 pool is requested when the first IPv6
 * entry is added, and the keys6 array grows by exactly one slot whenever it
 * is full. The new entry is appended and entries6 incremented.
 *
 * NOTE(review): the error returns and the handling of a failed array
 * allocation are on lines not visible in this listing.
 */
570 static int tcp_v6_md5_do_add(struct sock *sk, const struct in6_addr *peer,
571 char *newkey, u8 newkeylen)
573 /* Add key to the list */
574 struct tcp_md5sig_key *key;
575 struct tcp_sock *tp = tcp_sk(sk);
576 struct tcp6_md5sig_key *keys;
578 key = tcp_v6_md5_do_lookup(sk, peer);
580 /* modify existing entry - just update that one */
583 key->keylen = newkeylen;
585 /* reallocate new list if current one is full. */
586 if (!tp->md5sig_info) {
587 tp->md5sig_info = kzalloc(sizeof(*tp->md5sig_info), GFP_ATOMIC);
588 if (!tp->md5sig_info) {
592 sk_nocaps_add(sk, NETIF_F_GSO_MASK);
/* The shared MD5 pool is only requested for the first IPv6 entry. */
594 if (tp->md5sig_info->entries6 == 0 &&
595 !tcp_alloc_md5sig_pool()) {
/* Array full: allocate one more slot and move the existing entries over. */
599 if (tp->md5sig_info->alloced6 == tp->md5sig_info->entries6) {
600 keys = kmalloc((sizeof (tp->md5sig_info->keys6[0]) *
601 (tp->md5sig_info->entries6 + 1)), GFP_ATOMIC);
608 if (tp->md5sig_info->entries6)
609 memmove(keys, tp->md5sig_info->keys6,
610 (sizeof (tp->md5sig_info->keys6[0]) *
611 tp->md5sig_info->entries6));
613 kfree(tp->md5sig_info->keys6);
614 tp->md5sig_info->keys6 = keys;
615 tp->md5sig_info->alloced6++;
/* Append the new entry at index entries6. */
618 ipv6_addr_copy(&tp->md5sig_info->keys6[tp->md5sig_info->entries6].addr,
620 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.key = newkey;
621 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.keylen = newkeylen;
623 tp->md5sig_info->entries6++;
/*
 * tcp_v6_md5_add_func - add an MD5 key for the peer of @addr_sk.
 * @sk:        socket owning the key table
 * @addr_sk:   socket whose IPv6 destination address identifies the peer
 * @newkey:    key material
 * @newkeylen: key length
 *
 * Forwards to tcp_v6_md5_do_add(); the remaining arguments of the call are
 * on a line not visible in this listing.
 */
628 static int tcp_v6_md5_add_func(struct sock *sk, struct sock *addr_sk,
629 u8 *newkey, __u8 newkeylen)
631 return tcp_v6_md5_do_add(sk, &inet6_sk(addr_sk)->daddr,
/*
 * tcp_v6_md5_do_del - remove the MD5 key configured for an IPv6 peer.
 * @sk:   socket owning the key table
 * @peer: peer address whose key is removed
 *
 * Scans keys6 for @peer, frees the key material and decrements entries6.
 * When the table becomes empty the array is freed and the bookkeeping
 * reset; otherwise the entries after the removed slot are shifted down.
 *
 * NOTE(review): md5sig_info is dereferenced without a NULL check in the
 * visible lines. tcp_v6_parse_md5_keys() checks it before calling; other
 * callers should be confirmed. Return values are on lines not shown.
 */
635 static int tcp_v6_md5_do_del(struct sock *sk, const struct in6_addr *peer)
637 struct tcp_sock *tp = tcp_sk(sk);
640 for (i = 0; i < tp->md5sig_info->entries6; i++) {
641 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, peer)) {
643 kfree(tp->md5sig_info->keys6[i].base.key);
644 tp->md5sig_info->entries6--;
646 if (tp->md5sig_info->entries6 == 0) {
647 kfree(tp->md5sig_info->keys6);
648 tp->md5sig_info->keys6 = NULL;
649 tp->md5sig_info->alloced6 = 0;
651 /* shrink the database */
/* entries6 is already decremented, so this moves only the trailing entries. */
652 if (tp->md5sig_info->entries6 != i)
653 memmove(&tp->md5sig_info->keys6[i],
654 &tp->md5sig_info->keys6[i+1],
655 (tp->md5sig_info->entries6 - i)
656 * sizeof (tp->md5sig_info->keys6[0]));
/*
 * tcp_v6_clear_md5_list - drop every MD5 key attached to a socket.
 * @sk: socket whose key tables are emptied
 *
 * Frees the key material of each IPv6 entry, then the keys6 array, and
 * repeats the same for the IPv4 table (keys4). Counters and array pointers
 * are reset to zero and NULL.
 *
 * NOTE(review): md5sig_info is dereferenced without a visible NULL check;
 * callers presumably guarantee it is set - confirm.
 */
664 static void tcp_v6_clear_md5_list (struct sock *sk)
666 struct tcp_sock *tp = tcp_sk(sk);
/* IPv6 keys. */
669 if (tp->md5sig_info->entries6) {
670 for (i = 0; i < tp->md5sig_info->entries6; i++)
671 kfree(tp->md5sig_info->keys6[i].base.key);
672 tp->md5sig_info->entries6 = 0;
675 kfree(tp->md5sig_info->keys6);
676 tp->md5sig_info->keys6 = NULL;
677 tp->md5sig_info->alloced6 = 0;
/* IPv4 keys. */
679 if (tp->md5sig_info->entries4) {
680 for (i = 0; i < tp->md5sig_info->entries4; i++)
681 kfree(tp->md5sig_info->keys4[i].base.key);
682 tp->md5sig_info->entries4 = 0;
685 kfree(tp->md5sig_info->keys4);
686 tp->md5sig_info->keys4 = NULL;
687 tp->md5sig_info->alloced4 = 0;
/*
 * tcp_v6_parse_md5_keys - apply an MD5 key request coming from user space.
 * @sk:     socket being configured
 * @optval: user pointer to a struct tcp_md5sig
 * (the option length parameter, optlen, is declared on a line not visible
 * in this listing)
 *
 * Copies the request from user space and requires an AF_INET6 address.
 * A zero key length means delete; a non-zero length (bounded by
 * TCP_MD5SIG_MAXKEYLEN) means add. In both cases a v4-mapped address is
 * routed to the IPv4 helper using the low 32 bits of the address, and any
 * other address goes to the IPv6 helper. On add, md5sig_info is allocated
 * if missing and the key bytes are duplicated with kmemdup() before being
 * handed to the add helper.
 *
 * NOTE(review): the error returns for the individual checks are on lines
 * not visible here.
 */
690 static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
693 struct tcp_md5sig cmd;
694 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
697 if (optlen < sizeof(cmd))
700 if (copy_from_user(&cmd, optval, sizeof(cmd)))
703 if (sin6->sin6_family != AF_INET6)
/* Zero key length: delete the key for this peer. */
706 if (!cmd.tcpm_keylen) {
707 if (!tcp_sk(sk)->md5sig_info)
709 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
710 return tcp_v4_md5_do_del(sk, sin6->sin6_addr.s6_addr32[3]);
711 return tcp_v6_md5_do_del(sk, &sin6->sin6_addr);
714 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
/* First key on this socket: allocate the bookkeeping structure. */
717 if (!tcp_sk(sk)->md5sig_info) {
718 struct tcp_sock *tp = tcp_sk(sk);
719 struct tcp_md5sig_info *p;
721 p = kzalloc(sizeof(struct tcp_md5sig_info), GFP_KERNEL);
726 sk_nocaps_add(sk, NETIF_F_GSO_MASK);
/* The add helpers receive a private copy of the key bytes. */
729 newkey = kmemdup(cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
732 if (ipv6_addr_v4mapped(&sin6->sin6_addr)) {
733 return tcp_v4_md5_do_add(sk, sin6->sin6_addr.s6_addr32[3],
734 newkey, cmd.tcpm_keylen);
736 return tcp_v6_md5_do_add(sk, &sin6->sin6_addr, newkey, cmd.tcpm_keylen);
/*
 * tcp_v6_md5_hash_pseudoheader - feed the IPv6 pseudo-header to the hash.
 * @hp:     MD5 pool entry providing the scratch block and hash descriptor
 * @daddr:  destination address placed in the pseudo-header
 * @saddr:  source address placed in the pseudo-header
 * @nbytes: length value placed in the pseudo-header
 *
 * Fills hp->md5_blk.ip6 with the addresses, IPPROTO_TCP and @nbytes (both
 * stored big-endian) and returns the result of crypto_hash_update() over
 * that block.
 */
739 static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
740 const struct in6_addr *daddr,
741 const struct in6_addr *saddr, int nbytes)
743 struct tcp6_pseudohdr *bp;
744 struct scatterlist sg;
746 bp = &hp->md5_blk.ip6;
747 /* 1. TCP pseudo-header (RFC2460) */
748 ipv6_addr_copy(&bp->saddr, saddr);
749 ipv6_addr_copy(&bp->daddr, daddr);
750 bp->protocol = cpu_to_be32(IPPROTO_TCP);
751 bp->len = cpu_to_be32(nbytes);
753 sg_init_one(&sg, bp, sizeof(*bp));
754 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
/*
 * tcp_v6_md5_hash_hdr - MD5 signature over pseudo-header, TCP header and key.
 * @md5_hash: output buffer; the failure path clears 16 bytes of it
 * @key:      MD5 key
 * @daddr:    destination address for the pseudo-header
 * @saddr:    source address for the pseudo-header
 * @th:       TCP header to sign; its header length (doff << 2) is used as
 *            the pseudo-header length
 *
 * Takes an MD5 pool entry, hashes pseudo-header, header and key in that
 * order, finalises into @md5_hash and releases the pool entry. On any
 * failure the pool entry is released where it was taken and the output is
 * zeroed.
 *
 * NOTE(review): the goto targets and return values are on lines not
 * visible in this listing.
 */
757 static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
758 const struct in6_addr *daddr, struct in6_addr *saddr,
759 const struct tcphdr *th)
761 struct tcp_md5sig_pool *hp;
762 struct hash_desc *desc;
764 hp = tcp_get_md5sig_pool();
766 goto clear_hash_noput;
767 desc = &hp->md5_desc;
769 if (crypto_hash_init(desc))
771 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
773 if (tcp_md5_hash_header(hp, th))
775 if (tcp_md5_hash_key(hp, key))
777 if (crypto_hash_final(desc, md5_hash))
/* Success path: release the pool entry. */
780 tcp_put_md5sig_pool();
/* Failure path: release the pool entry and blank the output. */
784 tcp_put_md5sig_pool();
786 memset(md5_hash, 0, 16);
/*
 * tcp_v6_md5_hash_skb - MD5 signature over a whole TCP segment.
 * @md5_hash: output buffer; the failure path clears 16 bytes of it
 * @key:      MD5 key
 * @sk:       socket supplying the addresses in one of the branches
 * @req:      request sock supplying the addresses in another branch
 * @skb:      segment to sign
 *
 * The address pair comes from @sk, from @req, or from the IPv6 header of
 * @skb; the conditions choosing between the three are on lines not visible
 * in this listing. The hash covers the pseudo-header (length skb->len), the
 * TCP header, the data following the header and finally the key.
 */
790 static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
791 const struct sock *sk,
792 const struct request_sock *req,
793 const struct sk_buff *skb)
795 const struct in6_addr *saddr, *daddr;
796 struct tcp_md5sig_pool *hp;
797 struct hash_desc *desc;
798 const struct tcphdr *th = tcp_hdr(skb);
801 saddr = &inet6_sk(sk)->saddr;
802 daddr = &inet6_sk(sk)->daddr;
804 saddr = &inet6_rsk(req)->loc_addr;
805 daddr = &inet6_rsk(req)->rmt_addr;
807 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
808 saddr = &ip6h->saddr;
809 daddr = &ip6h->daddr;
812 hp = tcp_get_md5sig_pool();
814 goto clear_hash_noput;
815 desc = &hp->md5_desc;
817 if (crypto_hash_init(desc))
820 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
822 if (tcp_md5_hash_header(hp, th))
824 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
826 if (tcp_md5_hash_key(hp, key))
828 if (crypto_hash_final(desc, md5_hash))
/* Success path: release the pool entry. */
831 tcp_put_md5sig_pool();
/* Failure path: release the pool entry and blank the output. */
835 tcp_put_md5sig_pool();
837 memset(md5_hash, 0, 16);
/*
 * tcp_v6_inbound_md5_hash - check the MD5 signature of a received segment.
 * @sk:  receiving socket
 * @skb: received segment
 *
 * The expected key is looked up by the IPv6 source address of @skb and the
 * MD5 option is parsed from the TCP header. Four cases are distinguished:
 * neither key nor option; key without option (LINUX_MIB_TCPMD5NOTFOUND);
 * option without key (LINUX_MIB_TCPMD5UNEXPECTED); both present, in which
 * case the hash is recomputed and compared over 16 bytes, with a
 * rate-limited log line on failure or mismatch.
 *
 * NOTE(review): the return value of each case is on a line not visible in
 * this listing.
 */
841 static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
843 const __u8 *hash_location = NULL;
844 struct tcp_md5sig_key *hash_expected;
845 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
846 const struct tcphdr *th = tcp_hdr(skb);
850 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
851 hash_location = tcp_parse_md5sig_option(th);
853 /* We've parsed the options - do we have a hash? */
854 if (!hash_expected && !hash_location)
857 if (hash_expected && !hash_location) {
858 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
862 if (!hash_expected && hash_location) {
863 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
867 /* check the signature */
868 genhash = tcp_v6_md5_hash_skb(newhash,
872 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
873 if (net_ratelimit()) {
874 printk(KERN_INFO "MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
875 genhash ? "failed" : "mismatch",
876 &ip6h->saddr, ntohs(th->source),
877 &ip6h->daddr, ntohs(th->dest));
/*
 * Request-sock operations for TCP over IPv6. The object size is that of
 * struct tcp6_request_sock and the callbacks point at the IPv6 handlers
 * declared in this file plus tcp_syn_ack_timeout. One initialiser line is
 * not visible in this listing.
 */
885 struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
887 .obj_size = sizeof(struct tcp6_request_sock),
888 .rtx_syn_ack = tcp_v6_rtx_synack,
889 .send_ack = tcp_v6_reqsk_send_ack,
890 .destructor = tcp_v6_reqsk_destructor,
891 .send_reset = tcp_v6_send_reset,
892 .syn_ack_timeout = tcp_syn_ack_timeout,
895 #ifdef CONFIG_TCP_MD5SIG
/*
 * MD5 hooks used for IPv6 request socks: key lookup by the remote address
 * of the request and hashing of a whole segment.
 */
896 static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
897 .md5_lookup = tcp_v6_reqsk_md5_lookup,
898 .calc_md5_hash = tcp_v6_md5_hash_skb,
/*
 * __tcp_v6_send_check - fill in the TCP checksum field of an outgoing skb.
 * @skb:   segment whose TCP header is updated
 * @saddr: IPv6 source address for the pseudo-header
 * @daddr: IPv6 destination address for the pseudo-header
 *
 * With CHECKSUM_PARTIAL the field receives the complemented pseudo-header
 * sum and csum_start and csum_offset are set to locate the check field.
 * In the other branch the field receives a checksum computed by
 * tcp_v6_check() on top of csum_partial() over the TCP header; the
 * remaining arguments of that call are not visible in this listing.
 */
902 static void __tcp_v6_send_check(struct sk_buff *skb,
903 const struct in6_addr *saddr, const struct in6_addr *daddr)
905 struct tcphdr *th = tcp_hdr(skb);
907 if (skb->ip_summed == CHECKSUM_PARTIAL) {
908 th->check = ~tcp_v6_check(skb->len, saddr, daddr, 0);
909 skb->csum_start = skb_transport_header(skb) - skb->head;
910 skb->csum_offset = offsetof(struct tcphdr, check);
912 th->check = tcp_v6_check(skb->len, saddr, daddr,
913 csum_partial(th, th->doff << 2,
/*
 * tcp_v6_send_check - checksum an outgoing segment for a connected socket.
 * @sk:  socket supplying the IPv6 source and destination addresses
 * @skb: segment to checksum
 */
918 static void tcp_v6_send_check(struct sock *sk, struct sk_buff *skb)
920 struct ipv6_pinfo *np = inet6_sk(sk);
922 __tcp_v6_send_check(skb, &np->saddr, &np->daddr);
/*
 * tcp_v6_gso_send_check - prepare the checksum of a GSO segment.
 * @skb: segment to prepare
 *
 * Requires that a TCP header can be pulled, marks the skb
 * CHECKSUM_PARTIAL and seeds the checksum from the addresses in its IPv6
 * header. Return values are on lines not visible in this listing.
 */
925 static int tcp_v6_gso_send_check(struct sk_buff *skb)
927 const struct ipv6hdr *ipv6h;
930 if (!pskb_may_pull(skb, sizeof(*th)))
933 ipv6h = ipv6_hdr(skb);
937 skb->ip_summed = CHECKSUM_PARTIAL;
938 __tcp_v6_send_check(skb, &ipv6h->saddr, &ipv6h->daddr);
/*
 * tcp6_gro_receive - GRO receive hook for TCP over IPv6.
 * @head: list of held packets, passed on to tcp_gro_receive()
 * (the skb parameter is declared on a line not visible in this listing)
 *
 * For CHECKSUM_COMPLETE packets the checksum is verified against the IPv6
 * pseudo-header and, when it verifies, the skb is marked
 * CHECKSUM_UNNECESSARY. Another path sets the flush flag in NAPI_GRO_CB;
 * the control flow reaching it is not fully visible. The packet is then
 * handed to tcp_gro_receive().
 */
942 static struct sk_buff **tcp6_gro_receive(struct sk_buff **head,
945 const struct ipv6hdr *iph = skb_gro_network_header(skb);
947 switch (skb->ip_summed) {
948 case CHECKSUM_COMPLETE:
949 if (!tcp_v6_check(skb_gro_len(skb), &iph->saddr, &iph->daddr,
951 skb->ip_summed = CHECKSUM_UNNECESSARY;
957 NAPI_GRO_CB(skb)->flush = 1;
961 return tcp_gro_receive(head, skb);
/*
 * tcp6_gro_complete - GRO completion hook for TCP over IPv6.
 * @skb: merged packet
 *
 * Stores the complemented pseudo-header checksum for the TCP length
 * (skb->len minus the transport offset), tags the packet as
 * SKB_GSO_TCPV6 and returns the result of tcp_gro_complete().
 */
964 static int tcp6_gro_complete(struct sk_buff *skb)
966 const struct ipv6hdr *iph = ipv6_hdr(skb);
967 struct tcphdr *th = tcp_hdr(skb);
969 th->check = ~tcp_v6_check(skb->len - skb_transport_offset(skb),
970 &iph->saddr, &iph->daddr, 0);
971 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
973 return tcp_gro_complete(skb);
/*
 * tcp_v6_send_response - build and send a bare TCP reply (ACK or RST).
 * @skb:    segment being answered; ports and addresses are swapped from it
 * @seq:    sequence number for the reply
 * @ack:    acknowledgement number for the reply
 * @win:    window value for the reply
 * @ts:     value echoed in the timestamp option when that option is emitted
 * @key:    MD5 key used to sign the reply under CONFIG_TCP_MD5SIG
 * @rst:    non-zero when the reply is a reset
 * @tclass: traffic class passed to ip6_xmit()
 *
 * The reply is allocated with room for the TCP header plus the aligned
 * timestamp and MD5 options, filled in, checksummed as CHECKSUM_PARTIAL,
 * routed with ip6_dst_lookup_flow() on the per-namespace control socket
 * and sent with ip6_xmit(). The ACK flag is set unless this is a reset
 * answering a segment that itself carried ACK. For link-local destinations
 * the outgoing interface is the one the segment arrived on.
 *
 * NOTE(review): the conditions guarding the option blocks, the allocation
 * failure check and the statistics branches are on lines not visible in
 * this listing.
 */
976 static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
977 u32 ts, struct tcp_md5sig_key *key, int rst, u8 tclass)
979 const struct tcphdr *th = tcp_hdr(skb);
981 struct sk_buff *buff;
983 struct net *net = dev_net(skb_dst(skb)->dev);
984 struct sock *ctl_sk = net->ipv6.tcp_sk;
985 unsigned int tot_len = sizeof(struct tcphdr);
986 struct dst_entry *dst;
/* Account for the options that will follow the fixed TCP header. */
990 tot_len += TCPOLEN_TSTAMP_ALIGNED;
991 #ifdef CONFIG_TCP_MD5SIG
993 tot_len += TCPOLEN_MD5SIG_ALIGNED;
996 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
1001 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1003 t1 = (struct tcphdr *) skb_push(buff, tot_len);
1004 skb_reset_transport_header(buff);
1006 /* Swap the send and the receive. */
1007 memset(t1, 0, sizeof(*t1));
1008 t1->dest = th->source;
1009 t1->source = th->dest;
1010 t1->doff = tot_len / 4;
1011 t1->seq = htonl(seq);
1012 t1->ack_seq = htonl(ack);
1013 t1->ack = !rst || !th->ack;
1015 t1->window = htons(win);
/* Options start right after the fixed header. */
1017 topt = (__be32 *)(t1 + 1);
1020 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1021 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
1022 *topt++ = htonl(tcp_time_stamp);
1023 *topt++ = htonl(ts);
1026 #ifdef CONFIG_TCP_MD5SIG
1028 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1029 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
1030 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
1031 &ipv6_hdr(skb)->saddr,
1032 &ipv6_hdr(skb)->daddr, t1);
/* The reply flows back to the sender of the original segment. */
1036 memset(&fl6, 0, sizeof(fl6));
1037 ipv6_addr_copy(&fl6.daddr, &ipv6_hdr(skb)->saddr);
1038 ipv6_addr_copy(&fl6.saddr, &ipv6_hdr(skb)->daddr);
1040 buff->ip_summed = CHECKSUM_PARTIAL;
1043 __tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
1045 fl6.flowi6_proto = IPPROTO_TCP;
1046 if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
1047 fl6.flowi6_oif = inet6_iif(skb);
1048 fl6.fl6_dport = t1->dest;
1049 fl6.fl6_sport = t1->source;
1050 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
1052 /* Pass a socket to ip6_dst_lookup either it is for RST
1053 * Underlying function will use this to retrieve the network
1056 dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL, false);
1058 skb_dst_set(buff, dst);
1059 ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
1060 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
1062 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
/*
 * tcp_v6_send_reset - answer a segment with a RST.
 * @sk:  socket used for the MD5 key lookup
 * @skb: offending segment
 *
 * Only segments with a unicast destination are considered. Under
 * CONFIG_TCP_MD5SIG the key is looked up by the source address of @skb.
 * The reply takes its sequence number from the acknowledgement field of
 * the segment in one branch; in the other the acknowledgement number is
 * the sequence number of the segment plus SYN, FIN and its length (the end
 * of that expression is not visible). The reply is sent with window 0,
 * no timestamp value, rst set and traffic class 0.
 *
 * NOTE(review): the early returns and the condition selecting between the
 * two branches are on lines not visible in this listing.
 */
1069 static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
1071 const struct tcphdr *th = tcp_hdr(skb);
1072 u32 seq = 0, ack_seq = 0;
1073 struct tcp_md5sig_key *key = NULL;
1078 if (!ipv6_unicast_destination(skb))
1081 #ifdef CONFIG_TCP_MD5SIG
1083 key = tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->saddr);
1087 seq = ntohl(th->ack_seq);
1089 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
1092 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, key, 1, 0);
/*
 * tcp_v6_send_ack - send a bare ACK in reply to @skb.
 * @skb:    segment being acknowledged
 * @seq:    sequence number for the ACK
 * @ack:    acknowledgement number
 * @win:    window value
 * @ts:     timestamp value to echo
 * @key:    MD5 key
 * @tclass: traffic class
 *
 * Same as tcp_v6_send_response() with the rst argument fixed to 0.
 */
1095 static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack, u32 win, u32 ts,
1096 struct tcp_md5sig_key *key, u8 tclass)
1098 tcp_v6_send_response(skb, seq, ack, win, ts, key, 0, tclass);
/*
 * tcp_v6_timewait_ack - acknowledge a segment on behalf of a timewait sock.
 * @sk:  timewait socket
 * @skb: segment being acknowledged
 *
 * Sends an ACK built from the saved send-next and receive-next values, the
 * receive window shifted right by the saved window scale, the saved
 * timestamp and the timewait MD5 key. The last argument of the call and any
 * statement following it are not visible in this listing.
 */
1101 static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
1103 struct inet_timewait_sock *tw = inet_twsk(sk);
1104 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1106 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
1107 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
1108 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw),
/*
 * tcp_v6_reqsk_send_ack - send an ACK for a connection still in the
 * request stage.
 * @sk:  listening socket, used for the MD5 key lookup
 * @skb: segment being acknowledged
 * @req: request sock supplying the sequence numbers, window and timestamp
 *
 * The ACK carries snt_isn + 1 and rcv_isn + 1 and traffic class 0.
 *
 * NOTE(review): the MD5 key is looked up by the destination address of
 * @skb, whereas tcp_v6_send_reset() and tcp_v6_inbound_md5_hash() look up
 * by the source address - confirm which address is intended here.
 */
1114 static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
1115 struct request_sock *req)
1117 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1, req->rcv_wnd, req->ts_recent,
1118 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr), 0);
/*
 * tcp_v6_hnd_req - find the socket that should handle a segment arriving
 * on a listener.
 * @sk:  listening socket
 * @skb: received segment
 *
 * First searches the pending requests of @sk by source port, addresses and
 * incoming interface; a hit is handed to tcp_check_req(). Otherwise the
 * established table is searched. A hit that is not in TIME_WAIT is handled
 * on lines not visible in this listing; a TIME_WAIT hit only has its
 * reference dropped. With CONFIG_SYN_COOKIES the segment is additionally
 * passed to cookie_v6_check().
 *
 * NOTE(review): the conditions around each step and the return statements
 * are on lines not visible here.
 */
1122 static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
1124 struct request_sock *req, **prev;
1125 const struct tcphdr *th = tcp_hdr(skb);
1128 /* Find possible connection requests. */
1129 req = inet6_csk_search_req(sk, &prev, th->source,
1130 &ipv6_hdr(skb)->saddr,
1131 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1133 return tcp_check_req(sk, skb, req, prev);
/* No pending request: look for an already established connection. */
1135 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
1136 &ipv6_hdr(skb)->saddr, th->source,
1137 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1140 if (nsk->sk_state != TCP_TIME_WAIT) {
1144 inet_twsk_put(inet_twsk(nsk));
1148 #ifdef CONFIG_SYN_COOKIES
1150 sk = cookie_v6_check(sk, skb);
1155 /* FIXME: this is substantially similar to the ipv4 code.
1156 * Can some kind of merge be done? -- erics
/*
 * tcp_v6_conn_request - handle an incoming SYN on a listening socket.
 * @sk:  listening socket
 * @skb: received SYN
 *
 * Visible steps, in order:
 *  - IPv4 packets (ETH_P_IP) are delegated to tcp_v4_conn_request();
 *  - only unicast destinations are considered;
 *  - when the request queue is full and no ISN was supplied in
 *    TCP_SKB_CB(skb)->when, tcp_syn_flood_action() decides whether syn
 *    cookies are used;
 *  - the accept queue being full together with more than one young request
 *    is checked before a request sock is allocated;
 *  - TCP options are parsed with the MSS clamp derived from IPV6_MIN_MTU;
 *  - the TCP cookie extension fills tmp_ext from the packet addresses and
 *    the initiator cookie when its preconditions hold;
 *  - the request is initialised with the addresses of the SYN and, for
 *    link-local peers on an unbound listener, the incoming interface;
 *  - the ISN is chosen: from the syn cookie code, from the caller, or from
 *    tcp_v6_init_sequence() after the tw_recycle and backlog checks;
 *  - the SYN-ACK is sent and the request is hashed with TCP_TIMEOUT_INIT.
 *
 * The last visible statement returns 0, which the original comment marks
 * as the case where no reset is sent.
 *
 * NOTE(review): gotos, labels, error paths and several conditions are on
 * lines not visible in this listing.
 */
1158 static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
1160 struct tcp_extend_values tmp_ext;
1161 struct tcp_options_received tmp_opt;
1162 const u8 *hash_location;
1163 struct request_sock *req;
1164 struct inet6_request_sock *treq;
1165 struct ipv6_pinfo *np = inet6_sk(sk);
1166 struct tcp_sock *tp = tcp_sk(sk);
1167 __u32 isn = TCP_SKB_CB(skb)->when;
1168 struct dst_entry *dst = NULL;
1169 int want_cookie = 0;
/* A v4 packet on a v6 listener is handled by the IPv4 code. */
1171 if (skb->protocol == htons(ETH_P_IP))
1172 return tcp_v4_conn_request(sk, skb);
1174 if (!ipv6_unicast_destination(skb))
1177 if (inet_csk_reqsk_queue_is_full(sk) && !isn) {
1178 want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
1183 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1)
1186 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1190 #ifdef CONFIG_TCP_MD5SIG
1191 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
/* Parse the options of the SYN into a scratch structure. */
1194 tcp_clear_options(&tmp_opt);
1195 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1196 tmp_opt.user_mss = tp->rx_opt.user_mss;
1197 tcp_parse_options(skb, &tmp_opt, &hash_location, 0);
/* TCP cookie extension: only with a cookie option, timestamps and local consent. */
1199 if (tmp_opt.cookie_plus > 0 &&
1200 tmp_opt.saw_tstamp &&
1201 !tp->rx_opt.cookie_out_never &&
1202 (sysctl_tcp_cookie_size > 0 ||
1203 (tp->cookie_values != NULL &&
1204 tp->cookie_values->cookie_desired > 0))) {
1207 u32 *mess = &tmp_ext.cookie_bakery[COOKIE_DIGEST_WORDS];
1208 int l = tmp_opt.cookie_plus - TCPOLEN_COOKIE_BASE;
1210 if (tcp_cookie_generator(&tmp_ext.cookie_bakery[0]) != 0)
1213 /* Secret recipe starts with IP addresses */
1214 d = (__force u32 *)&ipv6_hdr(skb)->daddr.s6_addr32[0];
1219 d = (__force u32 *)&ipv6_hdr(skb)->saddr.s6_addr32[0];
1225 /* plus variable length Initiator Cookie */
1228 *c++ ^= *hash_location++;
1230 want_cookie = 0; /* not our kind of cookie */
1231 tmp_ext.cookie_out_never = 0; /* false */
1232 tmp_ext.cookie_plus = tmp_opt.cookie_plus;
1233 } else if (!tp->rx_opt.cookie_in_always) {
1234 /* redundant indications, but ensure initialization. */
1235 tmp_ext.cookie_out_never = 1; /* true */
1236 tmp_ext.cookie_plus = 0;
1240 tmp_ext.cookie_in_always = tp->rx_opt.cookie_in_always;
/* Syn cookies without timestamps cannot carry the other options. */
1242 if (want_cookie && !tmp_opt.saw_tstamp)
1243 tcp_clear_options(&tmp_opt);
1245 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1246 tcp_openreq_init(req, &tmp_opt, skb);
/* Record the addresses of the SYN in the request. */
1248 treq = inet6_rsk(req);
1249 ipv6_addr_copy(&treq->rmt_addr, &ipv6_hdr(skb)->saddr);
1250 ipv6_addr_copy(&treq->loc_addr, &ipv6_hdr(skb)->daddr);
1251 if (!want_cookie || tmp_opt.tstamp_ok)
1252 TCP_ECN_create_request(req, skb);
1254 treq->iif = sk->sk_bound_dev_if;
1256 /* So that link locals have meaning */
1257 if (!sk->sk_bound_dev_if &&
1258 ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1259 treq->iif = inet6_iif(skb);
1262 struct inet_peer *peer = NULL;
/* Keep a reference to the SYN when its packet options must be replayed later. */
1264 if (ipv6_opt_accepted(sk, skb) ||
1265 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1266 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1267 atomic_inc(&skb->users);
1268 treq->pktopts = skb;
1272 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1273 req->cookie_ts = tmp_opt.tstamp_ok;
1277 /* VJ's idea. We save last timestamp seen
1278 * from the destination in peer table, when entering
1279 * state TIME-WAIT, and check against it before
1280 * accepting new connection request.
1282 * If "isn" is not zero, this request hit alive
1283 * timewait bucket, so that all the necessary checks
1284 * are made in the function processing timewait state.
1286 if (tmp_opt.saw_tstamp &&
1287 tcp_death_row.sysctl_tw_recycle &&
1288 (dst = inet6_csk_route_req(sk, req)) != NULL &&
1289 (peer = rt6_get_peer((struct rt6_info *)dst)) != NULL &&
1290 ipv6_addr_equal((struct in6_addr *)peer->daddr.addr.a6,
1292 inet_peer_refcheck(peer);
1293 if ((u32)get_seconds() - peer->tcp_ts_stamp < TCP_PAWS_MSL &&
1294 (s32)(peer->tcp_ts - req->ts_recent) >
1296 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1297 goto drop_and_release;
1300 /* Kill the following clause, if you dislike this way. */
1301 else if (!sysctl_tcp_syncookies &&
1302 (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1303 (sysctl_max_syn_backlog >> 2)) &&
1304 (!peer || !peer->tcp_ts_stamp) &&
1305 (!dst || !dst_metric(dst, RTAX_RTT))) {
1306 /* Without syncookies last quarter of
1307 * backlog is filled with destinations,
1308 * proven to be alive.
1309 * It means that we continue to communicate
1310 * to destinations, already remembered
1311 * to the moment of synflood.
1313 LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
1314 &treq->rmt_addr, ntohs(tcp_hdr(skb)->source));
1315 goto drop_and_release;
1318 isn = tcp_v6_init_sequence(skb);
1321 tcp_rsk(req)->snt_isn = isn;
1322 tcp_rsk(req)->snt_synack = tcp_time_stamp;
1324 security_inet_conn_request(sk, skb, req);
1326 if (tcp_v6_send_synack(sk, req,
1327 (struct request_values *)&tmp_ext) ||
1331 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1339 return 0; /* don't send reset */
// tcp_v6_syn_recv_sock - create the child socket for a pending connection
// request on a listening IPv6 TCP socket.
// @sk:  listening socket
// @skb: received segment being processed
// @req: request_sock describing the pending connection
// @dst: route entry; the native IPv6 path below assigns it from
//       inet6_csk_route_req()
// NOTE(review): this listing elides some lines of the function (braces,
// labels, short statements), so the notes below cover only what is visible.
1342 static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
1343 struct request_sock *req,
1344 struct dst_entry *dst)
1346 struct inet6_request_sock *treq;
1347 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1348 struct tcp6_sock *newtcp6sk;
1349 struct inet_sock *newinet;
1350 struct tcp_sock *newtp;
1352 struct ipv6_txoptions *opt;
1353 #ifdef CONFIG_TCP_MD5SIG
1354 struct tcp_md5sig_key *key;
// IPv4 segment arriving on the IPv6 socket: the child is created by
// tcp_v4_syn_recv_sock() and its IPv6 state is then filled in with
// v4-mapped addresses.
1357 if (skb->protocol == htons(ETH_P_IP)) {
1362 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1367 newtcp6sk = (struct tcp6_sock *)newsk;
1368 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1370 newinet = inet_sk(newsk);
1371 newnp = inet6_sk(newsk);
1372 newtp = tcp_sk(newsk);
// Start from a copy of the listener's ipv6_pinfo, then overwrite the
// per-connection members.
1374 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1376 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newnp->daddr);
1378 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
1380 ipv6_addr_copy(&newnp->rcv_saddr, &newnp->saddr);
// The child uses the mapped af_ops and the IPv4 backlog receive handler.
1382 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1383 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
1384 #ifdef CONFIG_TCP_MD5SIG
1385 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
// Pointers duplicated by the memcpy above are reset for the child.
// NOTE(review): only ipv6_ac_list, ipv6_fl_list and pktoptions are visibly
// cleared; confirm that no other copied pointer (for example a multicast
// membership list) stays shared with the listener.
1388 newnp->ipv6_ac_list = NULL;
1389 newnp->ipv6_fl_list = NULL;
1390 newnp->pktoptions = NULL;
1392 newnp->mcast_oif = inet6_iif(skb);
1393 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1396 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1397 * here, tcp_create_openreq_child now does this for us, see the comment in
1398 * that function for the gory details. -acme
1401 /* It is tricky place. Until this moment IPv4 tcp
1402 worked with IPv6 icsk.icsk_af_ops.
1405 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
// Native IPv6 request from here on.
1410 treq = inet6_rsk(req);
1413 if (sk_acceptq_is_full(sk))
1417 dst = inet6_csk_route_req(sk, req);
1422 newsk = tcp_create_openreq_child(sk, req, skb);
1427 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1428 * count here, tcp_create_openreq_child now does this for us, see the
1429 * comment in that function for the gory details. -acme
1432 newsk->sk_gso_type = SKB_GSO_TCPV6;
1433 __ip6_dst_store(newsk, dst, NULL, NULL);
1435 newtcp6sk = (struct tcp6_sock *)newsk;
1436 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1438 newtp = tcp_sk(newsk);
1439 newinet = inet_sk(newsk);
1440 newnp = inet6_sk(newsk);
// As in the mapped path: copy the listener's ipv6_pinfo, then fix up the
// members that must differ. The same review note about copied pointers
// applies to the resets further down.
1442 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
// Addresses and the bound device come from the request.
1444 ipv6_addr_copy(&newnp->daddr, &treq->rmt_addr);
1445 ipv6_addr_copy(&newnp->saddr, &treq->loc_addr);
1446 ipv6_addr_copy(&newnp->rcv_saddr, &treq->loc_addr);
1447 newsk->sk_bound_dev_if = treq->iif;
1449 /* Now IPv6 options...
1451 First: no IPv4 options.
1453 newinet->inet_opt = NULL;
1454 newnp->ipv6_ac_list = NULL;
1455 newnp->ipv6_fl_list = NULL;
1458 newnp->rxopt.all = np->rxopt.all;
1460 /* Clone pktoptions received with SYN */
// The packet options saved on the request move to the child: clone them,
// release the request's copy, and charge the clone to newsk if it exists.
1461 newnp->pktoptions = NULL;
1462 if (treq->pktopts != NULL) {
1463 newnp->pktoptions = skb_clone(treq->pktopts, GFP_ATOMIC);
1464 kfree_skb(treq->pktopts);
1465 treq->pktopts = NULL;
1466 if (newnp->pktoptions)
1467 skb_set_owner_r(newnp->pktoptions, newsk);
1470 newnp->mcast_oif = inet6_iif(skb);
1471 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1473 /* Clone native IPv6 options from listening socket (if any)
1475 Yes, keeping reference count would be much more clever,
1476 but we make one more one thing there: reattach optmem
1480 newnp->opt = ipv6_dup_options(newsk, opt);
1482 sock_kfree_s(sk, opt, opt->tot_len);
// icsk_ext_hdr_len is zero by default and otherwise the sum of the
// option lengths held in newnp->opt (the condition line is elided).
1485 inet_csk(newsk)->icsk_ext_hdr_len = 0;
1487 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1488 newnp->opt->opt_flen);
// MSS setup from the route: advmss comes from the dst metric and is
// lowered to the listener's user_mss when that is set and smaller.
1490 tcp_mtup_init(newsk);
1491 tcp_sync_mss(newsk, dst_mtu(dst));
1492 newtp->advmss = dst_metric_advmss(dst);
1493 if (tcp_sk(sk)->rx_opt.user_mss &&
1494 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1495 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1497 tcp_initialize_rcv_mss(newsk);
// If the SYN-ACK send time was recorded on the request, pass the elapsed
// time to tcp_valid_rtt_meas().
1498 if (tcp_rsk(req)->snt_synack)
1499 tcp_valid_rtt_meas(newsk,
1500 tcp_time_stamp - tcp_rsk(req)->snt_synack);
1501 newtp->total_retrans = req->retrans;
// The IPv4 address fields of the child are filled with LOOPBACK4_IPV6.
1503 newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1504 newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
1506 #ifdef CONFIG_TCP_MD5SIG
1507 /* Copy over the MD5 key from the original socket */
1508 if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1509 /* We're using one, so create a matching key
1510 * on the newsk structure. If we fail to get
1511 * memory, then we end up not copying the key
1514 char *newkey = kmemdup(key->key, key->keylen, GFP_ATOMIC);
1516 tcp_v6_md5_do_add(newsk, &newnp->daddr,
1517 newkey, key->keylen);
// If the listener's port cannot be inherited, the child is prepared for a
// forced close.
1521 if (__inet_inherit_port(sk, newsk) < 0) {
1522 inet_csk_prepare_forced_close(newsk);
1526 __inet6_hash(newsk, NULL);
// LISTENOVERFLOWS and LISTENDROPS accounting; the labels and returns
// around these lines are elided in this listing.
1531 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
1533 if (opt && opt != np->opt)
1534 sock_kfree_s(sk, opt, opt->tot_len);
1537 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
// tcp_v6_checksum_init - set up checksum state for a received TCP segment.
// @skb: the segment
// Returns a __sum16. NOTE(review): only one return statement is visible in
// this listing; the others are elided.
1541 static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
// With CHECKSUM_COMPLETE, a zero result from tcp_v6_check() over skb->csum
// marks the skb as CHECKSUM_UNNECESSARY.
1543 if (skb->ip_summed == CHECKSUM_COMPLETE) {
1544 if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
1545 &ipv6_hdr(skb)->daddr, skb->csum)) {
1546 skb->ip_summed = CHECKSUM_UNNECESSARY;
// skb->csum is set to the complemented, unfolded pseudo-header checksum.
1551 skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
1552 &ipv6_hdr(skb)->saddr,
1553 &ipv6_hdr(skb)->daddr, 0));
// Segments of at most 76 bytes are verified immediately.
1555 if (skb->len <= 76) {
1556 return __skb_checksum_complete(skb);
1561 /* The socket must have its spinlock held when we get
1564 * We have a potential double-lock case here, so even when
1565 * doing backlog processing we use the BH locking scheme.
1566 * This is because we cannot sleep with the original spinlock
// tcp_v6_do_rcv - process one segment for a socket. Also installed as the
// backlog_rcv handler in tcpv6_prot.
// @sk:  socket the segment belongs to
// @skb: the segment
// Returns int. NOTE(review): the return statements, labels and several
// branch targets are elided in this listing.
1569 static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1571 struct ipv6_pinfo *np = inet6_sk(sk);
1572 struct tcp_sock *tp;
1573 struct sk_buff *opt_skb = NULL;
1575 /* Imagine: socket is IPv6. IPv4 packet arrives,
1576 goes to IPv4 receive handler and backlogged.
1577 From backlog it always goes here. Kerboom...
1578 Fortunately, tcp_rcv_established and rcv_established
1579 handle them correctly, but it is not case with
1580 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
// IPv4 segments are handed straight to the IPv4 handler.
1583 if (skb->protocol == htons(ETH_P_IP))
1584 return tcp_v4_do_rcv(sk, skb);
// MD5 signature check (when configured) and socket filter; the statements
// taken when either check fires are elided.
1586 #ifdef CONFIG_TCP_MD5SIG
1587 if (tcp_v6_inbound_md5_hash (sk, skb))
1591 if (sk_filter(sk, skb))
1595 * socket locking is here for SMP purposes as backlog rcv
1596 * is currently called with bh processing disabled.
1599 /* Do Stevens' IPV6_PKTOPTIONS.
1601 Yes, guys, it is the only place in our code, where we
1602 may make it not affecting IPv4.
1603 The rest of code is protocol independent,
1604 and I do not like idea to uglify IPv4.
1606 Actually, all the idea behind IPV6_PKTOPTIONS
1607 looks not very well thought. For now we latch
1608 options, received in the last packet, enqueued
1609 by tcp. Feel free to propose better solution.
// A clone of the skb is kept so its IPv6 options can be latched after TCP
// has consumed the original (the guarding condition is elided).
1613 opt_skb = skb_clone(skb, GFP_ATOMIC);
1615 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
1616 sock_rps_save_rxhash(sk, skb);
1617 if (tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len))
1620 goto ipv6_pktoptions;
// Slow path: reject segments shorter than their TCP header or with a bad
// checksum.
1624 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
// Listening socket: tcp_v6_hnd_req() yields the socket that should take
// the segment, and tcp_child_process() feeds it to that socket.
1627 if (sk->sk_state == TCP_LISTEN) {
1628 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1633 * Queue it on the new socket if the new socket is active,
1634 * otherwise we just shortcircuit this and continue with
1638 sock_rps_save_rxhash(nsk, skb);
1639 if (tcp_child_process(sk, nsk, skb))
1642 __kfree_skb(opt_skb);
1646 sock_rps_save_rxhash(sk, skb);
1648 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1651 goto ipv6_pktoptions;
// Reset, discard and error accounting follow; their labels are elided.
1655 tcp_v6_send_reset(sk, skb);
1658 __kfree_skb(opt_skb);
1662 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1667 /* Do you ask, what is it?
1669 1. skb was enqueued by tcp.
1670 2. skb is added to tail of read queue, rather than out of order.
1671 3. socket is not in passive state.
1672 4. Finally, it really contains options, which user wants to receive.
// Options are latched only when the clone ends exactly at rcv_nxt and the
// socket is neither CLOSE nor LISTEN. The incoming interface and hop limit
// are recorded when the matching rxopt bits are set, and an accepted clone
// is swapped into np->pktoptions.
1675 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1676 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
1677 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
1678 np->mcast_oif = inet6_iif(opt_skb);
1679 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
1680 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
1681 if (ipv6_opt_accepted(sk, opt_skb)) {
1682 skb_set_owner_r(opt_skb, sk);
1683 opt_skb = xchg(&np->pktoptions, opt_skb);
1685 __kfree_skb(opt_skb);
1686 opt_skb = xchg(&np->pktoptions, NULL);
// tcp_v6_rcv - entry point for received IPv6 TCP segments (registered as
// tcpv6_protocol.handler).
// @skb: the received segment
// Validates the TCP header, fills in TCP_SKB_CB(), looks up the owning
// socket and passes the segment to tcp_v6_do_rcv(), the prequeue or the
// socket backlog. The visible return yields -1 when ret is non-zero and 0
// otherwise.
// NOTE(review): labels, several gotos and some declarations are elided in
// this listing.
1694 static int tcp_v6_rcv(struct sk_buff *skb)
1696 const struct tcphdr *th;
1697 const struct ipv6hdr *hdr;
1700 struct net *net = dev_net(skb->dev);
1702 if (skb->pkt_type != PACKET_HOST)
1706 * Count it even if it's bad.
1708 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
// Header validation: the fixed header must be present, doff must cover at
// least the fixed header, the full header must be pullable, and the
// checksum state must initialise cleanly.
1710 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1715 if (th->doff < sizeof(struct tcphdr)/4)
1717 if (!pskb_may_pull(skb, th->doff*4))
1720 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
// Record sequence numbers and the DS field in the skb control block.
// end_seq counts SYN and FIN as one sequence number each.
1724 hdr = ipv6_hdr(skb);
1725 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1726 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1727 skb->len - th->doff*4);
1728 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1729 TCP_SKB_CB(skb)->when = 0;
1730 TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
1731 TCP_SKB_CB(skb)->sacked = 0;
1733 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
1738 if (sk->sk_state == TCP_TIME_WAIT)
// Drop segments whose hop limit is below the socket's min_hopcount.
1741 if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1742 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1743 goto discard_and_relse;
1746 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1747 goto discard_and_relse;
1749 if (sk_filter(sk, skb))
1750 goto discard_and_relse;
// With the socket lock held: if no user context owns the socket, the
// segment is processed now (directly, or via tcp_prequeue() when that
// accepts it); otherwise it goes to the backlog and is dropped if
// sk_add_backlog() fails.
1754 bh_lock_sock_nested(sk);
1756 if (!sock_owned_by_user(sk)) {
1757 #ifdef CONFIG_NET_DMA
1758 struct tcp_sock *tp = tcp_sk(sk);
1759 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
1760 tp->ucopy.dma_chan = dma_find_channel(DMA_MEMCPY);
1761 if (tp->ucopy.dma_chan)
1762 ret = tcp_v6_do_rcv(sk, skb);
1766 if (!tcp_prequeue(sk, skb))
1767 ret = tcp_v6_do_rcv(sk, skb);
1769 } else if (unlikely(sk_add_backlog(sk, skb))) {
1771 NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
1772 goto discard_and_relse;
1777 return ret ? -1 : 0;
// Path taken with a NULL socket: policy check, then either error accounting
// for a truncated or corrupt segment or a reset via tcp_v6_send_reset().
// NOTE(review): the label and the else between these lines are elided.
1780 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1783 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1785 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1787 tcp_v6_send_reset(NULL, skb);
// Time-wait handling: the time-wait reference is dropped on policy or
// sanity failures; otherwise the verdict of tcp_timewait_state_process()
// selects the action.
1804 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
1805 inet_twsk_put(inet_twsk(sk));
1809 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1810 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1811 inet_twsk_put(inet_twsk(sk));
1815 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
// A listener for the segment's destination is looked up and the time-wait
// socket is descheduled (the case label and condition are elided).
1820 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
1821 &ipv6_hdr(skb)->daddr,
1822 ntohs(th->dest), inet6_iif(skb));
1824 struct inet_timewait_sock *tw = inet_twsk(sk);
1825 inet_twsk_deschedule(tw, &tcp_death_row);
1830 /* Fall through to ACK */
1833 tcp_v6_timewait_ack(sk, skb);
1837 case TCP_TW_SUCCESS:;
// tcp_v6_get_peer - obtain the inet_peer entry for a socket's destination.
// @sk:         the socket
// @release_it: out flag; set to false on the path that returns the peer
//              bound to the cached route
// When the cached route's destination differs from np->daddr, the peer is
// looked up with inet_getpeer_v6(); otherwise a peer is bound to the route
// and rt->rt6i_peer is used.
// NOTE(review): the first half of the condition, the value stored in
// *release_it on the lookup path, and the return are elided in this listing.
1842 static struct inet_peer *tcp_v6_get_peer(struct sock *sk, bool *release_it)
1844 struct rt6_info *rt = (struct rt6_info *) __sk_dst_get(sk);
1845 struct ipv6_pinfo *np = inet6_sk(sk);
1846 struct inet_peer *peer;
1849 !ipv6_addr_equal(&np->daddr, &rt->rt6i_dst.addr)) {
1850 peer = inet_getpeer_v6(&np->daddr, 1);
1854 rt6_bind_peer(rt, 1);
1855 peer = rt->rt6i_peer;
1856 *release_it = false;
// tcp_v6_tw_get_peer - peer lookup for a time-wait socket (installed as
// tcp6_timewait_sock_ops.twsk_getpeer).
// @sk: the time-wait socket
// AF_INET time-wait sockets are delegated to tcp_v4_tw_get_peer(); all
// others are looked up by their IPv6 destination address.
1862 static void *tcp_v6_tw_get_peer(struct sock *sk)
1864 const struct inet6_timewait_sock *tw6 = inet6_twsk(sk);
1865 const struct inet_timewait_sock *tw = inet_twsk(sk);
1867 if (tw->tw_family == AF_INET)
1868 return tcp_v4_tw_get_peer(sk);
1870 return inet_getpeer_v6(&tw6->tw_v6_daddr, 1);
// Time-wait socket operations for TCP over IPv6; referenced from
// tcpv6_prot.twsk_prot. Objects are sized as struct tcp6_timewait_sock and
// only the peer lookup is IPv6-specific.
1873 static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1874 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
1875 .twsk_unique = tcp_twsk_unique,
1876 .twsk_destructor= tcp_twsk_destructor,
1877 .twsk_getpeer = tcp_v6_tw_get_peer,
// Address-family operations for native IPv6 TCP sockets; installed as
// icsk_af_ops by tcp_v6_init_sock().
1880 static const struct inet_connection_sock_af_ops ipv6_specific = {
1881 .queue_xmit = inet6_csk_xmit,
1882 .send_check = tcp_v6_send_check,
1883 .rebuild_header = inet6_sk_rebuild_header,
1884 .conn_request = tcp_v6_conn_request,
1885 .syn_recv_sock = tcp_v6_syn_recv_sock,
1886 .get_peer = tcp_v6_get_peer,
1887 .net_header_len = sizeof(struct ipv6hdr),
1888 .setsockopt = ipv6_setsockopt,
1889 .getsockopt = ipv6_getsockopt,
1890 .addr2sockaddr = inet6_csk_addr2sockaddr,
1891 .sockaddr_len = sizeof(struct sockaddr_in6),
1892 .bind_conflict = inet6_csk_bind_conflict,
1893 #ifdef CONFIG_COMPAT
1894 .compat_setsockopt = compat_ipv6_setsockopt,
1895 .compat_getsockopt = compat_ipv6_getsockopt,
// MD5 signature operations for native IPv6 TCP sockets; installed as
// tp->af_specific by tcp_v6_init_sock(). Built only with CONFIG_TCP_MD5SIG.
1899 #ifdef CONFIG_TCP_MD5SIG
1900 static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
1901 .md5_lookup = tcp_v6_md5_lookup,
1902 .calc_md5_hash = tcp_v6_md5_hash_skb,
1903 .md5_add = tcp_v6_md5_add_func,
1904 .md5_parse = tcp_v6_parse_md5_keys,
1909 * TCP over IPv4 via INET6 API
// Address-family operations for IPv4 traffic carried on an AF_INET6 socket;
// tcp_v6_syn_recv_sock() installs this on v4-mapped children. Transmit,
// checksum, header rebuild and peer lookup use the IPv4 helpers, while
// socket options, address reporting and bind conflicts stay with the IPv6
// helpers.
1912 static const struct inet_connection_sock_af_ops ipv6_mapped = {
1913 .queue_xmit = ip_queue_xmit,
1914 .send_check = tcp_v4_send_check,
1915 .rebuild_header = inet_sk_rebuild_header,
1916 .conn_request = tcp_v6_conn_request,
1917 .syn_recv_sock = tcp_v6_syn_recv_sock,
1918 .get_peer = tcp_v4_get_peer,
1919 .net_header_len = sizeof(struct iphdr),
1920 .setsockopt = ipv6_setsockopt,
1921 .getsockopt = ipv6_getsockopt,
1922 .addr2sockaddr = inet6_csk_addr2sockaddr,
1923 .sockaddr_len = sizeof(struct sockaddr_in6),
1924 .bind_conflict = inet6_csk_bind_conflict,
1925 #ifdef CONFIG_COMPAT
1926 .compat_setsockopt = compat_ipv6_setsockopt,
1927 .compat_getsockopt = compat_ipv6_getsockopt,
// MD5 signature operations for v4-mapped sockets; installed on mapped
// children by tcp_v6_syn_recv_sock(). Key lookup and hashing use the IPv4
// helpers, while adding and parsing keys go through the IPv6 helpers.
1931 #ifdef CONFIG_TCP_MD5SIG
1932 static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
1933 .md5_lookup = tcp_v4_md5_lookup,
1934 .calc_md5_hash = tcp_v4_md5_hash_skb,
1935 .md5_add = tcp_v6_md5_add_func,
1936 .md5_parse = tcp_v6_parse_md5_keys,
1940 /* NOTE: A lot of things set to zero explicitly by call to
1941 * sk_alloc() so need not be done here.
// tcp_v6_init_sock - initialise a newly created IPv6 TCP socket (installed
// as tcpv6_prot.init).
// @sk: the socket to initialise
// Returns int. NOTE(review): the return statement and a few assignments are
// elided in this listing.
1943 static int tcp_v6_init_sock(struct sock *sk)
1945 struct inet_connection_sock *icsk = inet_csk(sk);
1946 struct tcp_sock *tp = tcp_sk(sk);
1948 skb_queue_head_init(&tp->out_of_order_queue);
1949 tcp_init_xmit_timers(sk);
1950 tcp_prequeue_init(tp);
// The retransmit timeout and mdev both start at TCP_TIMEOUT_INIT.
1952 icsk->icsk_rto = TCP_TIMEOUT_INIT;
1953 tp->mdev = TCP_TIMEOUT_INIT;
1955 /* So many TCP implementations out there (incorrectly) count the
1956 * initial SYN frame in their delayed-ACK and congestion control
1957 * algorithms that we must have the following bandaid to talk
1958 * efficiently to them. -DaveM
1962 /* See draft-stevens-tcpca-spec-01 for discussion of the
1963 * initialization of these values.
1965 tp->snd_ssthresh = TCP_INFINITE_SSTHRESH;
1966 tp->snd_cwnd_clamp = ~0;
1967 tp->mss_cache = TCP_MSS_DEFAULT;
1969 tp->reordering = sysctl_tcp_reordering;
1971 sk->sk_state = TCP_CLOSE;
// Native IPv6 af_ops and the initial congestion-control ops.
1973 icsk->icsk_af_ops = &ipv6_specific;
1974 icsk->icsk_ca_ops = &tcp_init_congestion_ops;
1975 icsk->icsk_sync_mss = tcp_sync_mss;
1976 sk->sk_write_space = sk_stream_write_space;
1977 sock_set_flag(sk, SOCK_USE_WRITE_QUEUE);
1979 #ifdef CONFIG_TCP_MD5SIG
1980 tp->af_specific = &tcp_sock_ipv6_specific;
1983 /* TCP Cookie Transactions */
// When the cookie sysctl is positive, a zeroed cookie_values object is
// allocated. Allocation failure is tolerated, and the kref is initialised
// only on success.
1984 if (sysctl_tcp_cookie_size > 0) {
1985 /* Default, cookies without s_data_payload. */
1987 kzalloc(sizeof(*tp->cookie_values),
1989 if (tp->cookie_values != NULL)
1990 kref_init(&tp->cookie_values->kref);
1992 /* Presumed zeroed, in order of appearance:
1993 * cookie_in_always, cookie_out_never,
1994 * s_data_constant, s_data_in, s_data_out
// Send and receive buffer sizes come from index 1 of the wmem and rmem
// sysctl arrays.
1996 sk->sk_sndbuf = sysctl_tcp_wmem[1];
1997 sk->sk_rcvbuf = sysctl_tcp_rmem[1];
2000 percpu_counter_inc(&tcp_sockets_allocated);
// tcp_v6_destroy_sock - tear down an IPv6 TCP socket (installed as
// tcpv6_prot.destroy).
// @sk: the socket being destroyed
// Clears the MD5 key list when one exists, then runs the IPv4 TCP
// destructor followed by the generic IPv6 socket destructor.
2006 static void tcp_v6_destroy_sock(struct sock *sk)
2008 #ifdef CONFIG_TCP_MD5SIG
2009 /* Clean up the MD5 key list */
2010 if (tcp_sk(sk)->md5sig_info)
2011 tcp_v6_clear_md5_list(sk);
2013 tcp_v4_destroy_sock(sk);
2014 inet6_destroy_sock(sk);
2017 #ifdef CONFIG_PROC_FS
2018 /* Proc filesystem TCPv6 sock list dumping. */
// get_openreq6 - emit one line of the TCPv6 socket listing for a pending
// connection request.
// @seq: output seq_file
// @sk:  socket the request belongs to
// @req: the request to print
// @i:   entry number
// @uid: owner uid
// Addresses are printed as four 32-bit hex words each, followed by the
// port. Fields without meaning for a request are printed as constants.
// NOTE(review): some argument lines of the print call are elided here.
2019 static void get_openreq6(struct seq_file *seq,
2020 const struct sock *sk, struct request_sock *req, int i, int uid)
// Time left until the request expires, in jiffies.
2022 int ttd = req->expires - jiffies;
2023 const struct in6_addr *src = &inet6_rsk(req)->loc_addr;
2024 const struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
2030 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
2031 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
2033 src->s6_addr32[0], src->s6_addr32[1],
2034 src->s6_addr32[2], src->s6_addr32[3],
2035 ntohs(inet_rsk(req)->loc_port),
2036 dest->s6_addr32[0], dest->s6_addr32[1],
2037 dest->s6_addr32[2], dest->s6_addr32[3],
2038 ntohs(inet_rsk(req)->rmt_port),
2040 0,0, /* could print option size, but that is af dependent. */
2041 1, /* timers active (only the expire timer) */
2042 jiffies_to_clock_t(ttd),
2045 0, /* non standard timer */
2046 0, /* open_requests have no inode */
// get_tcp6_sock - emit one line of the TCPv6 socket listing for a full
// socket.
// @seq: output seq_file
// @sp:  socket to print
// @i:   entry number
// NOTE(review): some declarations and argument lines are elided in this
// listing.
2050 static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
2052 const struct in6_addr *dest, *src;
2055 unsigned long timer_expires;
2056 const struct inet_sock *inet = inet_sk(sp);
2057 const struct tcp_sock *tp = tcp_sk(sp);
2058 const struct inet_connection_sock *icsk = inet_csk(sp);
2059 const struct ipv6_pinfo *np = inet6_sk(sp);
2062 src = &np->rcv_saddr;
2063 destp = ntohs(inet->inet_dport);
2064 srcp = ntohs(inet->inet_sport);
// Choose the expiry time to report: the icsk timeout for a pending
// ICSK_TIME_RETRANS or ICSK_TIME_PROBE0 timer, sk_timer when that is
// pending, and the current jiffies otherwise.
2066 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
2068 timer_expires = icsk->icsk_timeout;
2069 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
2071 timer_expires = icsk->icsk_timeout;
2072 } else if (timer_pending(&sp->sk_timer)) {
2074 timer_expires = sp->sk_timer.expires;
2077 timer_expires = jiffies;
2081 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
2082 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %pK %lu %lu %u %u %d\n",
2084 src->s6_addr32[0], src->s6_addr32[1],
2085 src->s6_addr32[2], src->s6_addr32[3], srcp,
2086 dest->s6_addr32[0], dest->s6_addr32[1],
2087 dest->s6_addr32[2], dest->s6_addr32[3], destp,
// Transmit queue is write_seq minus snd_una. The receive column shows the
// accept backlog for listeners and unread bytes otherwise.
2089 tp->write_seq-tp->snd_una,
2090 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
2092 jiffies_to_clock_t(timer_expires - jiffies),
2093 icsk->icsk_retransmits,
2095 icsk->icsk_probes_out,
2097 atomic_read(&sp->sk_refcnt), sp,
2098 jiffies_to_clock_t(icsk->icsk_rto),
2099 jiffies_to_clock_t(icsk->icsk_ack.ato),
2100 (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
// ssthresh is reported as -1 while tcp_in_initial_slowstart() holds.
2102 tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh
// get_timewait6_sock - emit one line of the TCPv6 socket listing for a
// time-wait socket.
// @seq: output seq_file
// @tw:  time-wait socket to print
// @i:   entry number
// Queue sizes, retransmit, uid, timeout and inode columns are printed as
// zero, and the timer column is the constant 3.
// NOTE(review): some declarations and any adjustment of ttd are elided in
// this listing.
2106 static void get_timewait6_sock(struct seq_file *seq,
2107 struct inet_timewait_sock *tw, int i)
2109 const struct in6_addr *dest, *src;
2111 const struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
// Time left in TIME_WAIT, in jiffies.
2112 int ttd = tw->tw_ttd - jiffies;
2117 dest = &tw6->tw_v6_daddr;
2118 src = &tw6->tw_v6_rcv_saddr;
2119 destp = ntohs(tw->tw_dport);
2120 srcp = ntohs(tw->tw_sport);
2123 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
2124 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
2126 src->s6_addr32[0], src->s6_addr32[1],
2127 src->s6_addr32[2], src->s6_addr32[3], srcp,
2128 dest->s6_addr32[0], dest->s6_addr32[1],
2129 dest->s6_addr32[2], dest->s6_addr32[3], destp,
2130 tw->tw_substate, 0, 0,
2131 3, jiffies_to_clock_t(ttd), 0, 0, 0, 0,
2132 atomic_read(&tw->tw_refcnt), tw);
// tcp6_seq_show - seq_file show callback for the TCPv6 socket listing
// (installed as tcp6_seq_afinfo.show).
// @seq: output seq_file
// @v:   SEQ_START_TOKEN for the header line, otherwise the current entry
// Dispatches on the iterator state to the matching per-type printer.
// NOTE(review): the header print call, the break statements and the return
// are elided in this listing.
2135 static int tcp6_seq_show(struct seq_file *seq, void *v)
2137 struct tcp_iter_state *st;
2139 if (v == SEQ_START_TOKEN) {
2144 "st tx_queue rx_queue tr tm->when retrnsmt"
2145 " uid timeout inode\n");
2150 switch (st->state) {
// Listening and established sockets share one printer.
2151 case TCP_SEQ_STATE_LISTENING:
2152 case TCP_SEQ_STATE_ESTABLISHED:
2153 get_tcp6_sock(seq, v, st->num);
2155 case TCP_SEQ_STATE_OPENREQ:
2156 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
2158 case TCP_SEQ_STATE_TIME_WAIT:
2159 get_timewait6_sock(seq, v, st->num);
// File operations for the TCPv6 proc listing; referenced from
// tcp6_seq_afinfo.seq_fops. One initialiser line is elided in this listing.
2166 static const struct file_operations tcp6_afinfo_seq_fops = {
2167 .owner = THIS_MODULE,
2168 .open = tcp_seq_open,
2170 .llseek = seq_lseek,
2171 .release = seq_release_net
// Descriptor passed to tcp_proc_register() and tcp_proc_unregister() for
// the TCPv6 listing. Only the file operations and the show callback are
// visible here; the other initialiser lines are elided.
2174 static struct tcp_seq_afinfo tcp6_seq_afinfo = {
2177 .seq_fops = &tcp6_afinfo_seq_fops,
2179 .show = tcp6_seq_show,
// tcp6_proc_init - register the TCPv6 proc listing for a network namespace.
// @net: the namespace
// Returns the result of tcp_proc_register().
2183 int __net_init tcp6_proc_init(struct net *net)
2185 return tcp_proc_register(net, &tcp6_seq_afinfo);
// tcp6_proc_exit - remove the TCPv6 proc listing from a network namespace.
// @net: the namespace
2188 void tcp6_proc_exit(struct net *net)
2190 tcp_proc_unregister(net, &tcp6_seq_afinfo);
// tcp_v6_clear_sk - clear a socket object while leaving its pinet6 pointer
// untouched (installed as tcpv6_prot.clear_sk).
// @sk:   socket to clear
// @size: total object size in bytes
2194 static void tcp_v6_clear_sk(struct sock *sk, int size)
2196 struct inet_sock *inet = inet_sk(sk);
2198 /* we do not want to clear pinet6 field, because of RCU lookups */
// Everything before pinet6 is handled by sk_prot_clear_nulls().
2199 sk_prot_clear_nulls(sk, offsetof(struct inet_sock, pinet6));
// The remainder after the pinet6 pointer is zeroed directly.
2201 size -= offsetof(struct inet_sock, pinet6) + sizeof(inet->pinet6);
2202 memset(&inet->pinet6 + 1, 0, size);
// Protocol descriptor for TCP over IPv6; referenced from tcpv6_protosw.prot.
// Most handlers are the shared TCP ones. The IPv6-specific entries are
// connect, init, destroy, backlog_rcv, hash, clear_sk, the object size, and
// the time-wait and request-sock ops.
// NOTE(review): a few initialiser lines are elided in this listing.
2205 struct proto tcpv6_prot = {
2207 .owner = THIS_MODULE,
2209 .connect = tcp_v6_connect,
2210 .disconnect = tcp_disconnect,
2211 .accept = inet_csk_accept,
2213 .init = tcp_v6_init_sock,
2214 .destroy = tcp_v6_destroy_sock,
2215 .shutdown = tcp_shutdown,
2216 .setsockopt = tcp_setsockopt,
2217 .getsockopt = tcp_getsockopt,
2218 .recvmsg = tcp_recvmsg,
2219 .sendmsg = tcp_sendmsg,
2220 .sendpage = tcp_sendpage,
2221 .backlog_rcv = tcp_v6_do_rcv,
2222 .hash = tcp_v6_hash,
2223 .unhash = inet_unhash,
2224 .get_port = inet_csk_get_port,
2225 .enter_memory_pressure = tcp_enter_memory_pressure,
2226 .sockets_allocated = &tcp_sockets_allocated,
2227 .memory_allocated = &tcp_memory_allocated,
2228 .memory_pressure = &tcp_memory_pressure,
2229 .orphan_count = &tcp_orphan_count,
2230 .sysctl_mem = sysctl_tcp_mem,
2231 .sysctl_wmem = sysctl_tcp_wmem,
2232 .sysctl_rmem = sysctl_tcp_rmem,
2233 .max_header = MAX_TCP_HEADER,
2234 .obj_size = sizeof(struct tcp6_sock),
2235 .slab_flags = SLAB_DESTROY_BY_RCU,
2236 .twsk_prot = &tcp6_timewait_sock_ops,
2237 .rsk_prot = &tcp6_request_sock_ops,
2238 .h.hashinfo = &tcp_hashinfo,
2239 .no_autobind = true,
2240 #ifdef CONFIG_COMPAT
2241 .compat_setsockopt = compat_tcp_setsockopt,
2242 .compat_getsockopt = compat_tcp_getsockopt,
2244 .clear_sk = tcp_v6_clear_sk,
// inet6 protocol hooks for TCP: receive and error handlers plus the GSO and
// GRO callbacks. Added by tcpv6_init() and removed by tcpv6_exit() under
// IPPROTO_TCP.
2247 static const struct inet6_protocol tcpv6_protocol = {
2248 .handler = tcp_v6_rcv,
2249 .err_handler = tcp_v6_err,
2250 .gso_send_check = tcp_v6_gso_send_check,
2251 .gso_segment = tcp_tso_segment,
2252 .gro_receive = tcp6_gro_receive,
2253 .gro_complete = tcp6_gro_complete,
2254 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
// Socket-switch entry binding SOCK_STREAM / IPPROTO_TCP to tcpv6_prot and
// the inet6 stream ops. Registered by tcpv6_init() and unregistered by
// tcpv6_exit().
// NOTE(review): the remainder of the flags expression is elided here.
2257 static struct inet_protosw tcpv6_protosw = {
2258 .type = SOCK_STREAM,
2259 .protocol = IPPROTO_TCP,
2260 .prot = &tcpv6_prot,
2261 .ops = &inet6_stream_ops,
2263 .flags = INET_PROTOSW_PERMANENT |
// tcpv6_net_init - per-namespace setup: create the control socket stored in
// net->ipv6.tcp_sk.
// @net: the namespace
// Returns the result of inet_ctl_sock_create().
2267 static int __net_init tcpv6_net_init(struct net *net)
2269 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
2270 SOCK_RAW, IPPROTO_TCP, net);
// tcpv6_net_exit - per-namespace teardown: destroy the control socket
// created by tcpv6_net_init().
// @net: the namespace
2273 static void __net_exit tcpv6_net_exit(struct net *net)
2275 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
// tcpv6_net_exit_batch - batched namespace teardown: purge AF_INET6
// time-wait sockets from the TCP hash tables.
// @net_exit_list: namespaces being torn down (not referenced by the
//                 visible body)
2278 static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
2280 inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
// Per-namespace operations for TCPv6; registered by tcpv6_init() and
// unregistered by tcpv6_exit().
2283 static struct pernet_operations tcpv6_net_ops = {
2284 .init = tcpv6_net_init,
2285 .exit = tcpv6_net_exit,
2286 .exit_batch = tcpv6_net_exit_batch,
// tcpv6_init - register TCP with the IPv6 stack.
// Registration order: the inet6 protocol handler, then the protosw entry,
// then the per-namespace operations. Returns int.
// NOTE(review): the conditions, labels and return are elided in this
// listing. The unwind calls appear as inet6_del_protocol() followed by
// inet6_unregister_protosw(). If the elided labels match the goto names
// (out_tcpv6_protocol first, out_tcpv6_protosw second), a protosw
// registration failure would unregister a protosw that was never
// registered, and a pernet failure would leave the protocol handler
// installed. Confirm the label order against the full file.
2289 int __init tcpv6_init(void)
2293 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2297 /* register inet6 protocol */
2298 ret = inet6_register_protosw(&tcpv6_protosw);
2300 goto out_tcpv6_protocol;
2302 ret = register_pernet_subsys(&tcpv6_net_ops);
2304 goto out_tcpv6_protosw;
2309 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2311 inet6_unregister_protosw(&tcpv6_protosw);
// tcpv6_exit - undo tcpv6_init() in reverse order: per-namespace
// operations, then the protosw entry, then the inet6 protocol handler.
2315 void tcpv6_exit(void)
2317 unregister_pernet_subsys(&tcpv6_net_ops);
2318 inet6_unregister_protosw(&tcpv6_protosw);
2319 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);