]> Pileus Git - ~andy/linux/blob - net/ipv6/tcp_ipv6.c
tcp: shrink tcp6_timewait_sock by one cache line
[~andy/linux] / net / ipv6 / tcp_ipv6.c
1 /*
2  *      TCP over IPv6
3  *      Linux INET6 implementation
4  *
5  *      Authors:
6  *      Pedro Roque             <roque@di.fc.ul.pt>
7  *
8  *      Based on:
9  *      linux/net/ipv4/tcp.c
10  *      linux/net/ipv4/tcp_input.c
11  *      linux/net/ipv4/tcp_output.c
12  *
13  *      Fixes:
14  *      Hideaki YOSHIFUJI       :       sin6_scope_id support
15  *      YOSHIFUJI Hideaki @USAGI and:   Support IPV6_V6ONLY socket option, which
16  *      Alexey Kuznetsov                allow both IPv4 and IPv6 sockets to bind
17  *                                      a single port at the same time.
18  *      YOSHIFUJI Hideaki @USAGI:       convert /proc/net/tcp6 to seq_file.
19  *
20  *      This program is free software; you can redistribute it and/or
21  *      modify it under the terms of the GNU General Public License
22  *      as published by the Free Software Foundation; either version
23  *      2 of the License, or (at your option) any later version.
24  */
25
26 #include <linux/bottom_half.h>
27 #include <linux/module.h>
28 #include <linux/errno.h>
29 #include <linux/types.h>
30 #include <linux/socket.h>
31 #include <linux/sockios.h>
32 #include <linux/net.h>
33 #include <linux/jiffies.h>
34 #include <linux/in.h>
35 #include <linux/in6.h>
36 #include <linux/netdevice.h>
37 #include <linux/init.h>
38 #include <linux/jhash.h>
39 #include <linux/ipsec.h>
40 #include <linux/times.h>
41 #include <linux/slab.h>
42
43 #include <linux/ipv6.h>
44 #include <linux/icmpv6.h>
45 #include <linux/random.h>
46
47 #include <net/tcp.h>
48 #include <net/ndisc.h>
49 #include <net/inet6_hashtables.h>
50 #include <net/inet6_connection_sock.h>
51 #include <net/ipv6.h>
52 #include <net/transp_v6.h>
53 #include <net/addrconf.h>
54 #include <net/ip6_route.h>
55 #include <net/ip6_checksum.h>
56 #include <net/inet_ecn.h>
57 #include <net/protocol.h>
58 #include <net/xfrm.h>
59 #include <net/snmp.h>
60 #include <net/dsfield.h>
61 #include <net/timewait_sock.h>
62 #include <net/netdma.h>
63 #include <net/inet_common.h>
64 #include <net/secure_seq.h>
65 #include <net/tcp_memcontrol.h>
66 #include <net/busy_poll.h>
67
68 #include <asm/uaccess.h>
69
70 #include <linux/proc_fs.h>
71 #include <linux/seq_file.h>
72
73 #include <linux/crypto.h>
74 #include <linux/scatterlist.h>
75
/*
 * Forward declarations for functions and operation tables that are
 * referenced in this file before the point where they are defined.
 */
76 static void     tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
77 static void     tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
78                                       struct request_sock *req);
79
80 static int      tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
81
/* Address-family operation tables; tcp_v6_connect() switches between them. */
82 static const struct inet_connection_sock_af_ops ipv6_mapped;
83 static const struct inet_connection_sock_af_ops ipv6_specific;
84 #ifdef CONFIG_TCP_MD5SIG
85 static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
86 static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
87 #else
/*
 * Stub used when TCP MD5 signatures are compiled out: there is never a key,
 * so the lookup always yields NULL. It lets callers outside the
 * CONFIG_TCP_MD5SIG sections (e.g. tcp_v6_reqsk_send_ack()) call the lookup
 * unconditionally.
 */
88 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
89                                                    const struct in6_addr *addr)
90 {
91         return NULL;
92 }
93 #endif
94
95 static void inet6_sk_rx_dst_set(struct sock *sk, const struct sk_buff *skb)
96 {
97         struct dst_entry *dst = skb_dst(skb);
98         const struct rt6_info *rt = (const struct rt6_info *)dst;
99
100         dst_hold(dst);
101         sk->sk_rx_dst = dst;
102         inet_sk(sk)->rx_dst_ifindex = skb->skb_iif;
103         if (rt->rt6i_node)
104                 inet6_sk(sk)->rx_dst_cookie = rt->rt6i_node->fn_sernum;
105 }
106
107 static void tcp_v6_hash(struct sock *sk)
108 {
109         if (sk->sk_state != TCP_CLOSE) {
110                 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
111                         tcp_prot.hash(sk);
112                         return;
113                 }
114                 local_bh_disable();
115                 __inet6_hash(sk, NULL);
116                 local_bh_enable();
117         }
118 }
119
120 static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
121 {
122         return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
123                                             ipv6_hdr(skb)->saddr.s6_addr32,
124                                             tcp_hdr(skb)->dest,
125                                             tcp_hdr(skb)->source);
126 }
127
/*
 * tcp_v6_connect - start an active open towards the address in @uaddr.
 * @sk:       socket to connect
 * @uaddr:    destination, interpreted as a struct sockaddr_in6; it may be
 *            rewritten in place (flow-label destination, any -> loopback)
 * @addr_len: size of @uaddr, must be at least SIN6_LEN_RFC2133
 *
 * IPv4-mapped destinations are handed to tcp_v4_connect() after switching
 * the socket to the ipv6_mapped operations. For all other destinations a
 * route is looked up, the source address is settled, the socket is moved to
 * TCP_SYN_SENT and hashed, and tcp_connect() is called.
 *
 * Returns 0 on success or a negative errno. Failures that pass through the
 * "failure" label also clear inet_dport and sk_route_caps.
 */
128 static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
129                           int addr_len)
130 {
131         struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
132         struct inet_sock *inet = inet_sk(sk);
133         struct inet_connection_sock *icsk = inet_csk(sk);
134         struct ipv6_pinfo *np = inet6_sk(sk);
135         struct tcp_sock *tp = tcp_sk(sk);
136         struct in6_addr *saddr = NULL, *final_p, final;
137         struct rt6_info *rt;
138         struct flowi6 fl6;
139         struct dst_entry *dst;
140         int addr_type;
141         int err;
142
143         if (addr_len < SIN6_LEN_RFC2133)
144                 return -EINVAL;
145
146         if (usin->sin6_family != AF_INET6)
147                 return -EAFNOSUPPORT;
148
149         memset(&fl6, 0, sizeof(fl6));
150
            /*
             * With flow labels enabled on the socket, take the label from
             * sin6_flowinfo. A non-zero label must be one the socket knows;
             * its recorded destination then replaces the caller's address.
             */
151         if (np->sndflow) {
152                 fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
153                 IP6_ECN_flow_init(fl6.flowlabel);
154                 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
155                         struct ip6_flowlabel *flowlabel;
156                         flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
157                         if (flowlabel == NULL)
158                                 return -EINVAL;
159                         usin->sin6_addr = flowlabel->dst;
160                         fl6_sock_release(flowlabel);
161                 }
162         }
163
164         /*
165          *      connect() to INADDR_ANY means loopback (BSD'ism).
166          */
167
168         if(ipv6_addr_any(&usin->sin6_addr))
169                 usin->sin6_addr.s6_addr[15] = 0x1;
170
171         addr_type = ipv6_addr_type(&usin->sin6_addr);
172
173         if(addr_type & IPV6_ADDR_MULTICAST)
174                 return -ENETUNREACH;
175
176         if (addr_type&IPV6_ADDR_LINKLOCAL) {
                    /* sin6_scope_id is only read when the caller passed a full sockaddr_in6. */
177                 if (addr_len >= sizeof(struct sockaddr_in6) &&
178                     usin->sin6_scope_id) {
179                         /* If interface is set while binding, indices
180                          * must coincide.
181                          */
182                         if (sk->sk_bound_dev_if &&
183                             sk->sk_bound_dev_if != usin->sin6_scope_id)
184                                 return -EINVAL;
185
186                         sk->sk_bound_dev_if = usin->sin6_scope_id;
187                 }
188
189                 /* Connect to link-local address requires an interface */
190                 if (!sk->sk_bound_dev_if)
191                         return -EINVAL;
192         }
193
            /*
             * Timestamp state is remembered but the new destination differs
             * from the stored one: discard that state and the write sequence.
             */
194         if (tp->rx_opt.ts_recent_stamp &&
195             !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
196                 tp->rx_opt.ts_recent = 0;
197                 tp->rx_opt.ts_recent_stamp = 0;
198                 tp->write_seq = 0;
199         }
200
201         np->daddr = usin->sin6_addr;
202         np->flow_label = fl6.flowlabel;
203
204         /*
205          *      TCP over IPv4
206          */
207
208         if (addr_type == IPV6_ADDR_MAPPED) {
                    /* Saved so it can be restored if the IPv4 connect fails. */
209                 u32 exthdrlen = icsk->icsk_ext_hdr_len;
210                 struct sockaddr_in sin;
211
212                 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
213
214                 if (__ipv6_only_sock(sk))
215                         return -ENETUNREACH;
216
                    /* Build the IPv4 destination from the last 32 bits of the mapped address. */
217                 sin.sin_family = AF_INET;
218                 sin.sin_port = usin->sin6_port;
219                 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
220
                    /* Switch the socket to the mapped operations before calling the IPv4 code. */
221                 icsk->icsk_af_ops = &ipv6_mapped;
222                 sk->sk_backlog_rcv = tcp_v4_do_rcv;
223 #ifdef CONFIG_TCP_MD5SIG
224                 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
225 #endif
226
227                 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
228
229                 if (err) {
                            /* Undo the switch: back to the native IPv6 operations. */
230                         icsk->icsk_ext_hdr_len = exthdrlen;
231                         icsk->icsk_af_ops = &ipv6_specific;
232                         sk->sk_backlog_rcv = tcp_v6_do_rcv;
233 #ifdef CONFIG_TCP_MD5SIG
234                         tp->af_specific = &tcp_sock_ipv6_specific;
235 #endif
236                         goto failure;
237                 } else {
                            /* Mirror the IPv4 source addresses into the IPv6 fields in mapped form. */
238                         ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
239                         ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
240                                                &np->rcv_saddr);
241                 }
242
243                 return err;
244         }
245
            /* Use the receive source address as the flow source if one is already set. */
246         if (!ipv6_addr_any(&np->rcv_saddr))
247                 saddr = &np->rcv_saddr;
248
            /* Describe the flow for the route lookup. */
249         fl6.flowi6_proto = IPPROTO_TCP;
250         fl6.daddr = np->daddr;
251         fl6.saddr = saddr ? *saddr : np->saddr;
252         fl6.flowi6_oif = sk->sk_bound_dev_if;
253         fl6.flowi6_mark = sk->sk_mark;
254         fl6.fl6_dport = usin->sin6_port;
255         fl6.fl6_sport = inet->inet_sport;
256
257         final_p = fl6_update_dst(&fl6, np->opt, &final);
258
259         security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
260
261         dst = ip6_dst_lookup_flow(sk, &fl6, final_p, true);
262         if (IS_ERR(dst)) {
263                 err = PTR_ERR(dst);
264                 goto failure;
265         }
266
            /*
             * No source address was set beforehand: adopt fl6.saddr
             * (presumably filled in by the route lookup above).
             */
267         if (saddr == NULL) {
268                 saddr = &fl6.saddr;
269                 np->rcv_saddr = *saddr;
270         }
271
272         /* set the source address */
273         np->saddr = *saddr;
274         inet->inet_rcv_saddr = LOOPBACK4_IPV6;
275
276         sk->sk_gso_type = SKB_GSO_TCPV6;
277         __ip6_dst_store(sk, dst, NULL, NULL);
278
            /*
             * With tw_recycle enabled and no timestamp state yet, try to fetch
             * it via tcp_fetch_timewait_stamp(), but only when the route's
             * destination address is exactly the peer.
             */
279         rt = (struct rt6_info *) dst;
280         if (tcp_death_row.sysctl_tw_recycle &&
281             !tp->rx_opt.ts_recent_stamp &&
282             ipv6_addr_equal(&rt->rt6i_dst.addr, &np->daddr))
283                 tcp_fetch_timewait_stamp(sk, dst);
284
            /* Extension header length is the sum of both option lengths, or 0 without options. */
285         icsk->icsk_ext_hdr_len = 0;
286         if (np->opt)
287                 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
288                                           np->opt->opt_nflen);
289
            /* Clamp the MSS to what fits in IPV6_MIN_MTU after the TCP and IPv6 headers. */
290         tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
291
292         inet->inet_dport = usin->sin6_port;
293
294         tcp_set_state(sk, TCP_SYN_SENT);
295         err = inet6_hash_connect(&tcp_death_row, sk);
296         if (err)
297                 goto late_failure;
298
            /* Pick an initial sequence number unless one is already set or the socket is in repair mode. */
299         if (!tp->write_seq && likely(!tp->repair))
300                 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
301                                                              np->daddr.s6_addr32,
302                                                              inet->inet_sport,
303                                                              inet->inet_dport);
304
305         err = tcp_connect(sk);
306         if (err)
307                 goto late_failure;
308
309         return 0;
310
    /* Reached after the socket entered TCP_SYN_SENT: close it and reset its stored route. */
311 late_failure:
312         tcp_set_state(sk, TCP_CLOSE);
313         __sk_dst_reset(sk);
    /* Common failure exit: forget the destination port and route capabilities. */
314 failure:
315         inet->inet_dport = 0;
316         sk->sk_route_caps = 0;
317         return err;
318 }
319
320 static void tcp_v6_mtu_reduced(struct sock *sk)
321 {
322         struct dst_entry *dst;
323
324         if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
325                 return;
326
327         dst = inet6_csk_update_pmtu(sk, tcp_sk(sk)->mtu_info);
328         if (!dst)
329                 return;
330
331         if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
332                 tcp_sync_mss(sk, dst_mtu(dst));
333                 tcp_simple_retransmit(sk);
334         }
335 }
336
/*
 * tcp_v6_err - handle an ICMPv6 message that quotes one of our TCP segments.
 * @skb:    the ICMPv6 packet; skb->data is read as the quoted IPv6 header
 * @opt:    not used in this function
 * @type:   ICMPv6 type (NDISC_REDIRECT and ICMPV6_PKT_TOOBIG get special
 *          treatment, everything else is converted to an errno)
 * @code:   ICMPv6 code, passed to icmpv6_err_convert()
 * @offset: offset from skb->data to the quoted TCP header
 * @info:   extra ICMPv6 data; used as the new MTU for ICMPV6_PKT_TOOBIG
 *
 * The socket is looked up from the quoted addresses and ports. Except for
 * the early returns (no socket, timewait socket) the function leaves through
 * "out", which unlocks the socket and drops a reference on it.
 */
337 static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
338                 u8 type, u8 code, int offset, __be32 info)
339 {
340         const struct ipv6hdr *hdr = (const struct ipv6hdr*)skb->data;
341         const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
342         struct ipv6_pinfo *np;
343         struct sock *sk;
344         int err;
345         struct tcp_sock *tp;
346         __u32 seq;
347         struct net *net = dev_net(skb->dev);
348
            /* The quoted segment was sent by us, so its destination is the peer. */
349         sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
350                         th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
351
352         if (sk == NULL) {
353                 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
354                                    ICMP6_MIB_INERRORS);
355                 return;
356         }
357
            /* Timewait sockets are not processed further; just release the reference. */
358         if (sk->sk_state == TCP_TIME_WAIT) {
359                 inet_twsk_put(inet_twsk(sk));
360                 return;
361         }
362
363         bh_lock_sock(sk);
            /* Only counted here; processing continues and each case below re-checks ownership. */
364         if (sock_owned_by_user(sk) && type != ICMPV6_PKT_TOOBIG)
365                 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
366
367         if (sk->sk_state == TCP_CLOSE)
368                 goto out;
369
            /* Drop messages whose hop limit is below the socket's configured minimum. */
370         if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
371                 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
372                 goto out;
373         }
374
            /*
             * For non-listening sockets the quoted sequence number must lie
             * between snd_una and snd_nxt, otherwise the message is ignored.
             */
375         tp = tcp_sk(sk);
376         seq = ntohl(th->seq);
377         if (sk->sk_state != TCP_LISTEN &&
378             !between(seq, tp->snd_una, tp->snd_nxt)) {
379                 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
380                 goto out;
381         }
382
383         np = inet6_sk(sk);
384
            /* Redirects are forwarded to the socket's cached route, if it is still valid. */
385         if (type == NDISC_REDIRECT) {
386                 struct dst_entry *dst = __sk_dst_check(sk, np->dst_cookie);
387
388                 if (dst)
389                         dst->ops->redirect(dst, sk, skb);
390                 goto out;
391         }
392
393         if (type == ICMPV6_PKT_TOOBIG) {
394                 /* We are not interested in TCP_LISTEN and open_requests
395                  * (SYN-ACKs send out by Linux are always <576bytes so
396                  * they should go through unfragmented).
397                  */
398                 if (sk->sk_state == TCP_LISTEN)
399                         goto out;
400
                    /*
                     * Record the reported MTU. Handle it now if the socket is
                     * not owned by user context; otherwise set the deferred
                     * flag and, if it was newly set, take an extra reference
                     * (presumably dropped when the deferred work runs).
                     */
401                 tp->mtu_info = ntohl(info);
402                 if (!sock_owned_by_user(sk))
403                         tcp_v6_mtu_reduced(sk);
404                 else if (!test_and_set_bit(TCP_MTU_REDUCED_DEFERRED,
405                                            &tp->tsq_flags))
406                         sock_hold(sk);
407                 goto out;
408         }
409
            /* Translate the ICMPv6 type/code into an errno stored in err. */
410         icmpv6_err_convert(type, code, &err);
411
412         /* Might be for an request_sock */
413         switch (sk->sk_state) {
414                 struct request_sock *req, **prev;
415         case TCP_LISTEN:
416                 if (sock_owned_by_user(sk))
417                         goto out;
418
419                 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
420                                            &hdr->saddr, inet6_iif(skb));
421                 if (!req)
422                         goto out;
423
424                 /* ICMPs are not backlogged, hence we cannot get
425                  * an established socket here.
426                  */
427                 WARN_ON(req->sk != NULL);
428
                    /* The quoted sequence number must match the ISN we sent for this request. */
429                 if (seq != tcp_rsk(req)->snt_isn) {
430                         NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
431                         goto out;
432                 }
433
434                 inet_csk_reqsk_queue_drop(sk, req, prev);
435                 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
436                 goto out;
437
438         case TCP_SYN_SENT:
439         case TCP_SYN_RECV:  /* Cannot happen.
440                                It can, it SYNs are crossed. --ANK */
                    /* Not owned by user: report the error and finish the socket; otherwise only note a soft error. */
441                 if (!sock_owned_by_user(sk)) {
442                         sk->sk_err = err;
443                         sk->sk_error_report(sk);                /* Wake people up to see the error (see connect in sock.c) */
444
445                         tcp_done(sk);
446                 } else
447                         sk->sk_err_soft = err;
448                 goto out;
449         }
450
            /*
             * All remaining states: report a hard error only when the socket
             * is not owned by user context and np->recverr is set; otherwise
             * record it as a soft error.
             */
451         if (!sock_owned_by_user(sk) && np->recverr) {
452                 sk->sk_err = err;
453                 sk->sk_error_report(sk);
454         } else
455                 sk->sk_err_soft = err;
456
457 out:
458         bh_unlock_sock(sk);
459         sock_put(sk);
460 }
461
462
463 static int tcp_v6_send_synack(struct sock *sk, struct dst_entry *dst,
464                               struct flowi6 *fl6,
465                               struct request_sock *req,
466                               u16 queue_mapping)
467 {
468         struct inet6_request_sock *treq = inet6_rsk(req);
469         struct ipv6_pinfo *np = inet6_sk(sk);
470         struct sk_buff * skb;
471         int err = -ENOMEM;
472
473         /* First, grab a route. */
474         if (!dst && (dst = inet6_csk_route_req(sk, fl6, req)) == NULL)
475                 goto done;
476
477         skb = tcp_make_synack(sk, dst, req, NULL);
478
479         if (skb) {
480                 __tcp_v6_send_check(skb, &treq->loc_addr, &treq->rmt_addr);
481
482                 fl6->daddr = treq->rmt_addr;
483                 skb_set_queue_mapping(skb, queue_mapping);
484                 err = ip6_xmit(sk, skb, fl6, np->opt, np->tclass);
485                 err = net_xmit_eval(err);
486         }
487
488 done:
489         return err;
490 }
491
492 static int tcp_v6_rtx_synack(struct sock *sk, struct request_sock *req)
493 {
494         struct flowi6 fl6;
495         int res;
496
497         res = tcp_v6_send_synack(sk, NULL, &fl6, req, 0);
498         if (!res)
499                 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_RETRANSSEGS);
500         return res;
501 }
502
503 static void tcp_v6_reqsk_destructor(struct request_sock *req)
504 {
505         kfree_skb(inet6_rsk(req)->pktopts);
506 }
507
508 #ifdef CONFIG_TCP_MD5SIG
509 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
510                                                    const struct in6_addr *addr)
511 {
512         return tcp_md5_do_lookup(sk, (union tcp_md5_addr *)addr, AF_INET6);
513 }
514
515 static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
516                                                 struct sock *addr_sk)
517 {
518         return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
519 }
520
521 static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
522                                                       struct request_sock *req)
523 {
524         return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
525 }
526
527 static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
528                                   int optlen)
529 {
530         struct tcp_md5sig cmd;
531         struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
532
533         if (optlen < sizeof(cmd))
534                 return -EINVAL;
535
536         if (copy_from_user(&cmd, optval, sizeof(cmd)))
537                 return -EFAULT;
538
539         if (sin6->sin6_family != AF_INET6)
540                 return -EINVAL;
541
542         if (!cmd.tcpm_keylen) {
543                 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
544                         return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
545                                               AF_INET);
546                 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
547                                       AF_INET6);
548         }
549
550         if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
551                 return -EINVAL;
552
553         if (ipv6_addr_v4mapped(&sin6->sin6_addr))
554                 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
555                                       AF_INET, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
556
557         return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
558                               AF_INET6, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
559 }
560
561 static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
562                                         const struct in6_addr *daddr,
563                                         const struct in6_addr *saddr, int nbytes)
564 {
565         struct tcp6_pseudohdr *bp;
566         struct scatterlist sg;
567
568         bp = &hp->md5_blk.ip6;
569         /* 1. TCP pseudo-header (RFC2460) */
570         bp->saddr = *saddr;
571         bp->daddr = *daddr;
572         bp->protocol = cpu_to_be32(IPPROTO_TCP);
573         bp->len = cpu_to_be32(nbytes);
574
575         sg_init_one(&sg, bp, sizeof(*bp));
576         return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
577 }
578
579 static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
580                                const struct in6_addr *daddr, struct in6_addr *saddr,
581                                const struct tcphdr *th)
582 {
583         struct tcp_md5sig_pool *hp;
584         struct hash_desc *desc;
585
586         hp = tcp_get_md5sig_pool();
587         if (!hp)
588                 goto clear_hash_noput;
589         desc = &hp->md5_desc;
590
591         if (crypto_hash_init(desc))
592                 goto clear_hash;
593         if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
594                 goto clear_hash;
595         if (tcp_md5_hash_header(hp, th))
596                 goto clear_hash;
597         if (tcp_md5_hash_key(hp, key))
598                 goto clear_hash;
599         if (crypto_hash_final(desc, md5_hash))
600                 goto clear_hash;
601
602         tcp_put_md5sig_pool();
603         return 0;
604
605 clear_hash:
606         tcp_put_md5sig_pool();
607 clear_hash_noput:
608         memset(md5_hash, 0, 16);
609         return 1;
610 }
611
612 static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
613                                const struct sock *sk,
614                                const struct request_sock *req,
615                                const struct sk_buff *skb)
616 {
617         const struct in6_addr *saddr, *daddr;
618         struct tcp_md5sig_pool *hp;
619         struct hash_desc *desc;
620         const struct tcphdr *th = tcp_hdr(skb);
621
622         if (sk) {
623                 saddr = &inet6_sk(sk)->saddr;
624                 daddr = &inet6_sk(sk)->daddr;
625         } else if (req) {
626                 saddr = &inet6_rsk(req)->loc_addr;
627                 daddr = &inet6_rsk(req)->rmt_addr;
628         } else {
629                 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
630                 saddr = &ip6h->saddr;
631                 daddr = &ip6h->daddr;
632         }
633
634         hp = tcp_get_md5sig_pool();
635         if (!hp)
636                 goto clear_hash_noput;
637         desc = &hp->md5_desc;
638
639         if (crypto_hash_init(desc))
640                 goto clear_hash;
641
642         if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
643                 goto clear_hash;
644         if (tcp_md5_hash_header(hp, th))
645                 goto clear_hash;
646         if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
647                 goto clear_hash;
648         if (tcp_md5_hash_key(hp, key))
649                 goto clear_hash;
650         if (crypto_hash_final(desc, md5_hash))
651                 goto clear_hash;
652
653         tcp_put_md5sig_pool();
654         return 0;
655
656 clear_hash:
657         tcp_put_md5sig_pool();
658 clear_hash_noput:
659         memset(md5_hash, 0, 16);
660         return 1;
661 }
662
663 static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
664 {
665         const __u8 *hash_location = NULL;
666         struct tcp_md5sig_key *hash_expected;
667         const struct ipv6hdr *ip6h = ipv6_hdr(skb);
668         const struct tcphdr *th = tcp_hdr(skb);
669         int genhash;
670         u8 newhash[16];
671
672         hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
673         hash_location = tcp_parse_md5sig_option(th);
674
675         /* We've parsed the options - do we have a hash? */
676         if (!hash_expected && !hash_location)
677                 return 0;
678
679         if (hash_expected && !hash_location) {
680                 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
681                 return 1;
682         }
683
684         if (!hash_expected && hash_location) {
685                 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
686                 return 1;
687         }
688
689         /* check the signature */
690         genhash = tcp_v6_md5_hash_skb(newhash,
691                                       hash_expected,
692                                       NULL, NULL, skb);
693
694         if (genhash || memcmp(hash_location, newhash, 16) != 0) {
695                 net_info_ratelimited("MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
696                                      genhash ? "failed" : "mismatch",
697                                      &ip6h->saddr, ntohs(th->source),
698                                      &ip6h->daddr, ntohs(th->dest));
699                 return 1;
700         }
701         return 0;
702 }
703 #endif
704
/*
 * Request-sock operations for TCP over IPv6: object size plus the callbacks
 * for SYN-ACK retransmission, ACK and RST transmission, request destruction
 * and SYN-ACK timeout.
 */
705 struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
706         .family         =       AF_INET6,
707         .obj_size       =       sizeof(struct tcp6_request_sock),
708         .rtx_syn_ack    =       tcp_v6_rtx_synack,
709         .send_ack       =       tcp_v6_reqsk_send_ack,
710         .destructor     =       tcp_v6_reqsk_destructor,
711         .send_reset     =       tcp_v6_send_reset,
712         .syn_ack_timeout =      tcp_syn_ack_timeout,
713 };
714
715 #ifdef CONFIG_TCP_MD5SIG
/*
 * MD5 callbacks for IPv6 connection requests: key lookup by the request's
 * remote address and whole-segment hash calculation.
 */
716 static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
717         .md5_lookup     =       tcp_v6_reqsk_md5_lookup,
718         .calc_md5_hash  =       tcp_v6_md5_hash_skb,
719 };
720 #endif
721
/*
 * tcp_v6_send_response - build and send a data-less TCP reply to @skb.
 * @skb:    the segment being answered; ports and addresses are swapped
 * @seq:    sequence number for the reply
 * @ack:    acknowledgment number for the reply
 * @win:    window value for the reply
 * @tsval:  timestamp value; only used when @tsecr is non-zero
 * @tsecr:  timestamp echo; a non-zero value adds a timestamp option
 * @key:    MD5 key, or NULL; with CONFIG_TCP_MD5SIG a non-NULL key adds a
 *          signature option
 * @rst:    non-zero to send a RST instead of a plain ACK
 * @tclass: traffic class passed to ip6_xmit()
 *
 * The reply is sent through the per-namespace control socket
 * (net->ipv6.tcp_sk). Allocation or route lookup failures are silent.
 */
722 static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
723                                  u32 tsval, u32 tsecr,
724                                  struct tcp_md5sig_key *key, int rst, u8 tclass)
725 {
726         const struct tcphdr *th = tcp_hdr(skb);
727         struct tcphdr *t1;
728         struct sk_buff *buff;
729         struct flowi6 fl6;
730         struct net *net = dev_net(skb_dst(skb)->dev);
731         struct sock *ctl_sk = net->ipv6.tcp_sk;
732         unsigned int tot_len = sizeof(struct tcphdr);
733         struct dst_entry *dst;
734         __be32 *topt;
735
            /* tot_len = base TCP header plus whichever options will be emitted. */
736         if (tsecr)
737                 tot_len += TCPOLEN_TSTAMP_ALIGNED;
738 #ifdef CONFIG_TCP_MD5SIG
739         if (key)
740                 tot_len += TCPOLEN_MD5SIG_ALIGNED;
741 #endif
742
743         buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
744                          GFP_ATOMIC);
745         if (buff == NULL)
746                 return;
747
            /* Reserve the whole allocation, then push the TCP header and options back out of it. */
748         skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
749
750         t1 = (struct tcphdr *) skb_push(buff, tot_len);
751         skb_reset_transport_header(buff);
752
753         /* Swap the send and the receive. */
754         memset(t1, 0, sizeof(*t1));
755         t1->dest = th->source;
756         t1->source = th->dest;
757         t1->doff = tot_len / 4;
758         t1->seq = htonl(seq);
759         t1->ack_seq = htonl(ack);
            /* ACK flag: always set for non-RST replies; for a RST only when the incoming segment had no ACK. */
760         t1->ack = !rst || !th->ack;
761         t1->rst = rst;
762         t1->window = htons(win);
763
            /* Options start right after the fixed header. */
764         topt = (__be32 *)(t1 + 1);
765
766         if (tsecr) {
767                 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
768                                 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
769                 *topt++ = htonl(tsval);
770                 *topt++ = htonl(tsecr);
771         }
772
773 #ifdef CONFIG_TCP_MD5SIG
774         if (key) {
775                 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
776                                 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
                    /*
                     * The hash is written directly into the option. The
                     * incoming source address is passed as the destination
                     * and vice versa, matching the reply's direction.
                     */
777                 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
778                                     &ipv6_hdr(skb)->saddr,
779                                     &ipv6_hdr(skb)->daddr, t1);
780         }
781 #endif
782
            /* The reply flows back to the sender of @skb. */
783         memset(&fl6, 0, sizeof(fl6));
784         fl6.daddr = ipv6_hdr(skb)->saddr;
785         fl6.saddr = ipv6_hdr(skb)->daddr;
786
787         buff->ip_summed = CHECKSUM_PARTIAL;
788         buff->csum = 0;
789
790         __tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
791
792         fl6.flowi6_proto = IPPROTO_TCP;
            /* Link-local destinations need an explicit outgoing interface: use the one @skb arrived on. */
793         if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
794                 fl6.flowi6_oif = inet6_iif(skb);
795         fl6.fl6_dport = t1->dest;
796         fl6.fl6_sport = t1->source;
797         security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
798
799         /* Pass a socket to ip6_dst_lookup either it is for RST
800          * Underlying function will use this to retrieve the network
801          * namespace
802          */
803         dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL, false);
804         if (!IS_ERR(dst)) {
805                 skb_dst_set(buff, dst);
806                 ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
807                 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
808                 if (rst)
809                         TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
810                 return;
811         }
812
            /* No route: the reply is dropped. */
813         kfree_skb(buff);
814 }
815
/*
 * tcp_v6_send_reset - answer @skb with a RST.
 * @sk:  socket the segment was matched to, or NULL
 * @skb: the offending segment
 *
 * No RST is sent in reply to a RST or to a segment whose destination is not
 * unicast. With CONFIG_TCP_MD5SIG, a signed segment that matched no socket
 * is only answered if a listener with a matching key is found and the
 * signature verifies.
 */
816 static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
817 {
818         const struct tcphdr *th = tcp_hdr(skb);
819         u32 seq = 0, ack_seq = 0;
820         struct tcp_md5sig_key *key = NULL;
821 #ifdef CONFIG_TCP_MD5SIG
822         const __u8 *hash_location = NULL;
823         struct ipv6hdr *ipv6h = ipv6_hdr(skb);
824         unsigned char newhash[16];
825         int genhash;
826         struct sock *sk1 = NULL;
827 #endif
828
829         if (th->rst)
830                 return;
831
832         if (!ipv6_unicast_destination(skb))
833                 return;
834
835 #ifdef CONFIG_TCP_MD5SIG
836         hash_location = tcp_parse_md5sig_option(th);
837         if (!sk && hash_location) {
838                 /*
839                  * active side is lost. Try to find listening socket through
840                  * source port, and then find md5 key through listening socket.
841                  * we are not loose security here:
842                  * Incoming packet is checked with md5 hash with finding key,
843                  * no RST generated if md5 hash doesn't match.
844                  */
845                 sk1 = inet6_lookup_listener(dev_net(skb_dst(skb)->dev),
846                                            &tcp_hashinfo, &ipv6h->saddr,
847                                            th->source, &ipv6h->daddr,
848                                            ntohs(th->source), inet6_iif(skb));
849                 if (!sk1)
850                         return;
851
                    /* From here on sk1 is set, so release_sk1 undoes both the RCU lock and the socket reference. */
852                 rcu_read_lock();
853                 key = tcp_v6_md5_do_lookup(sk1, &ipv6h->saddr);
854                 if (!key)
855                         goto release_sk1;
856
857                 genhash = tcp_v6_md5_hash_skb(newhash, key, NULL, NULL, skb);
858                 if (genhash || memcmp(hash_location, newhash, 16) != 0)
859                         goto release_sk1;
860         } else {
861                 key = sk ? tcp_v6_md5_do_lookup(sk, &ipv6h->saddr) : NULL;
862         }
863 #endif
864
            /*
             * If the segment carried an ACK, the RST uses that acknowledgment
             * number as its sequence number. Otherwise it acknowledges
             * everything the segment occupied: its payload length plus one
             * each for SYN and FIN.
             */
865         if (th->ack)
866                 seq = ntohl(th->ack_seq);
867         else
868                 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
869                           (th->doff << 2);
870
            /* Window, timestamps and traffic class are all zero for a RST. */
871         tcp_v6_send_response(skb, seq, ack_seq, 0, 0, 0, key, 1, 0);
872
873 #ifdef CONFIG_TCP_MD5SIG
874 release_sk1:
875         if (sk1) {
876                 rcu_read_unlock();
877                 sock_put(sk1);
878         }
879 #endif
880 }
881
882 static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack,
883                             u32 win, u32 tsval, u32 tsecr,
884                             struct tcp_md5sig_key *key, u8 tclass)
885 {
886         tcp_v6_send_response(skb, seq, ack, win, tsval, tsecr, key, 0, tclass);
887 }
888
889 static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
890 {
891         struct inet_timewait_sock *tw = inet_twsk(sk);
892         struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
893
894         tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
895                         tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
896                         tcp_time_stamp + tcptw->tw_ts_offset,
897                         tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw),
898                         tw->tw_tclass);
899
900         inet_twsk_put(tw);
901 }
902
903 static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
904                                   struct request_sock *req)
905 {
906         tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1,
907                         req->rcv_wnd, tcp_time_stamp, req->ts_recent,
908                         tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr), 0);
909 }
910
911
912 static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
913 {
914         struct request_sock *req, **prev;
915         const struct tcphdr *th = tcp_hdr(skb);
916         struct sock *nsk;
917
918         /* Find possible connection requests. */
919         req = inet6_csk_search_req(sk, &prev, th->source,
920                                    &ipv6_hdr(skb)->saddr,
921                                    &ipv6_hdr(skb)->daddr, inet6_iif(skb));
922         if (req)
923                 return tcp_check_req(sk, skb, req, prev, false);
924
925         nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
926                         &ipv6_hdr(skb)->saddr, th->source,
927                         &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
928
929         if (nsk) {
930                 if (nsk->sk_state != TCP_TIME_WAIT) {
931                         bh_lock_sock(nsk);
932                         return nsk;
933                 }
934                 inet_twsk_put(inet_twsk(nsk));
935                 return NULL;
936         }
937
938 #ifdef CONFIG_SYN_COOKIES
939         if (!th->syn)
940                 sk = cookie_v6_check(sk, skb);
941 #endif
942         return sk;
943 }
944
945 /* FIXME: this is substantially similar to the ipv4 code.
946  * Can some kind of merge be done? -- erics
947  */
948 static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
949 {
950         struct tcp_options_received tmp_opt;
951         struct request_sock *req;
952         struct inet6_request_sock *treq;
953         struct ipv6_pinfo *np = inet6_sk(sk);
954         struct tcp_sock *tp = tcp_sk(sk);
955         __u32 isn = TCP_SKB_CB(skb)->when;
956         struct dst_entry *dst = NULL;
957         struct flowi6 fl6;
958         bool want_cookie = false;
959
960         if (skb->protocol == htons(ETH_P_IP))
961                 return tcp_v4_conn_request(sk, skb);
962
963         if (!ipv6_unicast_destination(skb))
964                 goto drop;
965
966         if ((sysctl_tcp_syncookies == 2 ||
967              inet_csk_reqsk_queue_is_full(sk)) && !isn) {
968                 want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
969                 if (!want_cookie)
970                         goto drop;
971         }
972
973         if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1) {
974                 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
975                 goto drop;
976         }
977
978         req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
979         if (req == NULL)
980                 goto drop;
981
982 #ifdef CONFIG_TCP_MD5SIG
983         tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
984 #endif
985
986         tcp_clear_options(&tmp_opt);
987         tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
988         tmp_opt.user_mss = tp->rx_opt.user_mss;
989         tcp_parse_options(skb, &tmp_opt, 0, NULL);
990
991         if (want_cookie && !tmp_opt.saw_tstamp)
992                 tcp_clear_options(&tmp_opt);
993
994         tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
995         tcp_openreq_init(req, &tmp_opt, skb);
996
997         treq = inet6_rsk(req);
998         treq->rmt_addr = ipv6_hdr(skb)->saddr;
999         treq->loc_addr = ipv6_hdr(skb)->daddr;
1000         if (!want_cookie || tmp_opt.tstamp_ok)
1001                 TCP_ECN_create_request(req, skb, sock_net(sk));
1002
1003         treq->iif = sk->sk_bound_dev_if;
1004
1005         /* So that link locals have meaning */
1006         if (!sk->sk_bound_dev_if &&
1007             ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1008                 treq->iif = inet6_iif(skb);
1009
1010         if (!isn) {
1011                 if (ipv6_opt_accepted(sk, skb) ||
1012                     np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1013                     np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1014                         atomic_inc(&skb->users);
1015                         treq->pktopts = skb;
1016                 }
1017
1018                 if (want_cookie) {
1019                         isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1020                         req->cookie_ts = tmp_opt.tstamp_ok;
1021                         goto have_isn;
1022                 }
1023
1024                 /* VJ's idea. We save last timestamp seen
1025                  * from the destination in peer table, when entering
1026                  * state TIME-WAIT, and check against it before
1027                  * accepting new connection request.
1028                  *
1029                  * If "isn" is not zero, this request hit alive
1030                  * timewait bucket, so that all the necessary checks
1031                  * are made in the function processing timewait state.
1032                  */
1033                 if (tmp_opt.saw_tstamp &&
1034                     tcp_death_row.sysctl_tw_recycle &&
1035                     (dst = inet6_csk_route_req(sk, &fl6, req)) != NULL) {
1036                         if (!tcp_peer_is_proven(req, dst, true)) {
1037                                 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1038                                 goto drop_and_release;
1039                         }
1040                 }
1041                 /* Kill the following clause, if you dislike this way. */
1042                 else if (!sysctl_tcp_syncookies &&
1043                          (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1044                           (sysctl_max_syn_backlog >> 2)) &&
1045                          !tcp_peer_is_proven(req, dst, false)) {
1046                         /* Without syncookies last quarter of
1047                          * backlog is filled with destinations,
1048                          * proven to be alive.
1049                          * It means that we continue to communicate
1050                          * to destinations, already remembered
1051                          * to the moment of synflood.
1052                          */
1053                         LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
1054                                        &treq->rmt_addr, ntohs(tcp_hdr(skb)->source));
1055                         goto drop_and_release;
1056                 }
1057
1058                 isn = tcp_v6_init_sequence(skb);
1059         }
1060 have_isn:
1061         tcp_rsk(req)->snt_isn = isn;
1062
1063         if (security_inet_conn_request(sk, skb, req))
1064                 goto drop_and_release;
1065
1066         if (tcp_v6_send_synack(sk, dst, &fl6, req,
1067                                skb_get_queue_mapping(skb)) ||
1068             want_cookie)
1069                 goto drop_and_free;
1070
1071         tcp_rsk(req)->snt_synack = tcp_time_stamp;
1072         tcp_rsk(req)->listener = NULL;
1073         inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1074         return 0;
1075
1076 drop_and_release:
1077         dst_release(dst);
1078 drop_and_free:
1079         reqsk_free(req);
1080 drop:
1081         NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1082         return 0; /* don't send reset */
1083 }
1084
1085 static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
1086                                           struct request_sock *req,
1087                                           struct dst_entry *dst)
1088 {
1089         struct inet6_request_sock *treq;
1090         struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1091         struct tcp6_sock *newtcp6sk;
1092         struct inet_sock *newinet;
1093         struct tcp_sock *newtp;
1094         struct sock *newsk;
1095 #ifdef CONFIG_TCP_MD5SIG
1096         struct tcp_md5sig_key *key;
1097 #endif
1098         struct flowi6 fl6;
1099
1100         if (skb->protocol == htons(ETH_P_IP)) {
1101                 /*
1102                  *      v6 mapped
1103                  */
1104
1105                 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1106
1107                 if (newsk == NULL)
1108                         return NULL;
1109
1110                 newtcp6sk = (struct tcp6_sock *)newsk;
1111                 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1112
1113                 newinet = inet_sk(newsk);
1114                 newnp = inet6_sk(newsk);
1115                 newtp = tcp_sk(newsk);
1116
1117                 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1118
1119                 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newnp->daddr);
1120
1121                 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
1122
1123                 newnp->rcv_saddr = newnp->saddr;
1124
1125                 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1126                 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
1127 #ifdef CONFIG_TCP_MD5SIG
1128                 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1129 #endif
1130
1131                 newnp->ipv6_ac_list = NULL;
1132                 newnp->ipv6_fl_list = NULL;
1133                 newnp->pktoptions  = NULL;
1134                 newnp->opt         = NULL;
1135                 newnp->mcast_oif   = inet6_iif(skb);
1136                 newnp->mcast_hops  = ipv6_hdr(skb)->hop_limit;
1137                 newnp->rcv_tclass  = ipv6_get_dsfield(ipv6_hdr(skb));
1138
1139                 /*
1140                  * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1141                  * here, tcp_create_openreq_child now does this for us, see the comment in
1142                  * that function for the gory details. -acme
1143                  */
1144
1145                 /* It is tricky place. Until this moment IPv4 tcp
1146                    worked with IPv6 icsk.icsk_af_ops.
1147                    Sync it now.
1148                  */
1149                 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1150
1151                 return newsk;
1152         }
1153
1154         treq = inet6_rsk(req);
1155
1156         if (sk_acceptq_is_full(sk))
1157                 goto out_overflow;
1158
1159         if (!dst) {
1160                 dst = inet6_csk_route_req(sk, &fl6, req);
1161                 if (!dst)
1162                         goto out;
1163         }
1164
1165         newsk = tcp_create_openreq_child(sk, req, skb);
1166         if (newsk == NULL)
1167                 goto out_nonewsk;
1168
1169         /*
1170          * No need to charge this sock to the relevant IPv6 refcnt debug socks
1171          * count here, tcp_create_openreq_child now does this for us, see the
1172          * comment in that function for the gory details. -acme
1173          */
1174
1175         newsk->sk_gso_type = SKB_GSO_TCPV6;
1176         __ip6_dst_store(newsk, dst, NULL, NULL);
1177         inet6_sk_rx_dst_set(newsk, skb);
1178
1179         newtcp6sk = (struct tcp6_sock *)newsk;
1180         inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1181
1182         newtp = tcp_sk(newsk);
1183         newinet = inet_sk(newsk);
1184         newnp = inet6_sk(newsk);
1185
1186         memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1187
1188         newnp->daddr = treq->rmt_addr;
1189         newnp->saddr = treq->loc_addr;
1190         newnp->rcv_saddr = treq->loc_addr;
1191         newsk->sk_bound_dev_if = treq->iif;
1192
1193         /* Now IPv6 options...
1194
1195            First: no IPv4 options.
1196          */
1197         newinet->inet_opt = NULL;
1198         newnp->ipv6_ac_list = NULL;
1199         newnp->ipv6_fl_list = NULL;
1200
1201         /* Clone RX bits */
1202         newnp->rxopt.all = np->rxopt.all;
1203
1204         /* Clone pktoptions received with SYN */
1205         newnp->pktoptions = NULL;
1206         if (treq->pktopts != NULL) {
1207                 newnp->pktoptions = skb_clone(treq->pktopts,
1208                                               sk_gfp_atomic(sk, GFP_ATOMIC));
1209                 consume_skb(treq->pktopts);
1210                 treq->pktopts = NULL;
1211                 if (newnp->pktoptions)
1212                         skb_set_owner_r(newnp->pktoptions, newsk);
1213         }
1214         newnp->opt        = NULL;
1215         newnp->mcast_oif  = inet6_iif(skb);
1216         newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1217         newnp->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(skb));
1218
1219         /* Clone native IPv6 options from listening socket (if any)
1220
1221            Yes, keeping reference count would be much more clever,
1222            but we make one more one thing there: reattach optmem
1223            to newsk.
1224          */
1225         if (np->opt)
1226                 newnp->opt = ipv6_dup_options(newsk, np->opt);
1227
1228         inet_csk(newsk)->icsk_ext_hdr_len = 0;
1229         if (newnp->opt)
1230                 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1231                                                      newnp->opt->opt_flen);
1232
1233         tcp_mtup_init(newsk);
1234         tcp_sync_mss(newsk, dst_mtu(dst));
1235         newtp->advmss = dst_metric_advmss(dst);
1236         if (tcp_sk(sk)->rx_opt.user_mss &&
1237             tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1238                 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1239
1240         tcp_initialize_rcv_mss(newsk);
1241
1242         newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1243         newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
1244
1245 #ifdef CONFIG_TCP_MD5SIG
1246         /* Copy over the MD5 key from the original socket */
1247         if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1248                 /* We're using one, so create a matching key
1249                  * on the newsk structure. If we fail to get
1250                  * memory, then we end up not copying the key
1251                  * across. Shucks.
1252                  */
1253                 tcp_md5_do_add(newsk, (union tcp_md5_addr *)&newnp->daddr,
1254                                AF_INET6, key->key, key->keylen,
1255                                sk_gfp_atomic(sk, GFP_ATOMIC));
1256         }
1257 #endif
1258
1259         if (__inet_inherit_port(sk, newsk) < 0) {
1260                 inet_csk_prepare_forced_close(newsk);
1261                 tcp_done(newsk);
1262                 goto out;
1263         }
1264         __inet6_hash(newsk, NULL);
1265
1266         return newsk;
1267
1268 out_overflow:
1269         NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
1270 out_nonewsk:
1271         dst_release(dst);
1272 out:
1273         NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1274         return NULL;
1275 }
1276
1277 static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1278 {
1279         if (skb->ip_summed == CHECKSUM_COMPLETE) {
1280                 if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
1281                                   &ipv6_hdr(skb)->daddr, skb->csum)) {
1282                         skb->ip_summed = CHECKSUM_UNNECESSARY;
1283                         return 0;
1284                 }
1285         }
1286
1287         skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
1288                                               &ipv6_hdr(skb)->saddr,
1289                                               &ipv6_hdr(skb)->daddr, 0));
1290
1291         if (skb->len <= 76) {
1292                 return __skb_checksum_complete(skb);
1293         }
1294         return 0;
1295 }
1296
1297 /* The socket must have it's spinlock held when we get
1298  * here.
1299  *
1300  * We have a potential double-lock case here, so even when
1301  * doing backlog processing we use the BH locking scheme.
1302  * This is because we cannot sleep with the original spinlock
1303  * held.
1304  */
1305 static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1306 {
1307         struct ipv6_pinfo *np = inet6_sk(sk);
1308         struct tcp_sock *tp;
1309         struct sk_buff *opt_skb = NULL;
1310
1311         /* Imagine: socket is IPv6. IPv4 packet arrives,
1312            goes to IPv4 receive handler and backlogged.
1313            From backlog it always goes here. Kerboom...
1314            Fortunately, tcp_rcv_established and rcv_established
1315            handle them correctly, but it is not case with
1316            tcp_v6_hnd_req and tcp_v6_send_reset().   --ANK
1317          */
1318
1319         if (skb->protocol == htons(ETH_P_IP))
1320                 return tcp_v4_do_rcv(sk, skb);
1321
1322 #ifdef CONFIG_TCP_MD5SIG
1323         if (tcp_v6_inbound_md5_hash (sk, skb))
1324                 goto discard;
1325 #endif
1326
1327         if (sk_filter(sk, skb))
1328                 goto discard;
1329
1330         /*
1331          *      socket locking is here for SMP purposes as backlog rcv
1332          *      is currently called with bh processing disabled.
1333          */
1334
1335         /* Do Stevens' IPV6_PKTOPTIONS.
1336
1337            Yes, guys, it is the only place in our code, where we
1338            may make it not affecting IPv4.
1339            The rest of code is protocol independent,
1340            and I do not like idea to uglify IPv4.
1341
1342            Actually, all the idea behind IPV6_PKTOPTIONS
1343            looks not very well thought. For now we latch
1344            options, received in the last packet, enqueued
1345            by tcp. Feel free to propose better solution.
1346                                                --ANK (980728)
1347          */
1348         if (np->rxopt.all)
1349                 opt_skb = skb_clone(skb, sk_gfp_atomic(sk, GFP_ATOMIC));
1350
1351         if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
1352                 struct dst_entry *dst = sk->sk_rx_dst;
1353
1354                 sock_rps_save_rxhash(sk, skb);
1355                 if (dst) {
1356                         if (inet_sk(sk)->rx_dst_ifindex != skb->skb_iif ||
1357                             dst->ops->check(dst, np->rx_dst_cookie) == NULL) {
1358                                 dst_release(dst);
1359                                 sk->sk_rx_dst = NULL;
1360                         }
1361                 }
1362
1363                 tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len);
1364                 if (opt_skb)
1365                         goto ipv6_pktoptions;
1366                 return 0;
1367         }
1368
1369         if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1370                 goto csum_err;
1371
1372         if (sk->sk_state == TCP_LISTEN) {
1373                 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1374                 if (!nsk)
1375                         goto discard;
1376
1377                 /*
1378                  * Queue it on the new socket if the new socket is active,
1379                  * otherwise we just shortcircuit this and continue with
1380                  * the new socket..
1381                  */
1382                 if(nsk != sk) {
1383                         sock_rps_save_rxhash(nsk, skb);
1384                         if (tcp_child_process(sk, nsk, skb))
1385                                 goto reset;
1386                         if (opt_skb)
1387                                 __kfree_skb(opt_skb);
1388                         return 0;
1389                 }
1390         } else
1391                 sock_rps_save_rxhash(sk, skb);
1392
1393         if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1394                 goto reset;
1395         if (opt_skb)
1396                 goto ipv6_pktoptions;
1397         return 0;
1398
1399 reset:
1400         tcp_v6_send_reset(sk, skb);
1401 discard:
1402         if (opt_skb)
1403                 __kfree_skb(opt_skb);
1404         kfree_skb(skb);
1405         return 0;
1406 csum_err:
1407         TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_CSUMERRORS);
1408         TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1409         goto discard;
1410
1411
1412 ipv6_pktoptions:
1413         /* Do you ask, what is it?
1414
1415            1. skb was enqueued by tcp.
1416            2. skb is added to tail of read queue, rather than out of order.
1417            3. socket is not in passive state.
1418            4. Finally, it really contains options, which user wants to receive.
1419          */
1420         tp = tcp_sk(sk);
1421         if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1422             !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
1423                 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
1424                         np->mcast_oif = inet6_iif(opt_skb);
1425                 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
1426                         np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
1427                 if (np->rxopt.bits.rxtclass)
1428                         np->rcv_tclass = ipv6_get_dsfield(ipv6_hdr(opt_skb));
1429                 if (ipv6_opt_accepted(sk, opt_skb)) {
1430                         skb_set_owner_r(opt_skb, sk);
1431                         opt_skb = xchg(&np->pktoptions, opt_skb);
1432                 } else {
1433                         __kfree_skb(opt_skb);
1434                         opt_skb = xchg(&np->pktoptions, NULL);
1435                 }
1436         }
1437
1438         kfree_skb(opt_skb);
1439         return 0;
1440 }
1441
1442 static int tcp_v6_rcv(struct sk_buff *skb)
1443 {
1444         const struct tcphdr *th;
1445         const struct ipv6hdr *hdr;
1446         struct sock *sk;
1447         int ret;
1448         struct net *net = dev_net(skb->dev);
1449
1450         if (skb->pkt_type != PACKET_HOST)
1451                 goto discard_it;
1452
1453         /*
1454          *      Count it even if it's bad.
1455          */
1456         TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
1457
1458         if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1459                 goto discard_it;
1460
1461         th = tcp_hdr(skb);
1462
1463         if (th->doff < sizeof(struct tcphdr)/4)
1464                 goto bad_packet;
1465         if (!pskb_may_pull(skb, th->doff*4))
1466                 goto discard_it;
1467
1468         if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
1469                 goto csum_error;
1470
1471         th = tcp_hdr(skb);
1472         hdr = ipv6_hdr(skb);
1473         TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1474         TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1475                                     skb->len - th->doff*4);
1476         TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1477         TCP_SKB_CB(skb)->when = 0;
1478         TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
1479         TCP_SKB_CB(skb)->sacked = 0;
1480
1481         sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
1482         if (!sk)
1483                 goto no_tcp_socket;
1484
1485 process:
1486         if (sk->sk_state == TCP_TIME_WAIT)
1487                 goto do_time_wait;
1488
1489         if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1490                 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1491                 goto discard_and_relse;
1492         }
1493
1494         if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1495                 goto discard_and_relse;
1496
1497         if (sk_filter(sk, skb))
1498                 goto discard_and_relse;
1499
1500         sk_mark_napi_id(sk, skb);
1501         skb->dev = NULL;
1502
1503         bh_lock_sock_nested(sk);
1504         ret = 0;
1505         if (!sock_owned_by_user(sk)) {
1506 #ifdef CONFIG_NET_DMA
1507                 struct tcp_sock *tp = tcp_sk(sk);
1508                 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
1509                         tp->ucopy.dma_chan = net_dma_find_channel();
1510                 if (tp->ucopy.dma_chan)
1511                         ret = tcp_v6_do_rcv(sk, skb);
1512                 else
1513 #endif
1514                 {
1515                         if (!tcp_prequeue(sk, skb))
1516                                 ret = tcp_v6_do_rcv(sk, skb);
1517                 }
1518         } else if (unlikely(sk_add_backlog(sk, skb,
1519                                            sk->sk_rcvbuf + sk->sk_sndbuf))) {
1520                 bh_unlock_sock(sk);
1521                 NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
1522                 goto discard_and_relse;
1523         }
1524         bh_unlock_sock(sk);
1525
1526         sock_put(sk);
1527         return ret ? -1 : 0;
1528
1529 no_tcp_socket:
1530         if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1531                 goto discard_it;
1532
1533         if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1534 csum_error:
1535                 TCP_INC_STATS_BH(net, TCP_MIB_CSUMERRORS);
1536 bad_packet:
1537                 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1538         } else {
1539                 tcp_v6_send_reset(NULL, skb);
1540         }
1541
1542 discard_it:
1543         kfree_skb(skb);
1544         return 0;
1545
1546 discard_and_relse:
1547         sock_put(sk);
1548         goto discard_it;
1549
1550 do_time_wait:
1551         if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
1552                 inet_twsk_put(inet_twsk(sk));
1553                 goto discard_it;
1554         }
1555
1556         if (skb->len < (th->doff<<2)) {
1557                 inet_twsk_put(inet_twsk(sk));
1558                 goto bad_packet;
1559         }
1560         if (tcp_checksum_complete(skb)) {
1561                 inet_twsk_put(inet_twsk(sk));
1562                 goto csum_error;
1563         }
1564
1565         switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1566         case TCP_TW_SYN:
1567         {
1568                 struct sock *sk2;
1569
1570                 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
1571                                             &ipv6_hdr(skb)->saddr, th->source,
1572                                             &ipv6_hdr(skb)->daddr,
1573                                             ntohs(th->dest), inet6_iif(skb));
1574                 if (sk2 != NULL) {
1575                         struct inet_timewait_sock *tw = inet_twsk(sk);
1576                         inet_twsk_deschedule(tw, &tcp_death_row);
1577                         inet_twsk_put(tw);
1578                         sk = sk2;
1579                         goto process;
1580                 }
1581                 /* Fall through to ACK */
1582         }
1583         case TCP_TW_ACK:
1584                 tcp_v6_timewait_ack(sk, skb);
1585                 break;
1586         case TCP_TW_RST:
1587                 goto no_tcp_socket;
1588         case TCP_TW_SUCCESS:;
1589         }
1590         goto discard_it;
1591 }
1592
1593 static void tcp_v6_early_demux(struct sk_buff *skb)
1594 {
1595         const struct ipv6hdr *hdr;
1596         const struct tcphdr *th;
1597         struct sock *sk;
1598
1599         if (skb->pkt_type != PACKET_HOST)
1600                 return;
1601
1602         if (!pskb_may_pull(skb, skb_transport_offset(skb) + sizeof(struct tcphdr)))
1603                 return;
1604
1605         hdr = ipv6_hdr(skb);
1606         th = tcp_hdr(skb);
1607
1608         if (th->doff < sizeof(struct tcphdr) / 4)
1609                 return;
1610
1611         sk = __inet6_lookup_established(dev_net(skb->dev), &tcp_hashinfo,
1612                                         &hdr->saddr, th->source,
1613                                         &hdr->daddr, ntohs(th->dest),
1614                                         inet6_iif(skb));
1615         if (sk) {
1616                 skb->sk = sk;
1617                 skb->destructor = sock_edemux;
1618                 if (sk->sk_state != TCP_TIME_WAIT) {
1619                         struct dst_entry *dst = sk->sk_rx_dst;
1620
1621                         if (dst)
1622                                 dst = dst_check(dst, inet6_sk(sk)->rx_dst_cookie);
1623                         if (dst &&
1624                             inet_sk(sk)->rx_dst_ifindex == skb->skb_iif)
1625                                 skb_dst_set_noref(skb, dst);
1626                 }
1627         }
1628 }
1629
1630 static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1631         .twsk_obj_size  = sizeof(struct tcp6_timewait_sock),
1632         .twsk_unique    = tcp_twsk_unique,
1633         .twsk_destructor= tcp_twsk_destructor,
1634 };
1635
1636 static const struct inet_connection_sock_af_ops ipv6_specific = {
1637         .queue_xmit        = inet6_csk_xmit,
1638         .send_check        = tcp_v6_send_check,
1639         .rebuild_header    = inet6_sk_rebuild_header,
1640         .sk_rx_dst_set     = inet6_sk_rx_dst_set,
1641         .conn_request      = tcp_v6_conn_request,
1642         .syn_recv_sock     = tcp_v6_syn_recv_sock,
1643         .net_header_len    = sizeof(struct ipv6hdr),
1644         .net_frag_header_len = sizeof(struct frag_hdr),
1645         .setsockopt        = ipv6_setsockopt,
1646         .getsockopt        = ipv6_getsockopt,
1647         .addr2sockaddr     = inet6_csk_addr2sockaddr,
1648         .sockaddr_len      = sizeof(struct sockaddr_in6),
1649         .bind_conflict     = inet6_csk_bind_conflict,
1650 #ifdef CONFIG_COMPAT
1651         .compat_setsockopt = compat_ipv6_setsockopt,
1652         .compat_getsockopt = compat_ipv6_getsockopt,
1653 #endif
1654 };
1655
#ifdef CONFIG_TCP_MD5SIG
/* TCP-MD5 hooks installed on native IPv6 sockets by tcp_v6_init_sock(). */
static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
	.md5_parse	= tcp_v6_parse_md5_keys,
	.md5_lookup	= tcp_v6_md5_lookup,
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
};
#endif
1663
1664 /*
1665  *      TCP over IPv4 via INET6 API
1666  */
1667
1668 static const struct inet_connection_sock_af_ops ipv6_mapped = {
1669         .queue_xmit        = ip_queue_xmit,
1670         .send_check        = tcp_v4_send_check,
1671         .rebuild_header    = inet_sk_rebuild_header,
1672         .sk_rx_dst_set     = inet_sk_rx_dst_set,
1673         .conn_request      = tcp_v6_conn_request,
1674         .syn_recv_sock     = tcp_v6_syn_recv_sock,
1675         .net_header_len    = sizeof(struct iphdr),
1676         .setsockopt        = ipv6_setsockopt,
1677         .getsockopt        = ipv6_getsockopt,
1678         .addr2sockaddr     = inet6_csk_addr2sockaddr,
1679         .sockaddr_len      = sizeof(struct sockaddr_in6),
1680         .bind_conflict     = inet6_csk_bind_conflict,
1681 #ifdef CONFIG_COMPAT
1682         .compat_setsockopt = compat_ipv6_setsockopt,
1683         .compat_getsockopt = compat_ipv6_getsockopt,
1684 #endif
1685 };
1686
#ifdef CONFIG_TCP_MD5SIG
/* MD5 signature hooks for the IPv4-over-INET6 case: lookup and hashing use
 * the IPv4 helpers, key parsing uses the IPv6 one.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
        .md5_parse     = tcp_v6_parse_md5_keys,
        .md5_lookup    = tcp_v4_md5_lookup,
        .calc_md5_hash = tcp_v4_md5_hash_skb,
};
#endif
1694
1695 /* NOTE: A lot of things set to zero explicitly by call to
1696  *       sk_alloc() so need not be done here.
1697  */
1698 static int tcp_v6_init_sock(struct sock *sk)
1699 {
1700         struct inet_connection_sock *icsk = inet_csk(sk);
1701
1702         tcp_init_sock(sk);
1703
1704         icsk->icsk_af_ops = &ipv6_specific;
1705
1706 #ifdef CONFIG_TCP_MD5SIG
1707         tcp_sk(sk)->af_specific = &tcp_sock_ipv6_specific;
1708 #endif
1709
1710         return 0;
1711 }
1712
/* Destroy hook for TCPv6 sockets: calls tcp_v4_destroy_sock() and then
 * inet6_destroy_sock() on @sk, in that order.
 */
static void tcp_v6_destroy_sock(struct sock *sk)
{
        tcp_v4_destroy_sock(sk);

        inet6_destroy_sock(sk);
}
1718
1719 #ifdef CONFIG_PROC_FS
1720 /* Proc filesystem TCPv6 sock list dumping. */
1721 static void get_openreq6(struct seq_file *seq,
1722                          const struct sock *sk, struct request_sock *req, int i, kuid_t uid)
1723 {
1724         int ttd = req->expires - jiffies;
1725         const struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1726         const struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
1727
1728         if (ttd < 0)
1729                 ttd = 0;
1730
1731         seq_printf(seq,
1732                    "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1733                    "%02X %08X:%08X %02X:%08lX %08X %5u %8d %d %d %pK\n",
1734                    i,
1735                    src->s6_addr32[0], src->s6_addr32[1],
1736                    src->s6_addr32[2], src->s6_addr32[3],
1737                    ntohs(inet_rsk(req)->loc_port),
1738                    dest->s6_addr32[0], dest->s6_addr32[1],
1739                    dest->s6_addr32[2], dest->s6_addr32[3],
1740                    ntohs(inet_rsk(req)->rmt_port),
1741                    TCP_SYN_RECV,
1742                    0,0, /* could print option size, but that is af dependent. */
1743                    1,   /* timers active (only the expire timer) */
1744                    jiffies_to_clock_t(ttd),
1745                    req->num_timeout,
1746                    from_kuid_munged(seq_user_ns(seq), uid),
1747                    0,  /* non standard timer */
1748                    0, /* open_requests have no inode */
1749                    0, req);
1750 }
1751
1752 static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1753 {
1754         const struct in6_addr *dest, *src;
1755         __u16 destp, srcp;
1756         int timer_active;
1757         unsigned long timer_expires;
1758         const struct inet_sock *inet = inet_sk(sp);
1759         const struct tcp_sock *tp = tcp_sk(sp);
1760         const struct inet_connection_sock *icsk = inet_csk(sp);
1761         const struct ipv6_pinfo *np = inet6_sk(sp);
1762
1763         dest  = &np->daddr;
1764         src   = &np->rcv_saddr;
1765         destp = ntohs(inet->inet_dport);
1766         srcp  = ntohs(inet->inet_sport);
1767
1768         if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1769                 timer_active    = 1;
1770                 timer_expires   = icsk->icsk_timeout;
1771         } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1772                 timer_active    = 4;
1773                 timer_expires   = icsk->icsk_timeout;
1774         } else if (timer_pending(&sp->sk_timer)) {
1775                 timer_active    = 2;
1776                 timer_expires   = sp->sk_timer.expires;
1777         } else {
1778                 timer_active    = 0;
1779                 timer_expires = jiffies;
1780         }
1781
1782         seq_printf(seq,
1783                    "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1784                    "%02X %08X:%08X %02X:%08lX %08X %5u %8d %lu %d %pK %lu %lu %u %u %d\n",
1785                    i,
1786                    src->s6_addr32[0], src->s6_addr32[1],
1787                    src->s6_addr32[2], src->s6_addr32[3], srcp,
1788                    dest->s6_addr32[0], dest->s6_addr32[1],
1789                    dest->s6_addr32[2], dest->s6_addr32[3], destp,
1790                    sp->sk_state,
1791                    tp->write_seq-tp->snd_una,
1792                    (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1793                    timer_active,
1794                    jiffies_delta_to_clock_t(timer_expires - jiffies),
1795                    icsk->icsk_retransmits,
1796                    from_kuid_munged(seq_user_ns(seq), sock_i_uid(sp)),
1797                    icsk->icsk_probes_out,
1798                    sock_i_ino(sp),
1799                    atomic_read(&sp->sk_refcnt), sp,
1800                    jiffies_to_clock_t(icsk->icsk_rto),
1801                    jiffies_to_clock_t(icsk->icsk_ack.ato),
1802                    (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
1803                    tp->snd_cwnd,
1804                    tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh
1805                    );
1806 }
1807
1808 static void get_timewait6_sock(struct seq_file *seq,
1809                                struct inet_timewait_sock *tw, int i)
1810 {
1811         const struct in6_addr *dest, *src;
1812         __u16 destp, srcp;
1813         const struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
1814         s32 delta = tw->tw_ttd - inet_tw_time_stamp();
1815
1816         dest = &tw6->tw_v6_daddr;
1817         src  = &tw6->tw_v6_rcv_saddr;
1818         destp = ntohs(tw->tw_dport);
1819         srcp  = ntohs(tw->tw_sport);
1820
1821         seq_printf(seq,
1822                    "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1823                    "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
1824                    i,
1825                    src->s6_addr32[0], src->s6_addr32[1],
1826                    src->s6_addr32[2], src->s6_addr32[3], srcp,
1827                    dest->s6_addr32[0], dest->s6_addr32[1],
1828                    dest->s6_addr32[2], dest->s6_addr32[3], destp,
1829                    tw->tw_substate, 0, 0,
1830                    3, jiffies_delta_to_clock_t(delta), 0, 0, 0, 0,
1831                    atomic_read(&tw->tw_refcnt), tw);
1832 }
1833
1834 static int tcp6_seq_show(struct seq_file *seq, void *v)
1835 {
1836         struct tcp_iter_state *st;
1837
1838         if (v == SEQ_START_TOKEN) {
1839                 seq_puts(seq,
1840                          "  sl  "
1841                          "local_address                         "
1842                          "remote_address                        "
1843                          "st tx_queue rx_queue tr tm->when retrnsmt"
1844                          "   uid  timeout inode\n");
1845                 goto out;
1846         }
1847         st = seq->private;
1848
1849         switch (st->state) {
1850         case TCP_SEQ_STATE_LISTENING:
1851         case TCP_SEQ_STATE_ESTABLISHED:
1852                 get_tcp6_sock(seq, v, st->num);
1853                 break;
1854         case TCP_SEQ_STATE_OPENREQ:
1855                 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
1856                 break;
1857         case TCP_SEQ_STATE_TIME_WAIT:
1858                 get_timewait6_sock(seq, v, st->num);
1859                 break;
1860         }
1861 out:
1862         return 0;
1863 }
1864
1865 static const struct file_operations tcp6_afinfo_seq_fops = {
1866         .owner   = THIS_MODULE,
1867         .open    = tcp_seq_open,
1868         .read    = seq_read,
1869         .llseek  = seq_lseek,
1870         .release = seq_release_net
1871 };
1872
1873 static struct tcp_seq_afinfo tcp6_seq_afinfo = {
1874         .name           = "tcp6",
1875         .family         = AF_INET6,
1876         .seq_fops       = &tcp6_afinfo_seq_fops,
1877         .seq_ops        = {
1878                 .show           = tcp6_seq_show,
1879         },
1880 };
1881
1882 int __net_init tcp6_proc_init(struct net *net)
1883 {
1884         return tcp_proc_register(net, &tcp6_seq_afinfo);
1885 }
1886
1887 void tcp6_proc_exit(struct net *net)
1888 {
1889         tcp_proc_unregister(net, &tcp6_seq_afinfo);
1890 }
1891 #endif
1892
1893 static void tcp_v6_clear_sk(struct sock *sk, int size)
1894 {
1895         struct inet_sock *inet = inet_sk(sk);
1896
1897         /* we do not want to clear pinet6 field, because of RCU lookups */
1898         sk_prot_clear_nulls(sk, offsetof(struct inet_sock, pinet6));
1899
1900         size -= offsetof(struct inet_sock, pinet6) + sizeof(inet->pinet6);
1901         memset(&inet->pinet6 + 1, 0, size);
1902 }
1903
1904 struct proto tcpv6_prot = {
1905         .name                   = "TCPv6",
1906         .owner                  = THIS_MODULE,
1907         .close                  = tcp_close,
1908         .connect                = tcp_v6_connect,
1909         .disconnect             = tcp_disconnect,
1910         .accept                 = inet_csk_accept,
1911         .ioctl                  = tcp_ioctl,
1912         .init                   = tcp_v6_init_sock,
1913         .destroy                = tcp_v6_destroy_sock,
1914         .shutdown               = tcp_shutdown,
1915         .setsockopt             = tcp_setsockopt,
1916         .getsockopt             = tcp_getsockopt,
1917         .recvmsg                = tcp_recvmsg,
1918         .sendmsg                = tcp_sendmsg,
1919         .sendpage               = tcp_sendpage,
1920         .backlog_rcv            = tcp_v6_do_rcv,
1921         .release_cb             = tcp_release_cb,
1922         .mtu_reduced            = tcp_v6_mtu_reduced,
1923         .hash                   = tcp_v6_hash,
1924         .unhash                 = inet_unhash,
1925         .get_port               = inet_csk_get_port,
1926         .enter_memory_pressure  = tcp_enter_memory_pressure,
1927         .stream_memory_free     = tcp_stream_memory_free,
1928         .sockets_allocated      = &tcp_sockets_allocated,
1929         .memory_allocated       = &tcp_memory_allocated,
1930         .memory_pressure        = &tcp_memory_pressure,
1931         .orphan_count           = &tcp_orphan_count,
1932         .sysctl_wmem            = sysctl_tcp_wmem,
1933         .sysctl_rmem            = sysctl_tcp_rmem,
1934         .max_header             = MAX_TCP_HEADER,
1935         .obj_size               = sizeof(struct tcp6_sock),
1936         .slab_flags             = SLAB_DESTROY_BY_RCU,
1937         .twsk_prot              = &tcp6_timewait_sock_ops,
1938         .rsk_prot               = &tcp6_request_sock_ops,
1939         .h.hashinfo             = &tcp_hashinfo,
1940         .no_autobind            = true,
1941 #ifdef CONFIG_COMPAT
1942         .compat_setsockopt      = compat_tcp_setsockopt,
1943         .compat_getsockopt      = compat_tcp_getsockopt,
1944 #endif
1945 #ifdef CONFIG_MEMCG_KMEM
1946         .proto_cgroup           = tcp_proto_cgroup,
1947 #endif
1948         .clear_sk               = tcp_v6_clear_sk,
1949 };
1950
1951 static const struct inet6_protocol tcpv6_protocol = {
1952         .early_demux    =       tcp_v6_early_demux,
1953         .handler        =       tcp_v6_rcv,
1954         .err_handler    =       tcp_v6_err,
1955         .flags          =       INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
1956 };
1957
1958 static struct inet_protosw tcpv6_protosw = {
1959         .type           =       SOCK_STREAM,
1960         .protocol       =       IPPROTO_TCP,
1961         .prot           =       &tcpv6_prot,
1962         .ops            =       &inet6_stream_ops,
1963         .no_check       =       0,
1964         .flags          =       INET_PROTOSW_PERMANENT |
1965                                 INET_PROTOSW_ICSK,
1966 };
1967
1968 static int __net_init tcpv6_net_init(struct net *net)
1969 {
1970         return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
1971                                     SOCK_RAW, IPPROTO_TCP, net);
1972 }
1973
1974 static void __net_exit tcpv6_net_exit(struct net *net)
1975 {
1976         inet_ctl_sock_destroy(net->ipv6.tcp_sk);
1977 }
1978
1979 static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
1980 {
1981         inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
1982 }
1983
1984 static struct pernet_operations tcpv6_net_ops = {
1985         .init       = tcpv6_net_init,
1986         .exit       = tcpv6_net_exit,
1987         .exit_batch = tcpv6_net_exit_batch,
1988 };
1989
1990 int __init tcpv6_init(void)
1991 {
1992         int ret;
1993
1994         ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
1995         if (ret)
1996                 goto out;
1997
1998         /* register inet6 protocol */
1999         ret = inet6_register_protosw(&tcpv6_protosw);
2000         if (ret)
2001                 goto out_tcpv6_protocol;
2002
2003         ret = register_pernet_subsys(&tcpv6_net_ops);
2004         if (ret)
2005                 goto out_tcpv6_protosw;
2006 out:
2007         return ret;
2008
2009 out_tcpv6_protosw:
2010         inet6_unregister_protosw(&tcpv6_protosw);
2011 out_tcpv6_protocol:
2012         inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2013         goto out;
2014 }
2015
2016 void tcpv6_exit(void)
2017 {
2018         unregister_pernet_subsys(&tcpv6_net_ops);
2019         inet6_unregister_protosw(&tcpv6_protosw);
2020         inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2021 }