Merge git://git.kernel.org/pub/scm/linux/kernel/git/mason/btrfs-unstable
[linux-2.6] / net / ipv6 / tcp_ipv6.c
1 /*
2  *      TCP over IPv6
3  *      Linux INET6 implementation
4  *
5  *      Authors:
6  *      Pedro Roque             <roque@di.fc.ul.pt>
7  *
8  *      Based on:
9  *      linux/net/ipv4/tcp.c
10  *      linux/net/ipv4/tcp_input.c
11  *      linux/net/ipv4/tcp_output.c
12  *
13  *      Fixes:
14  *      Hideaki YOSHIFUJI       :       sin6_scope_id support
15  *      YOSHIFUJI Hideaki @USAGI and:   Support IPV6_V6ONLY socket option, which
16  *      Alexey Kuznetsov                allow both IPv4 and IPv6 sockets to bind
17  *                                      a single port at the same time.
18  *      YOSHIFUJI Hideaki @USAGI:       convert /proc/net/tcp6 to seq_file.
19  *
20  *      This program is free software; you can redistribute it and/or
21  *      modify it under the terms of the GNU General Public License
22  *      as published by the Free Software Foundation; either version
23  *      2 of the License, or (at your option) any later version.
24  */
25
26 #include <linux/bottom_half.h>
27 #include <linux/module.h>
28 #include <linux/errno.h>
29 #include <linux/types.h>
30 #include <linux/socket.h>
31 #include <linux/sockios.h>
32 #include <linux/net.h>
33 #include <linux/jiffies.h>
34 #include <linux/in.h>
35 #include <linux/in6.h>
36 #include <linux/netdevice.h>
37 #include <linux/init.h>
38 #include <linux/jhash.h>
39 #include <linux/ipsec.h>
40 #include <linux/times.h>
41
42 #include <linux/ipv6.h>
43 #include <linux/icmpv6.h>
44 #include <linux/random.h>
45
46 #include <net/tcp.h>
47 #include <net/ndisc.h>
48 #include <net/inet6_hashtables.h>
49 #include <net/inet6_connection_sock.h>
50 #include <net/ipv6.h>
51 #include <net/transp_v6.h>
52 #include <net/addrconf.h>
53 #include <net/ip6_route.h>
54 #include <net/ip6_checksum.h>
55 #include <net/inet_ecn.h>
56 #include <net/protocol.h>
57 #include <net/xfrm.h>
58 #include <net/snmp.h>
59 #include <net/dsfield.h>
60 #include <net/timewait_sock.h>
61 #include <net/netdma.h>
62 #include <net/inet_common.h>
63
64 #include <asm/uaccess.h>
65
66 #include <linux/proc_fs.h>
67 #include <linux/seq_file.h>
68
69 #include <linux/crypto.h>
70 #include <linux/scatterlist.h>
71
72 static void     tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
73 static void     tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
74                                       struct request_sock *req);
75
76 static int      tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
77
78 static struct inet_connection_sock_af_ops ipv6_mapped;
79 static struct inet_connection_sock_af_ops ipv6_specific;
80 #ifdef CONFIG_TCP_MD5SIG
81 static struct tcp_sock_af_ops tcp_sock_ipv6_specific;
82 static struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
83 #else
84 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
85                                                    struct in6_addr *addr)
86 {
87         return NULL;
88 }
89 #endif
90
91 static void tcp_v6_hash(struct sock *sk)
92 {
93         if (sk->sk_state != TCP_CLOSE) {
94                 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
95                         tcp_prot.hash(sk);
96                         return;
97                 }
98                 local_bh_disable();
99                 __inet6_hash(sk);
100                 local_bh_enable();
101         }
102 }
103
104 static __inline__ __sum16 tcp_v6_check(int len,
105                                    struct in6_addr *saddr,
106                                    struct in6_addr *daddr,
107                                    __wsum base)
108 {
109         return csum_ipv6_magic(saddr, daddr, len, IPPROTO_TCP, base);
110 }
111
112 static __u32 tcp_v6_init_sequence(struct sk_buff *skb)
113 {
114         return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
115                                             ipv6_hdr(skb)->saddr.s6_addr32,
116                                             tcp_hdr(skb)->dest,
117                                             tcp_hdr(skb)->source);
118 }
119
120 static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
121                           int addr_len)
122 {
123         struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
124         struct inet_sock *inet = inet_sk(sk);
125         struct inet_connection_sock *icsk = inet_csk(sk);
126         struct ipv6_pinfo *np = inet6_sk(sk);
127         struct tcp_sock *tp = tcp_sk(sk);
128         struct in6_addr *saddr = NULL, *final_p = NULL, final;
129         struct flowi fl;
130         struct dst_entry *dst;
131         int addr_type;
132         int err;
133
134         if (addr_len < SIN6_LEN_RFC2133)
135                 return -EINVAL;
136
137         if (usin->sin6_family != AF_INET6)
138                 return(-EAFNOSUPPORT);
139
140         memset(&fl, 0, sizeof(fl));
141
142         if (np->sndflow) {
143                 fl.fl6_flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
144                 IP6_ECN_flow_init(fl.fl6_flowlabel);
145                 if (fl.fl6_flowlabel&IPV6_FLOWLABEL_MASK) {
146                         struct ip6_flowlabel *flowlabel;
147                         flowlabel = fl6_sock_lookup(sk, fl.fl6_flowlabel);
148                         if (flowlabel == NULL)
149                                 return -EINVAL;
150                         ipv6_addr_copy(&usin->sin6_addr, &flowlabel->dst);
151                         fl6_sock_release(flowlabel);
152                 }
153         }
154
155         /*
156          *      connect() to INADDR_ANY means loopback (BSD'ism).
157          */
158
159         if(ipv6_addr_any(&usin->sin6_addr))
160                 usin->sin6_addr.s6_addr[15] = 0x1;
161
162         addr_type = ipv6_addr_type(&usin->sin6_addr);
163
164         if(addr_type & IPV6_ADDR_MULTICAST)
165                 return -ENETUNREACH;
166
167         if (addr_type&IPV6_ADDR_LINKLOCAL) {
168                 if (addr_len >= sizeof(struct sockaddr_in6) &&
169                     usin->sin6_scope_id) {
170                         /* If interface is set while binding, indices
171                          * must coincide.
172                          */
173                         if (sk->sk_bound_dev_if &&
174                             sk->sk_bound_dev_if != usin->sin6_scope_id)
175                                 return -EINVAL;
176
177                         sk->sk_bound_dev_if = usin->sin6_scope_id;
178                 }
179
180                 /* Connect to link-local address requires an interface */
181                 if (!sk->sk_bound_dev_if)
182                         return -EINVAL;
183         }
184
185         if (tp->rx_opt.ts_recent_stamp &&
186             !ipv6_addr_equal(&np->daddr, &usin->sin6_addr)) {
187                 tp->rx_opt.ts_recent = 0;
188                 tp->rx_opt.ts_recent_stamp = 0;
189                 tp->write_seq = 0;
190         }
191
192         ipv6_addr_copy(&np->daddr, &usin->sin6_addr);
193         np->flow_label = fl.fl6_flowlabel;
194
195         /*
196          *      TCP over IPv4
197          */
198
199         if (addr_type == IPV6_ADDR_MAPPED) {
200                 u32 exthdrlen = icsk->icsk_ext_hdr_len;
201                 struct sockaddr_in sin;
202
203                 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
204
205                 if (__ipv6_only_sock(sk))
206                         return -ENETUNREACH;
207
208                 sin.sin_family = AF_INET;
209                 sin.sin_port = usin->sin6_port;
210                 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
211
212                 icsk->icsk_af_ops = &ipv6_mapped;
213                 sk->sk_backlog_rcv = tcp_v4_do_rcv;
214 #ifdef CONFIG_TCP_MD5SIG
215                 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
216 #endif
217
218                 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
219
220                 if (err) {
221                         icsk->icsk_ext_hdr_len = exthdrlen;
222                         icsk->icsk_af_ops = &ipv6_specific;
223                         sk->sk_backlog_rcv = tcp_v6_do_rcv;
224 #ifdef CONFIG_TCP_MD5SIG
225                         tp->af_specific = &tcp_sock_ipv6_specific;
226 #endif
227                         goto failure;
228                 } else {
229                         ipv6_addr_set(&np->saddr, 0, 0, htonl(0x0000FFFF),
230                                       inet->saddr);
231                         ipv6_addr_set(&np->rcv_saddr, 0, 0, htonl(0x0000FFFF),
232                                       inet->rcv_saddr);
233                 }
234
235                 return err;
236         }
237
238         if (!ipv6_addr_any(&np->rcv_saddr))
239                 saddr = &np->rcv_saddr;
240
241         fl.proto = IPPROTO_TCP;
242         ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
243         ipv6_addr_copy(&fl.fl6_src,
244                        (saddr ? saddr : &np->saddr));
245         fl.oif = sk->sk_bound_dev_if;
246         fl.fl_ip_dport = usin->sin6_port;
247         fl.fl_ip_sport = inet->sport;
248
249         if (np->opt && np->opt->srcrt) {
250                 struct rt0_hdr *rt0 = (struct rt0_hdr *)np->opt->srcrt;
251                 ipv6_addr_copy(&final, &fl.fl6_dst);
252                 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
253                 final_p = &final;
254         }
255
256         security_sk_classify_flow(sk, &fl);
257
258         err = ip6_dst_lookup(sk, &dst, &fl);
259         if (err)
260                 goto failure;
261         if (final_p)
262                 ipv6_addr_copy(&fl.fl6_dst, final_p);
263
264         err = __xfrm_lookup(sock_net(sk), &dst, &fl, sk, XFRM_LOOKUP_WAIT);
265         if (err < 0) {
266                 if (err == -EREMOTE)
267                         err = ip6_dst_blackhole(sk, &dst, &fl);
268                 if (err < 0)
269                         goto failure;
270         }
271
272         if (saddr == NULL) {
273                 saddr = &fl.fl6_src;
274                 ipv6_addr_copy(&np->rcv_saddr, saddr);
275         }
276
277         /* set the source address */
278         ipv6_addr_copy(&np->saddr, saddr);
279         inet->rcv_saddr = LOOPBACK4_IPV6;
280
281         sk->sk_gso_type = SKB_GSO_TCPV6;
282         __ip6_dst_store(sk, dst, NULL, NULL);
283
284         icsk->icsk_ext_hdr_len = 0;
285         if (np->opt)
286                 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
287                                           np->opt->opt_nflen);
288
289         tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
290
291         inet->dport = usin->sin6_port;
292
293         tcp_set_state(sk, TCP_SYN_SENT);
294         err = inet6_hash_connect(&tcp_death_row, sk);
295         if (err)
296                 goto late_failure;
297
298         if (!tp->write_seq)
299                 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
300                                                              np->daddr.s6_addr32,
301                                                              inet->sport,
302                                                              inet->dport);
303
304         err = tcp_connect(sk);
305         if (err)
306                 goto late_failure;
307
308         return 0;
309
310 late_failure:
311         tcp_set_state(sk, TCP_CLOSE);
312         __sk_dst_reset(sk);
313 failure:
314         inet->dport = 0;
315         sk->sk_route_caps = 0;
316         return err;
317 }
318
319 static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
320                 int type, int code, int offset, __be32 info)
321 {
322         struct ipv6hdr *hdr = (struct ipv6hdr*)skb->data;
323         const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
324         struct ipv6_pinfo *np;
325         struct sock *sk;
326         int err;
327         struct tcp_sock *tp;
328         __u32 seq;
329         struct net *net = dev_net(skb->dev);
330
331         sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
332                         th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
333
334         if (sk == NULL) {
335                 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
336                                    ICMP6_MIB_INERRORS);
337                 return;
338         }
339
340         if (sk->sk_state == TCP_TIME_WAIT) {
341                 inet_twsk_put(inet_twsk(sk));
342                 return;
343         }
344
345         bh_lock_sock(sk);
346         if (sock_owned_by_user(sk))
347                 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
348
349         if (sk->sk_state == TCP_CLOSE)
350                 goto out;
351
352         tp = tcp_sk(sk);
353         seq = ntohl(th->seq);
354         if (sk->sk_state != TCP_LISTEN &&
355             !between(seq, tp->snd_una, tp->snd_nxt)) {
356                 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
357                 goto out;
358         }
359
360         np = inet6_sk(sk);
361
362         if (type == ICMPV6_PKT_TOOBIG) {
363                 struct dst_entry *dst = NULL;
364
365                 if (sock_owned_by_user(sk))
366                         goto out;
367                 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
368                         goto out;
369
370                 /* icmp should have updated the destination cache entry */
371                 dst = __sk_dst_check(sk, np->dst_cookie);
372
373                 if (dst == NULL) {
374                         struct inet_sock *inet = inet_sk(sk);
375                         struct flowi fl;
376
377                         /* BUGGG_FUTURE: Again, it is not clear how
378                            to handle rthdr case. Ignore this complexity
379                            for now.
380                          */
381                         memset(&fl, 0, sizeof(fl));
382                         fl.proto = IPPROTO_TCP;
383                         ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
384                         ipv6_addr_copy(&fl.fl6_src, &np->saddr);
385                         fl.oif = sk->sk_bound_dev_if;
386                         fl.fl_ip_dport = inet->dport;
387                         fl.fl_ip_sport = inet->sport;
388                         security_skb_classify_flow(skb, &fl);
389
390                         if ((err = ip6_dst_lookup(sk, &dst, &fl))) {
391                                 sk->sk_err_soft = -err;
392                                 goto out;
393                         }
394
395                         if ((err = xfrm_lookup(net, &dst, &fl, sk, 0)) < 0) {
396                                 sk->sk_err_soft = -err;
397                                 goto out;
398                         }
399
400                 } else
401                         dst_hold(dst);
402
403                 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
404                         tcp_sync_mss(sk, dst_mtu(dst));
405                         tcp_simple_retransmit(sk);
406                 } /* else let the usual retransmit timer handle it */
407                 dst_release(dst);
408                 goto out;
409         }
410
411         icmpv6_err_convert(type, code, &err);
412
413         /* Might be for an request_sock */
414         switch (sk->sk_state) {
415                 struct request_sock *req, **prev;
416         case TCP_LISTEN:
417                 if (sock_owned_by_user(sk))
418                         goto out;
419
420                 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
421                                            &hdr->saddr, inet6_iif(skb));
422                 if (!req)
423                         goto out;
424
425                 /* ICMPs are not backlogged, hence we cannot get
426                  * an established socket here.
427                  */
428                 WARN_ON(req->sk != NULL);
429
430                 if (seq != tcp_rsk(req)->snt_isn) {
431                         NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
432                         goto out;
433                 }
434
435                 inet_csk_reqsk_queue_drop(sk, req, prev);
436                 goto out;
437
438         case TCP_SYN_SENT:
439         case TCP_SYN_RECV:  /* Cannot happen.
440                                It can, it SYNs are crossed. --ANK */
441                 if (!sock_owned_by_user(sk)) {
442                         sk->sk_err = err;
443                         sk->sk_error_report(sk);                /* Wake people up to see the error (see connect in sock.c) */
444
445                         tcp_done(sk);
446                 } else
447                         sk->sk_err_soft = err;
448                 goto out;
449         }
450
451         if (!sock_owned_by_user(sk) && np->recverr) {
452                 sk->sk_err = err;
453                 sk->sk_error_report(sk);
454         } else
455                 sk->sk_err_soft = err;
456
457 out:
458         bh_unlock_sock(sk);
459         sock_put(sk);
460 }
461
462
463 static int tcp_v6_send_synack(struct sock *sk, struct request_sock *req)
464 {
465         struct inet6_request_sock *treq = inet6_rsk(req);
466         struct ipv6_pinfo *np = inet6_sk(sk);
467         struct sk_buff * skb;
468         struct ipv6_txoptions *opt = NULL;
469         struct in6_addr * final_p = NULL, final;
470         struct flowi fl;
471         struct dst_entry *dst;
472         int err = -1;
473
474         memset(&fl, 0, sizeof(fl));
475         fl.proto = IPPROTO_TCP;
476         ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
477         ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
478         fl.fl6_flowlabel = 0;
479         fl.oif = treq->iif;
480         fl.fl_ip_dport = inet_rsk(req)->rmt_port;
481         fl.fl_ip_sport = inet_rsk(req)->loc_port;
482         security_req_classify_flow(req, &fl);
483
484         opt = np->opt;
485         if (opt && opt->srcrt) {
486                 struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
487                 ipv6_addr_copy(&final, &fl.fl6_dst);
488                 ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
489                 final_p = &final;
490         }
491
492         err = ip6_dst_lookup(sk, &dst, &fl);
493         if (err)
494                 goto done;
495         if (final_p)
496                 ipv6_addr_copy(&fl.fl6_dst, final_p);
497         if ((err = xfrm_lookup(sock_net(sk), &dst, &fl, sk, 0)) < 0)
498                 goto done;
499
500         skb = tcp_make_synack(sk, dst, req);
501         if (skb) {
502                 struct tcphdr *th = tcp_hdr(skb);
503
504                 th->check = tcp_v6_check(skb->len,
505                                          &treq->loc_addr, &treq->rmt_addr,
506                                          csum_partial(th, skb->len, skb->csum));
507
508                 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
509                 err = ip6_xmit(sk, skb, &fl, opt, 0);
510                 err = net_xmit_eval(err);
511         }
512
513 done:
514         if (opt && opt != np->opt)
515                 sock_kfree_s(sk, opt, opt->tot_len);
516         dst_release(dst);
517         return err;
518 }
519
520 static inline void syn_flood_warning(struct sk_buff *skb)
521 {
522 #ifdef CONFIG_SYN_COOKIES
523         if (sysctl_tcp_syncookies)
524                 printk(KERN_INFO
525                        "TCPv6: Possible SYN flooding on port %d. "
526                        "Sending cookies.\n", ntohs(tcp_hdr(skb)->dest));
527         else
528 #endif
529                 printk(KERN_INFO
530                        "TCPv6: Possible SYN flooding on port %d. "
531                        "Dropping request.\n", ntohs(tcp_hdr(skb)->dest));
532 }
533
534 static void tcp_v6_reqsk_destructor(struct request_sock *req)
535 {
536         kfree_skb(inet6_rsk(req)->pktopts);
537 }
538
539 #ifdef CONFIG_TCP_MD5SIG
540 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
541                                                    struct in6_addr *addr)
542 {
543         struct tcp_sock *tp = tcp_sk(sk);
544         int i;
545
546         BUG_ON(tp == NULL);
547
548         if (!tp->md5sig_info || !tp->md5sig_info->entries6)
549                 return NULL;
550
551         for (i = 0; i < tp->md5sig_info->entries6; i++) {
552                 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, addr))
553                         return &tp->md5sig_info->keys6[i].base;
554         }
555         return NULL;
556 }
557
558 static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
559                                                 struct sock *addr_sk)
560 {
561         return tcp_v6_md5_do_lookup(sk, &inet6_sk(addr_sk)->daddr);
562 }
563
564 static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
565                                                       struct request_sock *req)
566 {
567         return tcp_v6_md5_do_lookup(sk, &inet6_rsk(req)->rmt_addr);
568 }
569
570 static int tcp_v6_md5_do_add(struct sock *sk, struct in6_addr *peer,
571                              char *newkey, u8 newkeylen)
572 {
573         /* Add key to the list */
574         struct tcp_md5sig_key *key;
575         struct tcp_sock *tp = tcp_sk(sk);
576         struct tcp6_md5sig_key *keys;
577
578         key = tcp_v6_md5_do_lookup(sk, peer);
579         if (key) {
580                 /* modify existing entry - just update that one */
581                 kfree(key->key);
582                 key->key = newkey;
583                 key->keylen = newkeylen;
584         } else {
585                 /* reallocate new list if current one is full. */
586                 if (!tp->md5sig_info) {
587                         tp->md5sig_info = kzalloc(sizeof(*tp->md5sig_info), GFP_ATOMIC);
588                         if (!tp->md5sig_info) {
589                                 kfree(newkey);
590                                 return -ENOMEM;
591                         }
592                         sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
593                 }
594                 if (tcp_alloc_md5sig_pool() == NULL) {
595                         kfree(newkey);
596                         return -ENOMEM;
597                 }
598                 if (tp->md5sig_info->alloced6 == tp->md5sig_info->entries6) {
599                         keys = kmalloc((sizeof (tp->md5sig_info->keys6[0]) *
600                                        (tp->md5sig_info->entries6 + 1)), GFP_ATOMIC);
601
602                         if (!keys) {
603                                 tcp_free_md5sig_pool();
604                                 kfree(newkey);
605                                 return -ENOMEM;
606                         }
607
608                         if (tp->md5sig_info->entries6)
609                                 memmove(keys, tp->md5sig_info->keys6,
610                                         (sizeof (tp->md5sig_info->keys6[0]) *
611                                          tp->md5sig_info->entries6));
612
613                         kfree(tp->md5sig_info->keys6);
614                         tp->md5sig_info->keys6 = keys;
615                         tp->md5sig_info->alloced6++;
616                 }
617
618                 ipv6_addr_copy(&tp->md5sig_info->keys6[tp->md5sig_info->entries6].addr,
619                                peer);
620                 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.key = newkey;
621                 tp->md5sig_info->keys6[tp->md5sig_info->entries6].base.keylen = newkeylen;
622
623                 tp->md5sig_info->entries6++;
624         }
625         return 0;
626 }
627
628 static int tcp_v6_md5_add_func(struct sock *sk, struct sock *addr_sk,
629                                u8 *newkey, __u8 newkeylen)
630 {
631         return tcp_v6_md5_do_add(sk, &inet6_sk(addr_sk)->daddr,
632                                  newkey, newkeylen);
633 }
634
635 static int tcp_v6_md5_do_del(struct sock *sk, struct in6_addr *peer)
636 {
637         struct tcp_sock *tp = tcp_sk(sk);
638         int i;
639
640         for (i = 0; i < tp->md5sig_info->entries6; i++) {
641                 if (ipv6_addr_equal(&tp->md5sig_info->keys6[i].addr, peer)) {
642                         /* Free the key */
643                         kfree(tp->md5sig_info->keys6[i].base.key);
644                         tp->md5sig_info->entries6--;
645
646                         if (tp->md5sig_info->entries6 == 0) {
647                                 kfree(tp->md5sig_info->keys6);
648                                 tp->md5sig_info->keys6 = NULL;
649                                 tp->md5sig_info->alloced6 = 0;
650                         } else {
651                                 /* shrink the database */
652                                 if (tp->md5sig_info->entries6 != i)
653                                         memmove(&tp->md5sig_info->keys6[i],
654                                                 &tp->md5sig_info->keys6[i+1],
655                                                 (tp->md5sig_info->entries6 - i)
656                                                 * sizeof (tp->md5sig_info->keys6[0]));
657                         }
658                         tcp_free_md5sig_pool();
659                         return 0;
660                 }
661         }
662         return -ENOENT;
663 }
664
665 static void tcp_v6_clear_md5_list (struct sock *sk)
666 {
667         struct tcp_sock *tp = tcp_sk(sk);
668         int i;
669
670         if (tp->md5sig_info->entries6) {
671                 for (i = 0; i < tp->md5sig_info->entries6; i++)
672                         kfree(tp->md5sig_info->keys6[i].base.key);
673                 tp->md5sig_info->entries6 = 0;
674                 tcp_free_md5sig_pool();
675         }
676
677         kfree(tp->md5sig_info->keys6);
678         tp->md5sig_info->keys6 = NULL;
679         tp->md5sig_info->alloced6 = 0;
680
681         if (tp->md5sig_info->entries4) {
682                 for (i = 0; i < tp->md5sig_info->entries4; i++)
683                         kfree(tp->md5sig_info->keys4[i].base.key);
684                 tp->md5sig_info->entries4 = 0;
685                 tcp_free_md5sig_pool();
686         }
687
688         kfree(tp->md5sig_info->keys4);
689         tp->md5sig_info->keys4 = NULL;
690         tp->md5sig_info->alloced4 = 0;
691 }
692
693 static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
694                                   int optlen)
695 {
696         struct tcp_md5sig cmd;
697         struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
698         u8 *newkey;
699
700         if (optlen < sizeof(cmd))
701                 return -EINVAL;
702
703         if (copy_from_user(&cmd, optval, sizeof(cmd)))
704                 return -EFAULT;
705
706         if (sin6->sin6_family != AF_INET6)
707                 return -EINVAL;
708
709         if (!cmd.tcpm_keylen) {
710                 if (!tcp_sk(sk)->md5sig_info)
711                         return -ENOENT;
712                 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
713                         return tcp_v4_md5_do_del(sk, sin6->sin6_addr.s6_addr32[3]);
714                 return tcp_v6_md5_do_del(sk, &sin6->sin6_addr);
715         }
716
717         if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
718                 return -EINVAL;
719
720         if (!tcp_sk(sk)->md5sig_info) {
721                 struct tcp_sock *tp = tcp_sk(sk);
722                 struct tcp_md5sig_info *p;
723
724                 p = kzalloc(sizeof(struct tcp_md5sig_info), GFP_KERNEL);
725                 if (!p)
726                         return -ENOMEM;
727
728                 tp->md5sig_info = p;
729                 sk->sk_route_caps &= ~NETIF_F_GSO_MASK;
730         }
731
732         newkey = kmemdup(cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
733         if (!newkey)
734                 return -ENOMEM;
735         if (ipv6_addr_v4mapped(&sin6->sin6_addr)) {
736                 return tcp_v4_md5_do_add(sk, sin6->sin6_addr.s6_addr32[3],
737                                          newkey, cmd.tcpm_keylen);
738         }
739         return tcp_v6_md5_do_add(sk, &sin6->sin6_addr, newkey, cmd.tcpm_keylen);
740 }
741
742 static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
743                                         struct in6_addr *daddr,
744                                         struct in6_addr *saddr, int nbytes)
745 {
746         struct tcp6_pseudohdr *bp;
747         struct scatterlist sg;
748
749         bp = &hp->md5_blk.ip6;
750         /* 1. TCP pseudo-header (RFC2460) */
751         ipv6_addr_copy(&bp->saddr, saddr);
752         ipv6_addr_copy(&bp->daddr, daddr);
753         bp->protocol = cpu_to_be32(IPPROTO_TCP);
754         bp->len = cpu_to_be32(nbytes);
755
756         sg_init_one(&sg, bp, sizeof(*bp));
757         return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
758 }
759
760 static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
761                                struct in6_addr *daddr, struct in6_addr *saddr,
762                                struct tcphdr *th)
763 {
764         struct tcp_md5sig_pool *hp;
765         struct hash_desc *desc;
766
767         hp = tcp_get_md5sig_pool();
768         if (!hp)
769                 goto clear_hash_noput;
770         desc = &hp->md5_desc;
771
772         if (crypto_hash_init(desc))
773                 goto clear_hash;
774         if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
775                 goto clear_hash;
776         if (tcp_md5_hash_header(hp, th))
777                 goto clear_hash;
778         if (tcp_md5_hash_key(hp, key))
779                 goto clear_hash;
780         if (crypto_hash_final(desc, md5_hash))
781                 goto clear_hash;
782
783         tcp_put_md5sig_pool();
784         return 0;
785
786 clear_hash:
787         tcp_put_md5sig_pool();
788 clear_hash_noput:
789         memset(md5_hash, 0, 16);
790         return 1;
791 }
792
793 static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
794                                struct sock *sk, struct request_sock *req,
795                                struct sk_buff *skb)
796 {
797         struct in6_addr *saddr, *daddr;
798         struct tcp_md5sig_pool *hp;
799         struct hash_desc *desc;
800         struct tcphdr *th = tcp_hdr(skb);
801
802         if (sk) {
803                 saddr = &inet6_sk(sk)->saddr;
804                 daddr = &inet6_sk(sk)->daddr;
805         } else if (req) {
806                 saddr = &inet6_rsk(req)->loc_addr;
807                 daddr = &inet6_rsk(req)->rmt_addr;
808         } else {
809                 struct ipv6hdr *ip6h = ipv6_hdr(skb);
810                 saddr = &ip6h->saddr;
811                 daddr = &ip6h->daddr;
812         }
813
814         hp = tcp_get_md5sig_pool();
815         if (!hp)
816                 goto clear_hash_noput;
817         desc = &hp->md5_desc;
818
819         if (crypto_hash_init(desc))
820                 goto clear_hash;
821
822         if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
823                 goto clear_hash;
824         if (tcp_md5_hash_header(hp, th))
825                 goto clear_hash;
826         if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
827                 goto clear_hash;
828         if (tcp_md5_hash_key(hp, key))
829                 goto clear_hash;
830         if (crypto_hash_final(desc, md5_hash))
831                 goto clear_hash;
832
833         tcp_put_md5sig_pool();
834         return 0;
835
836 clear_hash:
837         tcp_put_md5sig_pool();
838 clear_hash_noput:
839         memset(md5_hash, 0, 16);
840         return 1;
841 }
842
843 static int tcp_v6_inbound_md5_hash (struct sock *sk, struct sk_buff *skb)
844 {
845         __u8 *hash_location = NULL;
846         struct tcp_md5sig_key *hash_expected;
847         struct ipv6hdr *ip6h = ipv6_hdr(skb);
848         struct tcphdr *th = tcp_hdr(skb);
849         int genhash;
850         u8 newhash[16];
851
852         hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
853         hash_location = tcp_parse_md5sig_option(th);
854
855         /* We've parsed the options - do we have a hash? */
856         if (!hash_expected && !hash_location)
857                 return 0;
858
859         if (hash_expected && !hash_location) {
860                 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
861                 return 1;
862         }
863
864         if (!hash_expected && hash_location) {
865                 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
866                 return 1;
867         }
868
869         /* check the signature */
870         genhash = tcp_v6_md5_hash_skb(newhash,
871                                       hash_expected,
872                                       NULL, NULL, skb);
873
874         if (genhash || memcmp(hash_location, newhash, 16) != 0) {
875                 if (net_ratelimit()) {
876                         printk(KERN_INFO "MD5 Hash %s for (%pI6, %u)->(%pI6, %u)\n",
877                                genhash ? "failed" : "mismatch",
878                                &ip6h->saddr, ntohs(th->source),
879                                &ip6h->daddr, ntohs(th->dest));
880                 }
881                 return 1;
882         }
883         return 0;
884 }
885 #endif
886
887 struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
888         .family         =       AF_INET6,
889         .obj_size       =       sizeof(struct tcp6_request_sock),
890         .rtx_syn_ack    =       tcp_v6_send_synack,
891         .send_ack       =       tcp_v6_reqsk_send_ack,
892         .destructor     =       tcp_v6_reqsk_destructor,
893         .send_reset     =       tcp_v6_send_reset
894 };
895
#ifdef CONFIG_TCP_MD5SIG
/* Address-family specific hook: MD5 key lookup for IPv6 request socks. */
static struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
        .md5_lookup = tcp_v6_reqsk_md5_lookup,
};
#endif /* CONFIG_TCP_MD5SIG */
901
902 static struct timewait_sock_ops tcp6_timewait_sock_ops = {
903         .twsk_obj_size  = sizeof(struct tcp6_timewait_sock),
904         .twsk_unique    = tcp_twsk_unique,
905         .twsk_destructor= tcp_twsk_destructor,
906 };
907
908 static void tcp_v6_send_check(struct sock *sk, int len, struct sk_buff *skb)
909 {
910         struct ipv6_pinfo *np = inet6_sk(sk);
911         struct tcphdr *th = tcp_hdr(skb);
912
913         if (skb->ip_summed == CHECKSUM_PARTIAL) {
914                 th->check = ~csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP,  0);
915                 skb->csum_start = skb_transport_header(skb) - skb->head;
916                 skb->csum_offset = offsetof(struct tcphdr, check);
917         } else {
918                 th->check = csum_ipv6_magic(&np->saddr, &np->daddr, len, IPPROTO_TCP,
919                                             csum_partial(th, th->doff<<2,
920                                                          skb->csum));
921         }
922 }
923
924 static int tcp_v6_gso_send_check(struct sk_buff *skb)
925 {
926         struct ipv6hdr *ipv6h;
927         struct tcphdr *th;
928
929         if (!pskb_may_pull(skb, sizeof(*th)))
930                 return -EINVAL;
931
932         ipv6h = ipv6_hdr(skb);
933         th = tcp_hdr(skb);
934
935         th->check = 0;
936         th->check = ~csum_ipv6_magic(&ipv6h->saddr, &ipv6h->daddr, skb->len,
937                                      IPPROTO_TCP, 0);
938         skb->csum_start = skb_transport_header(skb) - skb->head;
939         skb->csum_offset = offsetof(struct tcphdr, check);
940         skb->ip_summed = CHECKSUM_PARTIAL;
941         return 0;
942 }
943
944 struct sk_buff **tcp6_gro_receive(struct sk_buff **head, struct sk_buff *skb)
945 {
946         struct ipv6hdr *iph = ipv6_hdr(skb);
947
948         switch (skb->ip_summed) {
949         case CHECKSUM_COMPLETE:
950                 if (!tcp_v6_check(skb_gro_len(skb), &iph->saddr, &iph->daddr,
951                                   skb->csum)) {
952                         skb->ip_summed = CHECKSUM_UNNECESSARY;
953                         break;
954                 }
955
956                 /* fall through */
957         case CHECKSUM_NONE:
958                 NAPI_GRO_CB(skb)->flush = 1;
959                 return NULL;
960         }
961
962         return tcp_gro_receive(head, skb);
963 }
964 EXPORT_SYMBOL(tcp6_gro_receive);
965
966 int tcp6_gro_complete(struct sk_buff *skb)
967 {
968         struct ipv6hdr *iph = ipv6_hdr(skb);
969         struct tcphdr *th = tcp_hdr(skb);
970
971         th->check = ~tcp_v6_check(skb->len - skb_transport_offset(skb),
972                                   &iph->saddr, &iph->daddr, 0);
973         skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
974
975         return tcp_gro_complete(skb);
976 }
977 EXPORT_SYMBOL(tcp6_gro_complete);
978
979 static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
980                                  u32 ts, struct tcp_md5sig_key *key, int rst)
981 {
982         struct tcphdr *th = tcp_hdr(skb), *t1;
983         struct sk_buff *buff;
984         struct flowi fl;
985         struct net *net = dev_net(skb->dst->dev);
986         struct sock *ctl_sk = net->ipv6.tcp_sk;
987         unsigned int tot_len = sizeof(struct tcphdr);
988         __be32 *topt;
989
990         if (ts)
991                 tot_len += TCPOLEN_TSTAMP_ALIGNED;
992 #ifdef CONFIG_TCP_MD5SIG
993         if (key)
994                 tot_len += TCPOLEN_MD5SIG_ALIGNED;
995 #endif
996
997         buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
998                          GFP_ATOMIC);
999         if (buff == NULL)
1000                 return;
1001
1002         skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
1003
1004         t1 = (struct tcphdr *) skb_push(buff, tot_len);
1005
1006         /* Swap the send and the receive. */
1007         memset(t1, 0, sizeof(*t1));
1008         t1->dest = th->source;
1009         t1->source = th->dest;
1010         t1->doff = tot_len / 4;
1011         t1->seq = htonl(seq);
1012         t1->ack_seq = htonl(ack);
1013         t1->ack = !rst || !th->ack;
1014         t1->rst = rst;
1015         t1->window = htons(win);
1016
1017         topt = (__be32 *)(t1 + 1);
1018
1019         if (ts) {
1020                 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1021                                 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
1022                 *topt++ = htonl(tcp_time_stamp);
1023                 *topt++ = htonl(ts);
1024         }
1025
1026 #ifdef CONFIG_TCP_MD5SIG
1027         if (key) {
1028                 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
1029                                 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
1030                 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
1031                                     &ipv6_hdr(skb)->saddr,
1032                                     &ipv6_hdr(skb)->daddr, t1);
1033         }
1034 #endif
1035
1036         buff->csum = csum_partial(t1, tot_len, 0);
1037
1038         memset(&fl, 0, sizeof(fl));
1039         ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
1040         ipv6_addr_copy(&fl.fl6_src, &ipv6_hdr(skb)->daddr);
1041
1042         t1->check = csum_ipv6_magic(&fl.fl6_src, &fl.fl6_dst,
1043                                     tot_len, IPPROTO_TCP,
1044                                     buff->csum);
1045
1046         fl.proto = IPPROTO_TCP;
1047         fl.oif = inet6_iif(skb);
1048         fl.fl_ip_dport = t1->dest;
1049         fl.fl_ip_sport = t1->source;
1050         security_skb_classify_flow(skb, &fl);
1051
1052         /* Pass a socket to ip6_dst_lookup either it is for RST
1053          * Underlying function will use this to retrieve the network
1054          * namespace
1055          */
1056         if (!ip6_dst_lookup(ctl_sk, &buff->dst, &fl)) {
1057                 if (xfrm_lookup(net, &buff->dst, &fl, NULL, 0) >= 0) {
1058                         ip6_xmit(ctl_sk, buff, &fl, NULL, 0);
1059                         TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
1060                         if (rst)
1061                                 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
1062                         return;
1063                 }
1064         }
1065
1066         kfree_skb(buff);
1067 }
1068
1069 static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
1070 {
1071         struct tcphdr *th = tcp_hdr(skb);
1072         u32 seq = 0, ack_seq = 0;
1073         struct tcp_md5sig_key *key = NULL;
1074
1075         if (th->rst)
1076                 return;
1077
1078         if (!ipv6_unicast_destination(skb))
1079                 return;
1080
1081 #ifdef CONFIG_TCP_MD5SIG
1082         if (sk)
1083                 key = tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr);
1084 #endif
1085
1086         if (th->ack)
1087                 seq = ntohl(th->ack_seq);
1088         else
1089                 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
1090                           (th->doff << 2);
1091
1092         tcp_v6_send_response(skb, seq, ack_seq, 0, 0, key, 1);
1093 }
1094
1095 static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack, u32 win, u32 ts,
1096                             struct tcp_md5sig_key *key)
1097 {
1098         tcp_v6_send_response(skb, seq, ack, win, ts, key, 0);
1099 }
1100
1101 static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
1102 {
1103         struct inet_timewait_sock *tw = inet_twsk(sk);
1104         struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
1105
1106         tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
1107                         tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
1108                         tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw));
1109
1110         inet_twsk_put(tw);
1111 }
1112
1113 static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
1114                                   struct request_sock *req)
1115 {
1116         tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1, req->rcv_wnd, req->ts_recent,
1117                         tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr));
1118 }
1119
1120
1121 static struct sock *tcp_v6_hnd_req(struct sock *sk,struct sk_buff *skb)
1122 {
1123         struct request_sock *req, **prev;
1124         const struct tcphdr *th = tcp_hdr(skb);
1125         struct sock *nsk;
1126
1127         /* Find possible connection requests. */
1128         req = inet6_csk_search_req(sk, &prev, th->source,
1129                                    &ipv6_hdr(skb)->saddr,
1130                                    &ipv6_hdr(skb)->daddr, inet6_iif(skb));
1131         if (req)
1132                 return tcp_check_req(sk, skb, req, prev);
1133
1134         nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
1135                         &ipv6_hdr(skb)->saddr, th->source,
1136                         &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
1137
1138         if (nsk) {
1139                 if (nsk->sk_state != TCP_TIME_WAIT) {
1140                         bh_lock_sock(nsk);
1141                         return nsk;
1142                 }
1143                 inet_twsk_put(inet_twsk(nsk));
1144                 return NULL;
1145         }
1146
1147 #ifdef CONFIG_SYN_COOKIES
1148         if (!th->rst && !th->syn && th->ack)
1149                 sk = cookie_v6_check(sk, skb);
1150 #endif
1151         return sk;
1152 }
1153
1154 /* FIXME: this is substantially similar to the ipv4 code.
1155  * Can some kind of merge be done? -- erics
1156  */
     /*
      * Handle a connection request (skb) arriving on listening socket sk.
      *
      * Allocates a request sock, parses the TCP options, records the
      * peer/local addresses, picks an initial sequence number, sends the
      * SYN-ACK and, unless running in syncookie mode, adds the request to
      * the listener's request hash.
      *
      * IPv4 packets (ETH_P_IP) are handed to tcp_v4_conn_request() and its
      * result is returned.  Every other path returns 0, including the drop
      * paths, so no reset is sent for a refused request.
      */
1157 static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
1158 {
1159         struct inet6_request_sock *treq;
1160         struct ipv6_pinfo *np = inet6_sk(sk);
1161         struct tcp_options_received tmp_opt;
1162         struct tcp_sock *tp = tcp_sk(sk);
1163         struct request_sock *req = NULL;
              /* ISN preset in the skb control block; 0 means "none yet" */
1164         __u32 isn = TCP_SKB_CB(skb)->when;
              /* without syncookie support want_cookie is a constant 0 */
1165 #ifdef CONFIG_SYN_COOKIES
1166         int want_cookie = 0;
1167 #else
1168 #define want_cookie 0
1169 #endif
1170
1171         if (skb->protocol == htons(ETH_P_IP))
1172                 return tcp_v4_conn_request(sk, skb);
1173
1174         if (!ipv6_unicast_destination(skb))
1175                 goto drop;
1176
              /* Request queue full and no preset ISN: warn (rate limited),
               * then fall back to syncookies if enabled, else drop.
               */
1177         if (inet_csk_reqsk_queue_is_full(sk) && !isn) {
1178                 if (net_ratelimit())
1179                         syn_flood_warning(skb);
1180 #ifdef CONFIG_SYN_COOKIES
1181                 if (sysctl_tcp_syncookies)
1182                         want_cookie = 1;
1183                 else
1184 #endif
1185                 goto drop;
1186         }
1187
              /* Accept queue full and more than one young request pending */
1188         if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1)
1189                 goto drop;
1190
1191         req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
1192         if (req == NULL)
1193                 goto drop;
1194
1195 #ifdef CONFIG_TCP_MD5SIG
1196         tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
1197 #endif
1198
              /* Start from cleared options with the MSS clamped to what fits
               * in a minimum-MTU IPv6 packet, then parse the segment's options.
               */
1199         tcp_clear_options(&tmp_opt);
1200         tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1201         tmp_opt.user_mss = tp->rx_opt.user_mss;
1202
1203         tcp_parse_options(skb, &tmp_opt, 0);
1204
              /* In cookie mode the parsed options are kept only when a
               * timestamp was seen; otherwise they are discarded.
               */
1205         if (want_cookie && !tmp_opt.saw_tstamp)
1206                 tcp_clear_options(&tmp_opt);
1207
1208         tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1209         tcp_openreq_init(req, &tmp_opt, skb);
1210
1211         treq = inet6_rsk(req);
1212         ipv6_addr_copy(&treq->rmt_addr, &ipv6_hdr(skb)->saddr);
1213         ipv6_addr_copy(&treq->loc_addr, &ipv6_hdr(skb)->daddr);
1214         if (!want_cookie)
1215                 TCP_ECN_create_request(req, tcp_hdr(skb));
1216
1217         if (want_cookie) {
1218                 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1219                 req->cookie_ts = tmp_opt.tstamp_ok;
1220         } else if (!isn) {
                      /* Keep a reference to the SYN when its packet options
                       * are accepted or any of the listed rx option bits is
                       * set on the listener.
                       */
1221                 if (ipv6_opt_accepted(sk, skb) ||
1222                     np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1223                     np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim) {
1224                         atomic_inc(&skb->users);
1225                         treq->pktopts = skb;
1226                 }
1227                 treq->iif = sk->sk_bound_dev_if;
1228
1229                 /* So that link locals have meaning */
1230                 if (!sk->sk_bound_dev_if &&
1231                     ipv6_addr_type(&treq->rmt_addr) & IPV6_ADDR_LINKLOCAL)
1232                         treq->iif = inet6_iif(skb);
1233
1234                 isn = tcp_v6_init_sequence(skb);
1235         }
1236
1237         tcp_rsk(req)->snt_isn = isn;
1238
1239         security_inet_conn_request(sk, skb, req);
1240
1241         if (tcp_v6_send_synack(sk, req))
1242                 goto drop;
1243
1244         if (!want_cookie) {
1245                 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1246                 return 0;
1247         }
1248
              /* Cookie mode falls through here: the request is not queued,
               * so it is freed together with the real drop cases.
               */
1249 drop:
1250         if (req)
1251                 reqsk_free(req);
1252
1253         return 0; /* don't send reset */
1254 }
1255
1256 static struct sock * tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
1257                                           struct request_sock *req,
1258                                           struct dst_entry *dst)
1259 {
1260         struct inet6_request_sock *treq;
1261         struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1262         struct tcp6_sock *newtcp6sk;
1263         struct inet_sock *newinet;
1264         struct tcp_sock *newtp;
1265         struct sock *newsk;
1266         struct ipv6_txoptions *opt;
1267 #ifdef CONFIG_TCP_MD5SIG
1268         struct tcp_md5sig_key *key;
1269 #endif
1270
1271         if (skb->protocol == htons(ETH_P_IP)) {
1272                 /*
1273                  *      v6 mapped
1274                  */
1275
1276                 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1277
1278                 if (newsk == NULL)
1279                         return NULL;
1280
1281                 newtcp6sk = (struct tcp6_sock *)newsk;
1282                 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1283
1284                 newinet = inet_sk(newsk);
1285                 newnp = inet6_sk(newsk);
1286                 newtp = tcp_sk(newsk);
1287
1288                 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1289
1290                 ipv6_addr_set(&newnp->daddr, 0, 0, htonl(0x0000FFFF),
1291                               newinet->daddr);
1292
1293                 ipv6_addr_set(&newnp->saddr, 0, 0, htonl(0x0000FFFF),
1294                               newinet->saddr);
1295
1296                 ipv6_addr_copy(&newnp->rcv_saddr, &newnp->saddr);
1297
1298                 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1299                 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
1300 #ifdef CONFIG_TCP_MD5SIG
1301                 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1302 #endif
1303
1304                 newnp->pktoptions  = NULL;
1305                 newnp->opt         = NULL;
1306                 newnp->mcast_oif   = inet6_iif(skb);
1307                 newnp->mcast_hops  = ipv6_hdr(skb)->hop_limit;
1308
1309                 /*
1310                  * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1311                  * here, tcp_create_openreq_child now does this for us, see the comment in
1312                  * that function for the gory details. -acme
1313                  */
1314
1315                 /* It is tricky place. Until this moment IPv4 tcp
1316                    worked with IPv6 icsk.icsk_af_ops.
1317                    Sync it now.
1318                  */
1319                 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1320
1321                 return newsk;
1322         }
1323
1324         treq = inet6_rsk(req);
1325         opt = np->opt;
1326
1327         if (sk_acceptq_is_full(sk))
1328                 goto out_overflow;
1329
1330         if (dst == NULL) {
1331                 struct in6_addr *final_p = NULL, final;
1332                 struct flowi fl;
1333
1334                 memset(&fl, 0, sizeof(fl));
1335                 fl.proto = IPPROTO_TCP;
1336                 ipv6_addr_copy(&fl.fl6_dst, &treq->rmt_addr);
1337                 if (opt && opt->srcrt) {
1338                         struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
1339                         ipv6_addr_copy(&final, &fl.fl6_dst);
1340                         ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
1341                         final_p = &final;
1342                 }
1343                 ipv6_addr_copy(&fl.fl6_src, &treq->loc_addr);
1344                 fl.oif = sk->sk_bound_dev_if;
1345                 fl.fl_ip_dport = inet_rsk(req)->rmt_port;
1346                 fl.fl_ip_sport = inet_rsk(req)->loc_port;
1347                 security_req_classify_flow(req, &fl);
1348
1349                 if (ip6_dst_lookup(sk, &dst, &fl))
1350                         goto out;
1351
1352                 if (final_p)
1353                         ipv6_addr_copy(&fl.fl6_dst, final_p);
1354
1355                 if ((xfrm_lookup(sock_net(sk), &dst, &fl, sk, 0)) < 0)
1356                         goto out;
1357         }
1358
1359         newsk = tcp_create_openreq_child(sk, req, skb);
1360         if (newsk == NULL)
1361                 goto out;
1362
1363         /*
1364          * No need to charge this sock to the relevant IPv6 refcnt debug socks
1365          * count here, tcp_create_openreq_child now does this for us, see the
1366          * comment in that function for the gory details. -acme
1367          */
1368
1369         newsk->sk_gso_type = SKB_GSO_TCPV6;
1370         __ip6_dst_store(newsk, dst, NULL, NULL);
1371
1372         newtcp6sk = (struct tcp6_sock *)newsk;
1373         inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1374
1375         newtp = tcp_sk(newsk);
1376         newinet = inet_sk(newsk);
1377         newnp = inet6_sk(newsk);
1378
1379         memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1380
1381         ipv6_addr_copy(&newnp->daddr, &treq->rmt_addr);
1382         ipv6_addr_copy(&newnp->saddr, &treq->loc_addr);
1383         ipv6_addr_copy(&newnp->rcv_saddr, &treq->loc_addr);
1384         newsk->sk_bound_dev_if = treq->iif;
1385
1386         /* Now IPv6 options...
1387
1388            First: no IPv4 options.
1389          */
1390         newinet->opt = NULL;
1391         newnp->ipv6_fl_list = NULL;
1392
1393         /* Clone RX bits */
1394         newnp->rxopt.all = np->rxopt.all;
1395
1396         /* Clone pktoptions received with SYN */
1397         newnp->pktoptions = NULL;
1398         if (treq->pktopts != NULL) {
1399                 newnp->pktoptions = skb_clone(treq->pktopts, GFP_ATOMIC);
1400                 kfree_skb(treq->pktopts);
1401                 treq->pktopts = NULL;
1402                 if (newnp->pktoptions)
1403                         skb_set_owner_r(newnp->pktoptions, newsk);
1404         }
1405         newnp->opt        = NULL;
1406         newnp->mcast_oif  = inet6_iif(skb);
1407         newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1408
1409         /* Clone native IPv6 options from listening socket (if any)
1410
1411            Yes, keeping reference count would be much more clever,
1412            but we make one more one thing there: reattach optmem
1413            to newsk.
1414          */
1415         if (opt) {
1416                 newnp->opt = ipv6_dup_options(newsk, opt);
1417                 if (opt != np->opt)
1418                         sock_kfree_s(sk, opt, opt->tot_len);
1419         }
1420
1421         inet_csk(newsk)->icsk_ext_hdr_len = 0;
1422         if (newnp->opt)
1423                 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1424                                                      newnp->opt->opt_flen);
1425
1426         tcp_mtup_init(newsk);
1427         tcp_sync_mss(newsk, dst_mtu(dst));
1428         newtp->advmss = dst_metric(dst, RTAX_ADVMSS);
1429         tcp_initialize_rcv_mss(newsk);
1430
1431         newinet->daddr = newinet->saddr = newinet->rcv_saddr = LOOPBACK4_IPV6;
1432
1433 #ifdef CONFIG_TCP_MD5SIG
1434         /* Copy over the MD5 key from the original socket */
1435         if ((key = tcp_v6_md5_do_lookup(sk, &newnp->daddr)) != NULL) {
1436                 /* We're using one, so create a matching key
1437                  * on the newsk structure. If we fail to get
1438                  * memory, then we end up not copying the key
1439                  * across. Shucks.
1440                  */
1441                 char *newkey = kmemdup(key->key, key->keylen, GFP_ATOMIC);
1442                 if (newkey != NULL)
1443                         tcp_v6_md5_do_add(newsk, &inet6_sk(sk)->daddr,
1444                                           newkey, key->keylen);
1445         }
1446 #endif
1447
1448         __inet6_hash(newsk);
1449         __inet_inherit_port(sk, newsk);
1450
1451         return newsk;
1452
1453 out_overflow:
1454         NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
1455 out:
1456         NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1457         if (opt && opt != np->opt)
1458                 sock_kfree_s(sk, opt, opt->tot_len);
1459         dst_release(dst);
1460         return NULL;
1461 }
1462
1463 static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1464 {
1465         if (skb->ip_summed == CHECKSUM_COMPLETE) {
1466                 if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
1467                                   &ipv6_hdr(skb)->daddr, skb->csum)) {
1468                         skb->ip_summed = CHECKSUM_UNNECESSARY;
1469                         return 0;
1470                 }
1471         }
1472
1473         skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
1474                                               &ipv6_hdr(skb)->saddr,
1475                                               &ipv6_hdr(skb)->daddr, 0));
1476
1477         if (skb->len <= 76) {
1478                 return __skb_checksum_complete(skb);
1479         }
1480         return 0;
1481 }
1482
1483 /* The socket must have its spinlock held when we get
1484  * here.
1485  *
1486  * We have a potential double-lock case here, so even when
1487  * doing backlog processing we use the BH locking scheme.
1488  * This is because we cannot sleep with the original spinlock
1489  * held.
1490  */
     /*
      * Per-socket receive routine for TCP over IPv6.
      *
      * IPv4 packets are handed to tcp_v4_do_rcv().  Everything else is
      * checked against the MD5 signature (if configured) and the socket
      * filter, then dispatched by socket state: established fast path,
      * listener (request / child handling), or the generic state machine.
      *
      * Every IPv6 path returns 0; the skb is either consumed by the TCP
      * code or freed here.  When the socket has any rx option bit set, a
      * clone of the skb is taken up front and may be latched into
      * np->pktoptions at the end (see ipv6_pktoptions below).
      */
1491 static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1492 {
1493         struct ipv6_pinfo *np = inet6_sk(sk);
1494         struct tcp_sock *tp;
1495         struct sk_buff *opt_skb = NULL;
1496
1497         /* Imagine: socket is IPv6. IPv4 packet arrives,
1498            goes to IPv4 receive handler and backlogged.
1499            From backlog it always goes here. Kerboom...
1500            Fortunately, tcp_rcv_established and rcv_established
1501            handle them correctly, but it is not case with
1502            tcp_v6_hnd_req and tcp_v6_send_reset().   --ANK
1503          */
1504
1505         if (skb->protocol == htons(ETH_P_IP))
1506                 return tcp_v4_do_rcv(sk, skb);
1507
1508 #ifdef CONFIG_TCP_MD5SIG
1509         if (tcp_v6_inbound_md5_hash (sk, skb))
1510                 goto discard;
1511 #endif
1512
1513         if (sk_filter(sk, skb))
1514                 goto discard;
1515
1516         /*
1517          *      socket locking is here for SMP purposes as backlog rcv
1518          *      is currently called with bh processing disabled.
1519          */
1520
1521         /* Do Stevens' IPV6_PKTOPTIONS.
1522
1523            Yes, guys, it is the only place in our code, where we
1524            may make it not affecting IPv4.
1525            The rest of code is protocol independent,
1526            and I do not like idea to uglify IPv4.
1527
1528            Actually, all the idea behind IPV6_PKTOPTIONS
1529            looks not very well thought. For now we latch
1530            options, received in the last packet, enqueued
1531            by tcp. Feel free to propose better solution.
1532                                                --ANK (980728)
1533          */
              /* A failed clone just leaves opt_skb NULL: no options latched */
1534         if (np->rxopt.all)
1535                 opt_skb = skb_clone(skb, GFP_ATOMIC);
1536
1537         if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
1538                 TCP_CHECK_TIMER(sk);
1539                 if (tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len))
1540                         goto reset;
1541                 TCP_CHECK_TIMER(sk);
1542                 if (opt_skb)
1543                         goto ipv6_pktoptions;
1544                 return 0;
1545         }
1546
              /* Outside the fast path: reject truncated headers and bad checksums */
1547         if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1548                 goto csum_err;
1549
1550         if (sk->sk_state == TCP_LISTEN) {
1551                 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1552                 if (!nsk)
1553                         goto discard;
1554
1555                 /*
1556                  * Queue it on the new socket if the new socket is active,
1557                  * otherwise we just shortcircuit this and continue with
1558                  * the new socket..
1559                  */
1560                 if(nsk != sk) {
1561                         if (tcp_child_process(sk, nsk, skb))
1562                                 goto reset;
                              /* handled by the child: the clone is not latched here */
1563                         if (opt_skb)
1564                                 __kfree_skb(opt_skb);
1565                         return 0;
1566                 }
1567         }
1568
1569         TCP_CHECK_TIMER(sk);
1570         if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1571                 goto reset;
1572         TCP_CHECK_TIMER(sk);
1573         if (opt_skb)
1574                 goto ipv6_pktoptions;
1575         return 0;
1576
      /* reset falls through into discard: send the RST, then free both skbs */
1577 reset:
1578         tcp_v6_send_reset(sk, skb);
1579 discard:
1580         if (opt_skb)
1581                 __kfree_skb(opt_skb);
1582         kfree_skb(skb);
1583         return 0;
1584 csum_err:
1585         TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1586         goto discard;
1587
1588
1589 ipv6_pktoptions:
1590         /* Do you ask, what is it?
1591
1592            1. skb was enqueued by tcp.
1593            2. skb is added to tail of read queue, rather than out of order.
1594            3. socket is not in passive state.
1595            4. Finally, it really contains options, which user wants to receive.
1596          */
1597         tp = tcp_sk(sk);
1598         if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1599             !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
1600                 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
1601                         np->mcast_oif = inet6_iif(opt_skb);
1602                 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
1603                         np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
                      /* Either way opt_skb ends up holding whatever was latched
                       * before (possibly NULL), which is freed below.
                       */
1604                 if (ipv6_opt_accepted(sk, opt_skb)) {
1605                         skb_set_owner_r(opt_skb, sk);
1606                         opt_skb = xchg(&np->pktoptions, opt_skb);
1607                 } else {
1608                         __kfree_skb(opt_skb);
1609                         opt_skb = xchg(&np->pktoptions, NULL);
1610                 }
1611         }
1612
1613         kfree_skb(opt_skb);
1614         return 0;
1615 }
1616
1617 static int tcp_v6_rcv(struct sk_buff *skb)
1618 {
1619         struct tcphdr *th;
1620         struct sock *sk;
1621         int ret;
1622         struct net *net = dev_net(skb->dev);
1623
1624         if (skb->pkt_type != PACKET_HOST)
1625                 goto discard_it;
1626
1627         /*
1628          *      Count it even if it's bad.
1629          */
1630         TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
1631
1632         if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1633                 goto discard_it;
1634
1635         th = tcp_hdr(skb);
1636
1637         if (th->doff < sizeof(struct tcphdr)/4)
1638                 goto bad_packet;
1639         if (!pskb_may_pull(skb, th->doff*4))
1640                 goto discard_it;
1641
1642         if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
1643                 goto bad_packet;
1644
1645         th = tcp_hdr(skb);
1646         TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1647         TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1648                                     skb->len - th->doff*4);
1649         TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1650         TCP_SKB_CB(skb)->when = 0;
1651         TCP_SKB_CB(skb)->flags = ipv6_get_dsfield(ipv6_hdr(skb));
1652         TCP_SKB_CB(skb)->sacked = 0;
1653
1654         sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
1655         if (!sk)
1656                 goto no_tcp_socket;
1657
1658 process:
1659         if (sk->sk_state == TCP_TIME_WAIT)
1660                 goto do_time_wait;
1661
1662         if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1663                 goto discard_and_relse;
1664
1665         if (sk_filter(sk, skb))
1666                 goto discard_and_relse;
1667
1668         skb->dev = NULL;
1669
1670         bh_lock_sock_nested(sk);
1671         ret = 0;
1672         if (!sock_owned_by_user(sk)) {
1673 #ifdef CONFIG_NET_DMA
1674                 struct tcp_sock *tp = tcp_sk(sk);
1675                 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
1676                         tp->ucopy.dma_chan = dma_find_channel(DMA_MEMCPY);
1677                 if (tp->ucopy.dma_chan)
1678                         ret = tcp_v6_do_rcv(sk, skb);
1679                 else
1680 #endif
1681                 {
1682                         if (!tcp_prequeue(sk, skb))
1683                                 ret = tcp_v6_do_rcv(sk, skb);
1684                 }
1685         } else
1686                 sk_add_backlog(sk, skb);
1687         bh_unlock_sock(sk);
1688
1689         sock_put(sk);
1690         return ret ? -1 : 0;
1691
1692 no_tcp_socket:
1693         if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1694                 goto discard_it;
1695
1696         if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1697 bad_packet:
1698                 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1699         } else {
1700                 tcp_v6_send_reset(NULL, skb);
1701         }
1702
1703 discard_it:
1704
1705         /*
1706          *      Discard frame
1707          */
1708
1709         kfree_skb(skb);
1710         return 0;
1711
1712 discard_and_relse:
1713         sock_put(sk);
1714         goto discard_it;
1715
1716 do_time_wait:
1717         if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
1718                 inet_twsk_put(inet_twsk(sk));
1719                 goto discard_it;
1720         }
1721
1722         if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1723                 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1724                 inet_twsk_put(inet_twsk(sk));
1725                 goto discard_it;
1726         }
1727
1728         switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1729         case TCP_TW_SYN:
1730         {
1731                 struct sock *sk2;
1732
1733                 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
1734                                             &ipv6_hdr(skb)->daddr,
1735                                             ntohs(th->dest), inet6_iif(skb));
1736                 if (sk2 != NULL) {
1737                         struct inet_timewait_sock *tw = inet_twsk(sk);
1738                         inet_twsk_deschedule(tw, &tcp_death_row);
1739                         inet_twsk_put(tw);
1740                         sk = sk2;
1741                         goto process;
1742                 }
1743                 /* Fall through to ACK */
1744         }
1745         case TCP_TW_ACK:
1746                 tcp_v6_timewait_ack(sk, skb);
1747                 break;
1748         case TCP_TW_RST:
1749                 goto no_tcp_socket;
1750         case TCP_TW_SUCCESS:;
1751         }
1752         goto discard_it;
1753 }
1754
/*
 * ->remember_stamp hook used by ipv6_specific.
 *
 * Nothing is done with @sk for native IPv6 sockets yet; the function
 * unconditionally reports 0.
 */
static int tcp_v6_remember_stamp(struct sock *sk)
{
	return 0;	/* Alas, not yet... */
}
1760
1761 static struct inet_connection_sock_af_ops ipv6_specific = {
1762         .queue_xmit        = inet6_csk_xmit,
1763         .send_check        = tcp_v6_send_check,
1764         .rebuild_header    = inet6_sk_rebuild_header,
1765         .conn_request      = tcp_v6_conn_request,
1766         .syn_recv_sock     = tcp_v6_syn_recv_sock,
1767         .remember_stamp    = tcp_v6_remember_stamp,
1768         .net_header_len    = sizeof(struct ipv6hdr),
1769         .setsockopt        = ipv6_setsockopt,
1770         .getsockopt        = ipv6_getsockopt,
1771         .addr2sockaddr     = inet6_csk_addr2sockaddr,
1772         .sockaddr_len      = sizeof(struct sockaddr_in6),
1773         .bind_conflict     = inet6_csk_bind_conflict,
1774 #ifdef CONFIG_COMPAT
1775         .compat_setsockopt = compat_ipv6_setsockopt,
1776         .compat_getsockopt = compat_ipv6_getsockopt,
1777 #endif
1778 };
1779
#ifdef CONFIG_TCP_MD5SIG
/*
 * MD5 signature operations for native IPv6 sockets; installed as
 * tp->af_specific by tcp_v6_init_sock().  Only built when
 * CONFIG_TCP_MD5SIG is set.
 */
static struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
	/* key management */
	.md5_add	= tcp_v6_md5_add_func,
	.md5_parse	= tcp_v6_parse_md5_keys,
	.md5_lookup	= tcp_v6_md5_lookup,

	/* signature computation */
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
};
#endif
1788
1789 /*
1790  *      TCP over IPv4 via INET6 API
1791  */
1792
1793 static struct inet_connection_sock_af_ops ipv6_mapped = {
1794         .queue_xmit        = ip_queue_xmit,
1795         .send_check        = tcp_v4_send_check,
1796         .rebuild_header    = inet_sk_rebuild_header,
1797         .conn_request      = tcp_v6_conn_request,
1798         .syn_recv_sock     = tcp_v6_syn_recv_sock,
1799         .remember_stamp    = tcp_v4_remember_stamp,
1800         .net_header_len    = sizeof(struct iphdr),
1801         .setsockopt        = ipv6_setsockopt,
1802         .getsockopt        = ipv6_getsockopt,
1803         .addr2sockaddr     = inet6_csk_addr2sockaddr,
1804         .sockaddr_len      = sizeof(struct sockaddr_in6),
1805         .bind_conflict     = inet6_csk_bind_conflict,
1806 #ifdef CONFIG_COMPAT
1807         .compat_setsockopt = compat_ipv6_setsockopt,
1808         .compat_getsockopt = compat_ipv6_getsockopt,
1809 #endif
1810 };
1811
#ifdef CONFIG_TCP_MD5SIG
/*
 * MD5 signature operations for the IPv4-mapped case: key lookup and
 * hashing go through the IPv4 helpers, key add/parse through the
 * IPv6 ones.  Only built when CONFIG_TCP_MD5SIG is set.
 */
static struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
	/* IPv4 helpers */
	.md5_lookup	= tcp_v4_md5_lookup,
	.calc_md5_hash	= tcp_v4_md5_hash_skb,

	/* IPv6 helpers */
	.md5_add	= tcp_v6_md5_add_func,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
1820
1821 /* NOTE: A lot of things set to zero explicitly by call to
1822  *       sk_alloc() so need not be done here.
1823  */
1824 static int tcp_v6_init_sock(struct sock *sk)
1825 {
1826         struct inet_connection_sock *icsk = inet_csk(sk);
1827         struct tcp_sock *tp = tcp_sk(sk);
1828
1829         skb_queue_head_init(&tp->out_of_order_queue);
1830         tcp_init_xmit_timers(sk);
1831         tcp_prequeue_init(tp);
1832
1833         icsk->icsk_rto = TCP_TIMEOUT_INIT;
1834         tp->mdev = TCP_TIMEOUT_INIT;
1835
1836         /* So many TCP implementations out there (incorrectly) count the
1837          * initial SYN frame in their delayed-ACK and congestion control
1838          * algorithms that we must have the following bandaid to talk
1839          * efficiently to them.  -DaveM
1840          */
1841         tp->snd_cwnd = 2;
1842
1843         /* See draft-stevens-tcpca-spec-01 for discussion of the
1844          * initialization of these values.
1845          */
1846         tp->snd_ssthresh = 0x7fffffff;
1847         tp->snd_cwnd_clamp = ~0;
1848         tp->mss_cache = 536;
1849
1850         tp->reordering = sysctl_tcp_reordering;
1851
1852         sk->sk_state = TCP_CLOSE;
1853
1854         icsk->icsk_af_ops = &ipv6_specific;
1855         icsk->icsk_ca_ops = &tcp_init_congestion_ops;
1856         icsk->icsk_sync_mss = tcp_sync_mss;
1857         sk->sk_write_space = sk_stream_write_space;
1858         sock_set_flag(sk, SOCK_USE_WRITE_QUEUE);
1859
1860 #ifdef CONFIG_TCP_MD5SIG
1861         tp->af_specific = &tcp_sock_ipv6_specific;
1862 #endif
1863
1864         sk->sk_sndbuf = sysctl_tcp_wmem[1];
1865         sk->sk_rcvbuf = sysctl_tcp_rmem[1];
1866
1867         local_bh_disable();
1868         percpu_counter_inc(&tcp_sockets_allocated);
1869         local_bh_enable();
1870
1871         return 0;
1872 }
1873
/*
 * ->destroy hook of tcpv6_prot.
 *
 * Drops the MD5 key list (when CONFIG_TCP_MD5SIG is set and the socket
 * has one), then runs the common TCP teardown followed by the
 * IPv6-specific one.
 */
static void tcp_v6_destroy_sock(struct sock *sk)
{
#ifdef CONFIG_TCP_MD5SIG
	struct tcp_sock *tp = tcp_sk(sk);

	/* Clean up the MD5 key list */
	if (tp->md5sig_info)
		tcp_v6_clear_md5_list(sk);
#endif

	tcp_v4_destroy_sock(sk);
	inet6_destroy_sock(sk);
}
1884
1885 #ifdef CONFIG_PROC_FS
1886 /* Proc filesystem TCPv6 sock list dumping. */
1887 static void get_openreq6(struct seq_file *seq,
1888                          struct sock *sk, struct request_sock *req, int i, int uid)
1889 {
1890         int ttd = req->expires - jiffies;
1891         struct in6_addr *src = &inet6_rsk(req)->loc_addr;
1892         struct in6_addr *dest = &inet6_rsk(req)->rmt_addr;
1893
1894         if (ttd < 0)
1895                 ttd = 0;
1896
1897         seq_printf(seq,
1898                    "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1899                    "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
1900                    i,
1901                    src->s6_addr32[0], src->s6_addr32[1],
1902                    src->s6_addr32[2], src->s6_addr32[3],
1903                    ntohs(inet_rsk(req)->loc_port),
1904                    dest->s6_addr32[0], dest->s6_addr32[1],
1905                    dest->s6_addr32[2], dest->s6_addr32[3],
1906                    ntohs(inet_rsk(req)->rmt_port),
1907                    TCP_SYN_RECV,
1908                    0,0, /* could print option size, but that is af dependent. */
1909                    1,   /* timers active (only the expire timer) */
1910                    jiffies_to_clock_t(ttd),
1911                    req->retrans,
1912                    uid,
1913                    0,  /* non standard timer */
1914                    0, /* open_requests have no inode */
1915                    0, req);
1916 }
1917
1918 static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1919 {
1920         struct in6_addr *dest, *src;
1921         __u16 destp, srcp;
1922         int timer_active;
1923         unsigned long timer_expires;
1924         struct inet_sock *inet = inet_sk(sp);
1925         struct tcp_sock *tp = tcp_sk(sp);
1926         const struct inet_connection_sock *icsk = inet_csk(sp);
1927         struct ipv6_pinfo *np = inet6_sk(sp);
1928
1929         dest  = &np->daddr;
1930         src   = &np->rcv_saddr;
1931         destp = ntohs(inet->dport);
1932         srcp  = ntohs(inet->sport);
1933
1934         if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1935                 timer_active    = 1;
1936                 timer_expires   = icsk->icsk_timeout;
1937         } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1938                 timer_active    = 4;
1939                 timer_expires   = icsk->icsk_timeout;
1940         } else if (timer_pending(&sp->sk_timer)) {
1941                 timer_active    = 2;
1942                 timer_expires   = sp->sk_timer.expires;
1943         } else {
1944                 timer_active    = 0;
1945                 timer_expires = jiffies;
1946         }
1947
1948         seq_printf(seq,
1949                    "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1950                    "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %p %lu %lu %u %u %d\n",
1951                    i,
1952                    src->s6_addr32[0], src->s6_addr32[1],
1953                    src->s6_addr32[2], src->s6_addr32[3], srcp,
1954                    dest->s6_addr32[0], dest->s6_addr32[1],
1955                    dest->s6_addr32[2], dest->s6_addr32[3], destp,
1956                    sp->sk_state,
1957                    tp->write_seq-tp->snd_una,
1958                    (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1959                    timer_active,
1960                    jiffies_to_clock_t(timer_expires - jiffies),
1961                    icsk->icsk_retransmits,
1962                    sock_i_uid(sp),
1963                    icsk->icsk_probes_out,
1964                    sock_i_ino(sp),
1965                    atomic_read(&sp->sk_refcnt), sp,
1966                    jiffies_to_clock_t(icsk->icsk_rto),
1967                    jiffies_to_clock_t(icsk->icsk_ack.ato),
1968                    (icsk->icsk_ack.quick << 1 ) | icsk->icsk_ack.pingpong,
1969                    tp->snd_cwnd, tp->snd_ssthresh>=0xFFFF?-1:tp->snd_ssthresh
1970                    );
1971 }
1972
1973 static void get_timewait6_sock(struct seq_file *seq,
1974                                struct inet_timewait_sock *tw, int i)
1975 {
1976         struct in6_addr *dest, *src;
1977         __u16 destp, srcp;
1978         struct inet6_timewait_sock *tw6 = inet6_twsk((struct sock *)tw);
1979         int ttd = tw->tw_ttd - jiffies;
1980
1981         if (ttd < 0)
1982                 ttd = 0;
1983
1984         dest = &tw6->tw_v6_daddr;
1985         src  = &tw6->tw_v6_rcv_saddr;
1986         destp = ntohs(tw->tw_dport);
1987         srcp  = ntohs(tw->tw_sport);
1988
1989         seq_printf(seq,
1990                    "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1991                    "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %p\n",
1992                    i,
1993                    src->s6_addr32[0], src->s6_addr32[1],
1994                    src->s6_addr32[2], src->s6_addr32[3], srcp,
1995                    dest->s6_addr32[0], dest->s6_addr32[1],
1996                    dest->s6_addr32[2], dest->s6_addr32[3], destp,
1997                    tw->tw_substate, 0, 0,
1998                    3, jiffies_to_clock_t(ttd), 0, 0, 0, 0,
1999                    atomic_read(&tw->tw_refcnt), tw);
2000 }
2001
2002 static int tcp6_seq_show(struct seq_file *seq, void *v)
2003 {
2004         struct tcp_iter_state *st;
2005
2006         if (v == SEQ_START_TOKEN) {
2007                 seq_puts(seq,
2008                          "  sl  "
2009                          "local_address                         "
2010                          "remote_address                        "
2011                          "st tx_queue rx_queue tr tm->when retrnsmt"
2012                          "   uid  timeout inode\n");
2013                 goto out;
2014         }
2015         st = seq->private;
2016
2017         switch (st->state) {
2018         case TCP_SEQ_STATE_LISTENING:
2019         case TCP_SEQ_STATE_ESTABLISHED:
2020                 get_tcp6_sock(seq, v, st->num);
2021                 break;
2022         case TCP_SEQ_STATE_OPENREQ:
2023                 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
2024                 break;
2025         case TCP_SEQ_STATE_TIME_WAIT:
2026                 get_timewait6_sock(seq, v, st->num);
2027                 break;
2028         }
2029 out:
2030         return 0;
2031 }
2032
2033 static struct tcp_seq_afinfo tcp6_seq_afinfo = {
2034         .name           = "tcp6",
2035         .family         = AF_INET6,
2036         .seq_fops       = {
2037                 .owner          = THIS_MODULE,
2038         },
2039         .seq_ops        = {
2040                 .show           = tcp6_seq_show,
2041         },
2042 };
2043
2044 int tcp6_proc_init(struct net *net)
2045 {
2046         return tcp_proc_register(net, &tcp6_seq_afinfo);
2047 }
2048
2049 void tcp6_proc_exit(struct net *net)
2050 {
2051         tcp_proc_unregister(net, &tcp6_seq_afinfo);
2052 }
2053 #endif
2054
2055 struct proto tcpv6_prot = {
2056         .name                   = "TCPv6",
2057         .owner                  = THIS_MODULE,
2058         .close                  = tcp_close,
2059         .connect                = tcp_v6_connect,
2060         .disconnect             = tcp_disconnect,
2061         .accept                 = inet_csk_accept,
2062         .ioctl                  = tcp_ioctl,
2063         .init                   = tcp_v6_init_sock,
2064         .destroy                = tcp_v6_destroy_sock,
2065         .shutdown               = tcp_shutdown,
2066         .setsockopt             = tcp_setsockopt,
2067         .getsockopt             = tcp_getsockopt,
2068         .recvmsg                = tcp_recvmsg,
2069         .backlog_rcv            = tcp_v6_do_rcv,
2070         .hash                   = tcp_v6_hash,
2071         .unhash                 = inet_unhash,
2072         .get_port               = inet_csk_get_port,
2073         .enter_memory_pressure  = tcp_enter_memory_pressure,
2074         .sockets_allocated      = &tcp_sockets_allocated,
2075         .memory_allocated       = &tcp_memory_allocated,
2076         .memory_pressure        = &tcp_memory_pressure,
2077         .orphan_count           = &tcp_orphan_count,
2078         .sysctl_mem             = sysctl_tcp_mem,
2079         .sysctl_wmem            = sysctl_tcp_wmem,
2080         .sysctl_rmem            = sysctl_tcp_rmem,
2081         .max_header             = MAX_TCP_HEADER,
2082         .obj_size               = sizeof(struct tcp6_sock),
2083         .slab_flags             = SLAB_DESTROY_BY_RCU,
2084         .twsk_prot              = &tcp6_timewait_sock_ops,
2085         .rsk_prot               = &tcp6_request_sock_ops,
2086         .h.hashinfo             = &tcp_hashinfo,
2087 #ifdef CONFIG_COMPAT
2088         .compat_setsockopt      = compat_tcp_setsockopt,
2089         .compat_getsockopt      = compat_tcp_getsockopt,
2090 #endif
2091 };
2092
2093 static struct inet6_protocol tcpv6_protocol = {
2094         .handler        =       tcp_v6_rcv,
2095         .err_handler    =       tcp_v6_err,
2096         .gso_send_check =       tcp_v6_gso_send_check,
2097         .gso_segment    =       tcp_tso_segment,
2098         .gro_receive    =       tcp6_gro_receive,
2099         .gro_complete   =       tcp6_gro_complete,
2100         .flags          =       INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
2101 };
2102
2103 static struct inet_protosw tcpv6_protosw = {
2104         .type           =       SOCK_STREAM,
2105         .protocol       =       IPPROTO_TCP,
2106         .prot           =       &tcpv6_prot,
2107         .ops            =       &inet6_stream_ops,
2108         .capability     =       -1,
2109         .no_check       =       0,
2110         .flags          =       INET_PROTOSW_PERMANENT |
2111                                 INET_PROTOSW_ICSK,
2112 };
2113
2114 static int tcpv6_net_init(struct net *net)
2115 {
2116         return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
2117                                     SOCK_RAW, IPPROTO_TCP, net);
2118 }
2119
2120 static void tcpv6_net_exit(struct net *net)
2121 {
2122         inet_ctl_sock_destroy(net->ipv6.tcp_sk);
2123         inet_twsk_purge(net, &tcp_hashinfo, &tcp_death_row, AF_INET6);
2124 }
2125
2126 static struct pernet_operations tcpv6_net_ops = {
2127         .init = tcpv6_net_init,
2128         .exit = tcpv6_net_exit,
2129 };
2130
2131 int __init tcpv6_init(void)
2132 {
2133         int ret;
2134
2135         ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2136         if (ret)
2137                 goto out;
2138
2139         /* register inet6 protocol */
2140         ret = inet6_register_protosw(&tcpv6_protosw);
2141         if (ret)
2142                 goto out_tcpv6_protocol;
2143
2144         ret = register_pernet_subsys(&tcpv6_net_ops);
2145         if (ret)
2146                 goto out_tcpv6_protosw;
2147 out:
2148         return ret;
2149
2150 out_tcpv6_protocol:
2151         inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2152 out_tcpv6_protosw:
2153         inet6_unregister_protosw(&tcpv6_protosw);
2154         goto out;
2155 }
2156
2157 void tcpv6_exit(void)
2158 {
2159         unregister_pernet_subsys(&tcpv6_net_ops);
2160         inet6_unregister_protosw(&tcpv6_protosw);
2161         inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2162 }